blob: 492a00073cdb78743dd534cedadec91e1ce68f31 [file] [log] [blame]
Dan Shif8b71d12014-09-03 10:31:08 -07001#!/usr/bin/env python
2
3# Copyright (c) 2014 The Chromium OS Authors. All rights reserved.
4# Use of this source code is governed by a BSD-style license that can be
5# found in the LICENSE file.
6
7# Script to check the history of stage calls made to devserver.
8# Following are some sample use cases:
9#
# 1. Find all stage requests for autotest and image nyan_big-release/R38-6055.0.0
# in the last 10 days across all devservers.
12# ./devserver_history.py --image_filters nyan_big 38 6055.0.0 -l 240 \
13# --artifact_filters autotest -v
14# output:
15# ==============================================================================
16# 170.21.64.22
17# ==============================================================================
18# Number of calls: 1
19# Number of unique images: 1
20# 2014-08-23 12:45:00: nyan_big-release/R38-6055.0.0 autotest
21# ==============================================================================
22# 170.21.64.23
23# ==============================================================================
24# Number of calls: 2
25# Number of unique images: 1
26# 2014-08-23 12:45:00: nyan_big-release/R38-6055.0.0 autotest, test_suites
27# 2014-08-23 12:55:00: nyan_big-release/R38-6055.0.0 autotest, test_suites
28#
# 2. Find all duplicated stage requests for the last 10 days.
30# ./devserver_history.py -d -l 240
31# output:
32# Detecting artifacts staged in multiple devservers.
33# ==============================================================================
34# nyan_big-release/R38-6055.0.0
35# ==============================================================================
36# 170.21.64.22: 23 requests 2014-09-04 22:44:28 -- 2014-09-05 00:03:23
37# 170.21.64.23: 6 requests 2014-09-04 22:48:58 -- 2014-09-04 22:49:42
38#
39# Count of images with duplicated stages on each devserver:
40# 170.21.64.22 : 22
41# 170.21.64.23 : 11
42
43
44import argparse
45import datetime
46import logging
47import operator
48import re
49import time
50from itertools import groupby
51
52import common
53from autotest_lib.client.common_lib import global_config
54from autotest_lib.client.common_lib import time_utils
55from autotest_lib.client.common_lib.cros.graphite import es_utils
56
57
class devserver_call(object):
    """Record describing one devserver stage call taken from an ES hit.

    Every attribute is copied from the hit's `_source` document. `artifacts`
    is split on single spaces into a list, and `time_recorded` is converted
    with time_utils.epoch_time_to_date_string.
    """

    def __init__(self, hit):
        """Populate the record from a single ES query hit.

        @param hit: A dict whose `_source` entry holds the keys `devserver`,
                `subname`, `artifacts`, `image`, `value` and
                `time_recorded`.
        """
        source = hit['_source']
        self.devserver = source['devserver']
        self.subname = source['subname']
        self.artifacts = source['artifacts'].split(' ')
        self.image = source['image']
        self.value = source['value']
        recorded = source['time_recorded']
        self.time_recorded = time_utils.epoch_time_to_date_string(recorded)


    def __str__(self):
        """Return one `name: value` line per data attribute.

        Attributes are listed in dir() order; names starting with a double
        underscore and callable attributes are left out.
        """
        lines = []
        for name in dir(self):
            if name.startswith('__'):
                continue
            value = getattr(self, name)
            if callable(value):
                continue
            lines.append('%-20s: %s' % (name, value))
        return '\n'.join(lines)
79
80
def get_calls(time_start, time_end, artifact_filters=None,
              regex_constraints=None, devserver=None, size=1e7):
    """Gets all devserver calls from es db with the given constraints.

    @param time_start: Earliest time entry was recorded. Converted with
            time_utils.to_epoch_time before being used in the query.
    @param time_end: Latest time entry was recorded. Converted with
            time_utils.to_epoch_time before being used in the query.
    @param artifact_filters: A list of names to match artifacts. Each name
            is added as its own equality constraint on `artifacts`.
    @param regex_constraints: A list of regex constraints for ES query.
    @param devserver: name of devserver to query for. If it's set to None,
            return calls for all devservers. Default is set to None.
    @param size: Max number of entries to return, default to 1e7
            (10 million).

    @returns: A list of devserver_call objects, one per hit, in the order
            the hits were returned (the query asks for `time_recorded`
            descending).
    """
    # NOTE(review): the default size is the float 1e7 and is forwarded to
    # es_utils unchanged; confirm the query builder accepts a non-integer.
    eqs = [('_type', 'devserver')]
    if devserver:
        eqs.append(('devserver', devserver))
    if artifact_filters:
        eqs.extend(('artifacts', artifact) for artifact in artifact_filters)

    time_start_epoch = time_utils.to_epoch_time(time_start)
    time_end_epoch = time_utils.to_epoch_time(time_end)
    query = es_utils.create_range_eq_query_multiple(
            fields_returned=None,
            equality_constraints=eqs,
            range_constraints=[('time_recorded', time_start_epoch,
                                time_end_epoch)],
            size=size,
            sort_specs=[{'time_recorded': 'desc'}],
            regex_constraints=regex_constraints)
    results = es_utils.execute_query(query, timeout=30)
    devserver_calls = [devserver_call(hit) for hit in results['hits']['hits']]
    logging.info('Found %d calls.', len(devserver_calls))
    return devserver_calls
117
118
def print_call_details(calls, verbose):
    """Print details of each call to devserver to stage artifacts.

    Calls are grouped by devserver (in sorted devserver order). For each
    devserver a banner, the number of calls and the number of distinct
    images are printed.

    @param calls: A list of devserver stage requests. Each item must expose
            `devserver`, `image`, `time_recorded` and `artifacts`.
    @param verbose: Set to True to print out all devserver calls, ordered by
            `time_recorded` within each devserver.
    """
    by_devserver = operator.attrgetter('devserver')
    # groupby only merges adjacent items, so sort by the same key first.
    ordered_calls = sorted(calls, key=by_devserver)
    # Every print below takes exactly one argument so the output is the same
    # under the Python 2 print statement and the Python 3 print function.
    for devserver, group in groupby(ordered_calls, by_devserver):
        calls_for_devserver = list(group)
        print('=' * 80)
        print(devserver)
        print('=' * 80)
        print('Number of calls: %d' % len(calls_for_devserver))
        unique_images = {call.image for call in calls_for_devserver}
        print('Number of unique images: %d' % len(unique_images))
        if verbose:
            for call in sorted(calls_for_devserver,
                               key=operator.attrgetter('time_recorded')):
                print('%s %s %s' % (call.time_recorded, call.image,
                                    ', '.join(call.artifacts)))
139
140
def detect_duplicated_stage(calls):
    """Detect any artifact for same build was staged in multiple devservers.

    For every image requested on more than one devserver, prints the image
    name followed by one line per devserver with its request count and the
    earliest/latest `time_recorded`. Finally prints, per devserver, how many
    such images it was involved in, highest count first.

    @param calls: A list of devserver stage requests. Each item must expose
            `image`, `devserver` and `time_recorded`.
    """
    # Every print below takes exactly one argument so the output is the same
    # under the Python 2 print statement and the Python 3 print function.
    print('\nDetecting artifacts staged in multiple devservers.')
    by_image = operator.attrgetter('image')
    by_devserver = operator.attrgetter('devserver')
    # Count how many times a devserver staged duplicated artifacts. A number
    # significantly larger than others can indicate that the devserver failed
    # check_health too often and needs to be removed from production.
    duplicated_stage_count = {}
    # groupby only merges adjacent items, so sort by the grouping key first.
    for image, group in groupby(sorted(calls, key=by_image), by_image):
        calls_for_image = sorted(group, key=by_devserver)
        devservers = {call.devserver for call in calls_for_image}
        if len(devservers) <= 1:
            # Staged on a single devserver only: not a duplicate.
            continue
        print('=' * 80)
        print(image)
        print('=' * 80)
        for devserver, calls_for_devserver in groupby(calls_for_image,
                                                      by_devserver):
            timestamps = [c.time_recorded for c in calls_for_devserver]
            print('%s: %-3d requests %s -- %s' %
                  (devserver, len(timestamps), min(timestamps),
                   max(timestamps)))
            duplicated_stage_count[devserver] = (
                    duplicated_stage_count.get(devserver, 0) + 1)
    print('\nCount of images with duplicated stages on each devserver:')
    # items() exists on both Python 2 and 3; iteritems() is Python 2 only.
    counts = sorted(duplicated_stage_count.items(),
                    key=operator.itemgetter(1), reverse=True)
    for devserver, count in counts:
        print('%-15s: %d' % (devserver, count))
173
174
def _parse_options():
    """Build the command line parser and return the parsed options."""
    t_now = time.time()
    t_now_minus_one_day = t_now - 3600 * 24
    parser = argparse.ArgumentParser()
    parser.add_argument('-l', type=float, dest='last',
                        help='last hours to search results across',
                        default=None)
    parser.add_argument('--start', type=str, dest='start',
                        help=('Enter start time as: yyyy-mm-dd hh:mm:ss, '
                              'defaults to 24h ago. This option is ignored '
                              'when -l is used.'),
                        default=time_utils.epoch_time_to_date_string(
                                t_now_minus_one_day))
    parser.add_argument('--end', type=str, dest='end',
                        help=('Enter end time as: yyyy-mm-dd hh:mm:ss, '
                              'defaults to current time. This option is '
                              'ignored when -l is used.'),
                        default=time_utils.epoch_time_to_date_string(t_now))
    parser.add_argument('--devservers', nargs='+', dest='devservers',
                        help=('Enter space delimited devservers. Default are'
                              ' all devservers specified in global config.'),
                        default=[])
    parser.add_argument('--artifact_filters', nargs='+',
                        dest='artifact_filters',
                        help=('Enter space delimited filters on artifact '
                              'name. For example "autotest test_suites". The '
                              'filter does not support regex.'),
                        default=[])
    parser.add_argument('--image_filters', nargs='+', dest='image_filters',
                        help=('Enter space delimited filters on image name. '
                              'For example "nyan 38 6566", search will use '
                              'regex to match each filter. Do not use filters '
                              'with mixed letter and number, e.g., R38.'),
                        default=[])
    parser.add_argument('-d', '--detect_duplicated_stage', action='store_true',
                        dest='detect_duplicated_stage',
                        help=('Detect if artifacts for the same build were '
                              'staged in multiple devservers. '
                              'Default is False.'),
                        default=False)
    parser.add_argument('-v', action='store_true', dest='verbose',
                        default=False,
                        help='-v to print out ALL entries.')
    return parser.parse_args()


def _devserver_from_url(url):
    """Return the host part of an `http://host[:port]` devserver url.

    The url is returned unchanged when it does not start with `http://`.
    """
    match = re.match(r'http://([^:]*):*\d*', url)
    return match.group(1) if match else url


def _get_devservers(options):
    """Return devservers from the command line, else from global config."""
    if options.devservers:
        return options.devservers
    devserver_urls = global_config.global_config.get_config_value(
            'CROS', 'dev_server', type=list, default=[])
    return [_devserver_from_url(url) for url in devserver_urls]


def main():
    """main script.

    Parses the command line, queries the stage calls of every selected
    devserver in the requested time window, prints a per-devserver summary
    and, when -d is given, the images staged on more than one devserver.
    """
    options = _parse_options()
    if options.verbose:
        logging.getLogger().setLevel(logging.INFO)

    if options.last:
        # -l takes precedence over --start/--end.
        end_time = datetime.datetime.now()
        start_time = end_time - datetime.timedelta(seconds=3600 * options.last)
    else:
        start_time = datetime.datetime.strptime(options.start,
                                                time_utils.TIME_FMT)
        end_time = datetime.datetime.strptime(options.end, time_utils.TIME_FMT)
    logging.info('Searching devserver calls from %s to %s', start_time,
                 end_time)

    devservers = _get_devservers(options)
    logging.info('Found devservers: %s', devservers)

    # Each image filter becomes a "contains" regex constraint on `image`.
    regex_constraints = [('image', '.*%s.*' % image_filter)
                         for image_filter in options.image_filters]
    calls = []
    for devserver in devservers:
        calls.extend(get_calls(start_time, end_time, options.artifact_filters,
                               regex_constraints, devserver=devserver))

    print_call_details(calls, options.verbose)

    if options.detect_duplicated_stage:
        detect_duplicated_stage(calls)
255
256
# Run the report only when executed as a script, not when imported.
if __name__ == '__main__':
    main()