systrace.py - platform/external/chromium-trace - Git at Google

 #!/usr/bin/env python

 # Copyright (c) 2011 The Chromium Authors. All rights reserved.
 # Use of this source code is governed by a BSD-style license that can be
 # found in the LICENSE file.

 """Android system-wide tracing utility.

 This is a tool for capturing a trace that includes data from both userland and
 the kernel.  It creates an HTML file for visualizing the trace.
 """

 import sys

 # Make sure we're using a new enough version of Python before doing anything
 # else.  The flags= parameter of re.sub(), which fix_thread_names() relies on,
 # is new in Python 2.7.  On older interpreters, report the problem on stderr
 # and exit with status 1.
 if sys.version_info[:2] < (2, 7):
   print >> sys.stderr, '\nThis script requires Python 2.7 or newer.'
   sys.exit(1)

 # pylint: disable=g-bad-import-order,g-import-not-at-top
 import optparse
 import os
 import Queue
 import re
 import subprocess
 import threading
 import time
 import zlib

 # Regular expression for text that ADB sends, but that does not need to be
 # displayed to the user.  The longer alternative is listed first so that
 # 'capturing trace... done' is removed as a whole.
 ADB_IGNORE_REGEXP = r'^capturing trace\.\.\. done|^capturing trace\.\.\.'
 # The number of seconds to wait on output from ADB before going back to check
 # on stderr and on the reader threads.
 ADB_STDOUT_READ_TIMEOUT = 0.2
 # The adb shell command to initiate a trace.
 ATRACE_BASE_ARGS = ['atrace']
 # If a custom list of categories is not specified, traces will include
 # these categories (if available on the device).
 DEFAULT_CATEGORIES = 'sched gfx view dalvik webview input disk am wm'.split()
 # The command to list trace categories.
 LIST_CATEGORIES_ARGS = ATRACE_BASE_ARGS + ['--list_categories']
 # Minimum number of seconds between displaying status updates.
 MIN_TIME_BETWEEN_STATUS_UPDATES = 0.2
 # Regular expression for the text ADB sends to indicate the beginning of the
 # trace data.  It is matched against the start of the current output line.
 TRACE_START_REGEXP = r'TRACE\:'
 # Plain-text trace data should always start with this string.
 TRACE_TEXT_HEADER = '# tracer'


 class OptionParserIgnoreErrors(optparse.OptionParser):
   """Wrapper for OptionParser that ignores errors and produces no output.

   Each override accepts the same arguments as the optparse.OptionParser method
   it replaces (for example exit(status, msg) and print_help(file)), so the
   parser stays silent regardless of how these hooks are invoked instead of
   failing with a TypeError on an unexpected argument.
   """
   # The 'file' parameter name mirrors the optparse API so that keyword calls
   # keep working.
   # pylint: disable=redefined-builtin

   def error(self, msg):
     """Swallows the error instead of printing usage and exiting."""

   def exit(self, status=0, msg=None):
     """Does nothing; the process is never terminated by this parser."""

   def print_usage(self, file=None):
     """Suppresses the usage message."""

   def print_help(self, file=None):
     """Suppresses the help message."""

   def print_version(self, file=None):
     """Suppresses the version message."""


 class FileReaderThread(threading.Thread):
   """Worker thread that copies the contents of a file/pipe into a queue.

   Drive it through the regular threading.Thread interface (start(), join(),
   and so on).
   """

   def __init__(self, file_object, output_queue, text_file, chunk_size=-1):
     """Creates the reader; call start() to begin reading.

     Args:
       file_object: The file or pipe to read from.
       output_queue: A Queue.Queue object that receives everything read.
       text_file: True to read the file one line at a time, in which case
           chunk_size is ignored.  False to ignore line breaks and read in
           chunks, in which case chunk_size must be a positive integer.
       chunk_size: For non-text files (text_file = False), the amount of data
           requested by each read operation and queued as one item.  Ignored
           for text files.
     """
     super(FileReaderThread, self).__init__()
     self._text_file = text_file
     self._chunk_size = chunk_size
     self._output_queue = output_queue
     self._file_object = file_object
     assert text_file or chunk_size > 0

   def run(self):
     """Thread body: forwards data to the queue until EOF is reached."""
     source = self._file_object
     enqueue = self._output_queue.put

     if self._text_file:
       # Text mode: one queue entry per line.
       for text_line in source:
         enqueue(text_line)
       return

     # Chunk mode.  self._chunk_size is re-read for every read() because
     # set_chunk_size() may change it while this loop is running.
     data = source.read(self._chunk_size)
     while data:
       enqueue(data)
       data = source.read(self._chunk_size)

   def set_chunk_size(self, chunk_size):
     """Changes the size used for subsequent read operations.

     Only valid for a FileReaderThread that was created for a non-text file,
     i.e. with an initial chunk_size > 0.

     Args:
       chunk_size: the new chunk size for this file.  Must be > 0.
     """
     # The size may be changed asynchronously while the worker thread is
     # reading.  The kind of file, however, is fixed once the object has been
     # created, so verify that only the size is being changed.
     assert not self._text_file
     assert chunk_size > 0
     self._chunk_size = chunk_size


 def add_adb_serial(adb_command, device_serial):
   """Makes an adb command line target a specific device.

   Args:
     adb_command: The adb argument list; modified in place so that
         '-s <device_serial>' follows its first element.
     device_serial: The serial number of the device, or None to leave
         adb_command untouched.
   """
   if device_serial is None:
     return
   # Inserting the value first and the flag second, both at index 1, leaves
   # them in the order '-s', <serial>.
   for token in (device_serial, '-s'):
     adb_command.insert(1, token)


 def construct_adb_shell_command(shell_args, device_serial):
   """Builds the argument list for running a command through "adb shell".

   Args:
     shell_args: The words of the shell command; they are joined with single
         spaces into one argument for adb.
     device_serial: The serial number of the device to target, or None.
   Returns:
     The adb command line as a list of strings.
   """
   shell_command_line = ' '.join(shell_args)
   command = ['adb', 'shell', shell_command_line]
   add_adb_serial(command, device_serial)
   return command


 def run_adb_shell(shell_args, device_serial):
   """Runs "adb shell" with the given arguments and waits for it to finish.

   Args:
     shell_args: array of arguments to pass to adb shell.
     device_serial: if not None, the appropriate command-line parameters are
         added so that adb targets the given device.
   Returns:
     A tuple containing the adb output (stdout & stderr combined) and the
     return code from adb.  Exits the script with status 1 if adb fails to
     start.
   """
   adb_command = construct_adb_shell_command(shell_args, device_serial)

   try:
     captured_output = subprocess.check_output(
         adb_command, stderr=subprocess.STDOUT, shell=False,
         universal_newlines=True)
   except OSError as error:
     # This usually means that the adb executable was not found in the path.
     print >> sys.stderr, ('\nThe command "%s" failed with the following error:'
                           % ' '.join(adb_command))
     print >> sys.stderr, '    %s\n' % str(error)
     print >> sys.stderr, 'Is adb in your path?'
     sys.exit(1)
   except subprocess.CalledProcessError as error:
     # adb ran, but exited with an error: hand back what it printed together
     # with its exit status.
     return (error.output, error.returncode)

   return (captured_output, 0)


 def get_device_sdk_version():
   """Uses adb to attempt to determine the SDK version of a running device.

   The device serial number (-e/--serial) is read directly from sys.argv,
   because this function is called before the command line is really parsed.

   Returns:
     The SDK version of the device as an integer.  Exits the script with
     status 1 if the version could not be determined.
   """
   getprop_args = ['getprop', 'ro.build.version.sdk']

   # Parse just the device serial number part of the command line so we can
   # send the adb command to the correct device.
   parser = OptionParserIgnoreErrors()
   parser.add_option('-e', '--serial', dest='device_serial', type='string')

   # Everything after a bare '--' is positional, so never look for the serial
   # number there.
   pending_args = sys.argv[1:]
   if '--' in pending_args:
     pending_args = pending_args[:pending_args.index('--')]

   # optparse gives up on the rest of the command line as soon as it meets an
   # option it does not know (every option except -e/--serial here).  With the
   # error ignored, that would silently drop a serial number given after any
   # other option, e.g. "-t 5 -e SERIAL".  Resume parsing from where the parser
   # stopped (parser.rargs) until the whole command line has been consumed.
   device_serial = None
   options = None
   while pending_args:
     try:
       options, unused_args = parser.parse_args(pending_args, options)
     except UnboundLocalError:
       # A trailing '-e' without a value trips up optparse once error() is a
       # no-op.  Treat it as "no serial given"; parse_options() reports the
       # malformed command line properly later on.
       break
     device_serial = options.device_serial
     pending_args = parser.rargs

   adb_output, adb_return_code = run_adb_shell(getprop_args, device_serial)

   version = None
   if adb_return_code == 0:
     # ADB may print output other than the version number (e.g. it could
     # print a message about starting the ADB server), so assume that the
     # version number is the last white-space delimited segment.
     segments = adb_output.split()
     if segments:
       try:
         version = int(segments[-1])
       except ValueError:
         version = None

   if version is None:
     print >> sys.stderr, (
         '\nThe command "%s" failed with the following message:'
         % ' '.join(getprop_args))
     print >> sys.stderr, adb_output
     sys.exit(1)

   return version


 def get_default_categories(device_serial):
   """Returns the default categories that the device reports as available.

   Args:
     device_serial: The serial number of the device to query, or None.
   Returns:
     The entries of the device's category listing that also appear in
     DEFAULT_CATEGORIES, in the order the device lists them.  Empty if the
     listing command fails or prints nothing.
   """
   categories_output, return_code = run_adb_shell(LIST_CATEGORIES_ARGS,
                                                  device_serial)
   if return_code != 0 or not categories_output:
     return []

   available = []
   for listing_line in categories_output.splitlines():
     # The category name is whatever precedes the first '-' on the line.
     category = listing_line.split('-')[0].strip()
     if category in DEFAULT_CATEGORIES:
       available.append(category)
   return available


 def status_update(last_update_time):
   """Prints a progress dot if enough time has passed since the last one.

   Args:
     last_update_time: The time.time() value of the previous status update.
   Returns:
     The time of the most recent status update: the current time if a dot was
     printed, otherwise last_update_time unchanged.
   """
   now = time.time()
   elapsed = now - last_update_time
   if not elapsed >= MIN_TIME_BETWEEN_STATUS_UPDATES:
     return last_update_time

   # Gathering a trace may take a while.  Keep printing something so users
   # don't think the script has hung.
   sys.stdout.write('.')
   sys.stdout.flush()
   return now


 def parse_options():
   """Parses and validates the command-line options.

   Option values are read from sys.argv.  Invalid values and the use of
   deprecated options are reported through the parser's error() method.

   Returns:
     A tuple containing the options structure and a list of categories to
     be traced.
   """
   parser = optparse.OptionParser(
       usage='Usage: %prog [options] [category1 [category2 ...]]',
       description='Example: %prog -b 32768 -t 15 gfx input view sched freq')

   # (option strings, keyword arguments) for each option, in the order in
   # which they are registered with the parser.
   option_specs = [
       (('-o',),
        dict(dest='output_file', help='write HTML to FILE',
             default='trace.html', metavar='FILE')),
       (('-t', '--time'),
        dict(dest='trace_time', type='int', help='trace for N seconds',
             metavar='N')),
       (('-b', '--buf-size'),
        dict(dest='trace_buf_size', type='int',
             help='use a trace buffer size of N KB', metavar='N')),
       (('-k', '--ktrace'),
        dict(dest='kfuncs', action='store',
             help='specify a comma-separated list of kernel functions '
             'to trace')),
       (('-l', '--list-categories'),
        dict(dest='list_categories', default=False, action='store_true',
             help='list the available categories and exit')),
       (('-a', '--app'),
        dict(dest='app_name', default=None, type='string', action='store',
             help='enable application-level tracing for comma-separated '
             'list of app cmdlines')),
       (('--no-fix-threads',),
        dict(dest='fix_threads', default=True, action='store_false',
             help='don\'t fix missing or truncated thread names')),
       (('--no-fix-circular',),
        dict(dest='fix_circular', default=True, action='store_false',
             help='don\'t fix truncated circular traces')),
       (('--no-compress',),
        dict(dest='compress_trace_data', default=True, action='store_false',
             help='Tell the device not to send the trace data in '
             'compressed form.')),
       (('--link-assets',),
        dict(dest='link_assets', default=False, action='store_true',
             help='(deprecated)')),
       (('--from-file',),
        dict(dest='from_file', action='store',
             help='read the trace from a file (compressed) rather than '
             'running a live trace')),
       (('--asset-dir',),
        dict(dest='asset_dir', default='trace-viewer', type='string',
             help='(deprecated)')),
       (('-e', '--serial'),
        dict(dest='device_serial', type='string',
             help='adb device serial number')),
   ]
   for option_strings, settings in option_specs:
     parser.add_option(*option_strings, **settings)

   options, categories = parser.parse_args()

   if options.link_assets or options.asset_dir != 'trace-viewer':
     parser.error('--link-assets and --asset-dir are deprecated.')

   # Numeric options are optional, but must be positive when given.
   positive_checks = (
       (options.trace_time, 'the trace time must be a positive number'),
       (options.trace_buf_size,
        'the trace buffer size must be a positive number'),
   )
   for value, message in positive_checks:
     if value is not None and value <= 0:
       parser.error(message)

   return (options, categories)


 def construct_trace_command(options, categories):
   """Builds a command-line used to invoke a trace process.

   Args:
     options: The command-line options.
     categories: The trace categories to capture.  If empty, the default
         categories available on the device are used.
   Returns:
     A tuple where the first element is an array of command-line arguments, and
     the second element is a boolean which will be true if the command will
     stream trace data.
   """
   if options.list_categories:
     tracer_args = construct_adb_shell_command(LIST_CATEGORIES_ARGS,
                                               options.device_serial)
     expect_trace = False
   elif options.from_file is not None:
     tracer_args = ['cat', options.from_file]
     expect_trace = True
   else:
     # Work on a copy: extending ATRACE_BASE_ARGS itself would permanently
     # modify the module-level constant, so the arguments of one call would
     # leak into every later use of it.
     atrace_args = list(ATRACE_BASE_ARGS)
     expect_trace = True
     if options.compress_trace_data:
       atrace_args.extend(['-z'])

     if (options.trace_time is not None) and (options.trace_time > 0):
       atrace_args.extend(['-t', str(options.trace_time)])

     if (options.trace_buf_size is not None) and (options.trace_buf_size > 0):
       atrace_args.extend(['-b', str(options.trace_buf_size)])

     if options.app_name is not None:
       atrace_args.extend(['-a', options.app_name])

     if options.kfuncs is not None:
       atrace_args.extend(['-k', options.kfuncs])

     if not categories:
       categories = get_default_categories(options.device_serial)
     atrace_args.extend(categories)

     if options.fix_threads:
       # Append a second shell command that dumps the thread list after the
       # trace; extract_thread_list() later splits it off the trace data.
       atrace_args.extend([';', 'ps', '-t'])
     tracer_args = construct_adb_shell_command(atrace_args,
                                               options.device_serial)

   return (tracer_args, expect_trace)


 def collect_trace_data(tracer_args, expect_trace):
   """Invokes and communicates with the trace process.

   Output of the process is shown to the user until the trace start marker
   (TRACE_START_REGEXP) is seen; everything after the marker is collected
   instead of being displayed.  Exits the script with status 1 if the process
   cannot be started or returns a non-zero exit code.

   Args:
     tracer_args: The command-line to execute.
     expect_trace: True if the given command should return tracing data.
   Returns:
     A list of the chunks of trace data read from the process, in the order
     they were received.  The list is empty if no trace data was received.
   """
   try:
     adb = subprocess.Popen(tracer_args, stdout=subprocess.PIPE,
                            stderr=subprocess.PIPE)
   except OSError as error:
     print >> sys.stderr, ('The command "%s" failed with the following error:' %
                           ' '.join(tracer_args))
     print >> sys.stderr, '    ', error
     sys.exit(1)

   # Read the output from ADB in a worker thread.  This allows us to monitor the
   # progress of ADB and bail if ADB becomes unresponsive for any reason.

   # Limit the stdout_queue to 128 entries because we will initially be reading
   # one byte at a time.  When the queue fills up, the reader thread will
   # block until there is room in the queue.  Once we start downloading the trace
   # data, we will switch to reading data in larger chunks, and 128 entries
   # should be plenty for that purpose.
   stdout_queue = Queue.Queue(maxsize=128)
   stderr_queue = Queue.Queue()

   if expect_trace:
     # Use stdout.write() (here and for the rest of this function) instead
     # of print() to avoid extra newlines.
     sys.stdout.write('Capturing trace...')

   # Use a chunk_size of 1 for stdout so we can display the output to
   # the user without waiting for a full line to be sent.
   stdout_thread = FileReaderThread(adb.stdout, stdout_queue, text_file=False,
                                    chunk_size=1)
   stderr_thread = FileReaderThread(adb.stderr, stderr_queue, text_file=True)
   stdout_thread.start()
   stderr_thread.start()

   # Holds the trace data returned by ADB.
   trace_data = []
   # Keep track of the current line so we can find the TRACE_START_REGEXP.
   current_line = ''
   # Set to True once we've received the TRACE_START_REGEXP.
   reading_trace_data = False

   last_status_update_time = time.time()

   # Keep going while either reader is still running or has left data behind.
   while (stdout_thread.is_alive() or stderr_thread.is_alive() or
          not stdout_queue.empty() or not stderr_queue.empty()):
     if expect_trace:
       last_status_update_time = status_update(last_status_update_time)

     while not stderr_queue.empty():
       # Pass along errors from adb.
       line = stderr_queue.get()
       sys.stderr.write(line)

     # Read stdout from adb.  The loop exits if we don't get any data for
     # ADB_STDOUT_READ_TIMEOUT seconds.
     while True:
       try:
         chunk = stdout_queue.get(True, ADB_STDOUT_READ_TIMEOUT)
       except Queue.Empty:
         # Didn't get any data, so exit the loop to check that ADB is still
         # alive and print anything sent to stderr.
         break

       if reading_trace_data:
         # Save, but don't print, the trace data.
         trace_data.append(chunk)
       else:
         if not expect_trace:
           sys.stdout.write(chunk)
         else:
           # Buffer the output from ADB so we can remove some strings that
           # don't need to be shown to the user.
           current_line += chunk
           if re.match(TRACE_START_REGEXP, current_line):
             # We are done capturing the trace.
             sys.stdout.write('Done.\n')
             # Now we start downloading the trace data.
             sys.stdout.write('Downloading trace...')
             current_line = ''
             # Use a larger chunk size for efficiency since we no longer
             # need to worry about parsing the stream.
             stdout_thread.set_chunk_size(4096)
             reading_trace_data = True
           elif chunk == '\n' or chunk == '\r':
             # Remove ADB output that we don't care about.
             current_line = re.sub(ADB_IGNORE_REGEXP, '', current_line)
             if len(current_line) > 1:
               # ADB printed something that we didn't understand, so show
               # it to the user (might be helpful for debugging).
               sys.stdout.write(current_line)
             # Reset our current line.
             current_line = ''

   if expect_trace:
     if reading_trace_data:
       # Indicate to the user that the data download is complete.
       sys.stdout.write('Done.\n')
     else:
       # We didn't receive the trace start tag, so something went wrong.
       sys.stdout.write('ERROR.\n')
       # Show any buffered ADB output to the user.
       current_line = re.sub(ADB_IGNORE_REGEXP, '', current_line)
       if current_line:
         sys.stdout.write(current_line)
         sys.stdout.write('\n')

   # The threads should already have stopped, so this is just for cleanup.
   stdout_thread.join()
   stderr_thread.join()

   adb.stdout.close()
   adb.stderr.close()

   # The adb process should be done since its io pipes are closed, but it may
   # not have been reaped yet.  poll() would leave returncode set to None in
   # that case (and break the '%d' formatting below), so wait() for the exit
   # code instead.  All output has already been read, so this cannot block on
   # a full pipe.
   adb.wait()

   if adb.returncode != 0:
     print >> sys.stderr, ('The command "%s" returned error code %d.' %
                           (' '.join(tracer_args), adb.returncode))
     sys.exit(1)

   return trace_data


 def extract_thread_list(trace_data):
   """Splits the thread listing off the end of the given trace data.

   The listing is recognized by its column header line (USER PID PPID ...).
   Rows that do not have exactly nine white-space separated columns are
   skipped.

   Args:
     trace_data: The raw trace data (before decompression).
   Returns:
     A tuple containing the trace data that precedes the listing and a map of
     thread ids (second column) to thread names (ninth column).  If no listing
     is found, the trace data is returned unchanged with an empty map.
   """
   listing_header = 'USER +PID +PPID +VSIZE +RSS +WCHAN +PC +NAME'
   pieces = re.split(listing_header, trace_data, maxsplit=1)
   if len(pieces) != 2:
     return (trace_data, {})

   trace_part, listing = pieces
   threads = {}
   for row in listing.splitlines():
     fields = row.split(None, 8)
     if len(fields) == 9:
       threads[int(fields[1])] = fields[8]
   return (trace_part, threads)


 def strip_and_decompress_trace(trace_data):
   """Fixes new-lines and decompresses trace data.

   Args:
     trace_data: The trace data returned by atrace.
   Returns:
     The decompressed trace data with Unix line-endings and without leading
     newlines.  An empty string is returned if nothing is left once the
     initial newline has been removed.
   """
   # Collapse CRLFs that are added by adb shell.
   if trace_data.startswith('\r\n'):
     trace_data = trace_data.replace('\r\n', '\n')
   elif trace_data.startswith('\r\r\n'):
     # On windows, adb adds an extra '\r' character for each line.
     trace_data = trace_data.replace('\r\r\n', '\n')

   # Skip the initial newline, but only if there is one: dropping any other
   # character would corrupt the text header or the compressed stream.
   if trace_data.startswith('\n'):
     trace_data = trace_data[1:]

   if not trace_data:
     # Nothing to decompress; zlib would raise an error on empty input.
     return trace_data

   if not trace_data.startswith(TRACE_TEXT_HEADER):
     # No header found, so assume the data is compressed.
     trace_data = zlib.decompress(trace_data)

   # Enforce Unix line-endings.
   trace_data = trace_data.replace('\r', '')

   # Skip any initial newlines.
   return trace_data.lstrip('\n')


 def fix_thread_names(trace_data, thread_names):
   """Rewrites the '<name>-<tid>' prefix of trace lines using known names.

   Args:
     trace_data: The atrace data.
     thread_names: A mapping of thread ids to thread names.  Ids that are
         not in the mapping yet are added to it, using the name found in the
         trace, or '<tid>' when the trace only has the '<...>' placeholder.
   Returns:
     The updated trace data.
   """
   line_prefix_re = re.compile(r'^\s*(\S+)-(\d+)', re.MULTILINE)

   def substitute(match):
     traced_name, tid_text = match.group(1), match.group(2)
     tid = int(tid_text)
     if tid <= 0:
       # Leave entries with thread id 0 exactly as they are.
       return match.group(0)

     resolved = thread_names.get(tid)
     if resolved is None:
       if traced_name == '<...>':
         resolved = '<' + str(tid) + '>'
       else:
         resolved = traced_name
       # Remember the choice so later lines for this id use the same name.
       thread_names[tid] = resolved
     return resolved + '-' + tid_text

   return line_prefix_re.sub(substitute, trace_data)


 def preprocess_trace_data(options, trace_data):
   """Turns the chunks received from the trace process into final trace text.

   Exits the script with status 1 if there is no trace data.

   Args:
     options: The command-line options passed to this script.
     trace_data: The raw trace data, as a sequence of string chunks.
   Returns:
     The processed trace data.
   """
   raw_trace = ''.join(trace_data)

   if options.fix_threads:
     # Split off the thread list dumped by ps.
     raw_trace, thread_names = extract_thread_list(raw_trace)

   processed = strip_and_decompress_trace(raw_trace) if raw_trace else raw_trace

   if not processed:
     print >> sys.stderr, ('No data was captured.  Output file was not '
                           'written.')
     sys.exit(1)

   if options.fix_threads:
     processed = fix_thread_names(processed, thread_names)

   if options.fix_circular:
     processed = fix_circular_traces(processed)

   return processed


 def write_trace_html(html_filename, script_dir, trace_data):
   """Writes out a trace html file.

   The file consists of the 'prefix.html' asset (with its
   {{SYSTRACE_TRACE_VIEWER_HTML}} placeholder replaced by the
   'systrace_trace_viewer.html' asset), the trace data wrapped in a script
   element, and the 'suffix.html' asset.

   Args:
     html_filename: The name of the file to write.
     script_dir: The directory containing this script (and its assets).
     trace_data: The atrace data.
   """
   html_prefix = read_asset(script_dir, 'prefix.html')
   html_suffix = read_asset(script_dir, 'suffix.html')
   trace_viewer_html = read_asset(script_dir, 'systrace_trace_viewer.html')

   # Open the file in binary mode to prevent python from changing the
   # line endings.  The with statement closes the file even if a write fails.
   with open(html_filename, 'wb') as html_file:
     html_file.write(html_prefix.replace('{{SYSTRACE_TRACE_VIEWER_HTML}}',
                                         trace_viewer_html))

     html_file.write('<!-- BEGIN TRACE -->\n'
                     '  <script class="trace-data" type="application/text">\n')
     html_file.write(trace_data)
     html_file.write('  </script>\n<!-- END TRACE -->\n')

     html_file.write(html_suffix)

   print('\n    wrote file://%s\n' % os.path.abspath(html_filename))


 def main():
   """Captures a trace from the device and writes it out as an HTML file.

   Devices with an SDK version below 18 are handed over to the
   'systrace-legacy.py' script located next to this one.
   """
   if get_device_sdk_version() < 18:
     script_location = os.path.dirname(sys.argv[0])
     legacy_script = os.path.join(script_location, 'systrace-legacy.py')
     # execv() replaces the current process, so it does not return.
     os.execv(legacy_script, sys.argv)

   options, categories = parse_options()
   tracer_args, expect_trace = construct_trace_command(options, categories)
   collected = collect_trace_data(tracer_args, expect_trace)

   if expect_trace:
     # Only commands that produce a trace have anything to post-process.
     processed = preprocess_trace_data(options, collected)
     script_dir = os.path.dirname(os.path.abspath(sys.argv[0]))
     write_trace_html(options.output_file, script_dir, processed)


 def read_asset(src_dir, filename):
   """Returns the entire contents of an asset file.

   Args:
     src_dir: The directory that contains the asset.
     filename: The name of the asset file within src_dir.
   Returns:
     The contents of the file.
   """
   # The with statement makes sure the file is closed again right away instead
   # of whenever the file object happens to be garbage collected.
   with open(os.path.join(src_dir, filename)) as asset_file:
     return asset_file.read()


 def fix_circular_traces(out):
   """Fix inconsistencies in traces due to circular buffering.

   The circular buffers are kept per CPU, so it is not guaranteed that the
   beginning of a slice is overwritten before the end. To work around this, we
   throw away the prefix of the trace where not all CPUs have events yet.

   Args:
     out: The data to fix.
   Returns:
     The updated trace data: the header followed by everything from the last
     'buffer started' marker on.  The data is returned unchanged if it has no
     such marker, or if it has no line that does not start with '#'.
   """
   # If any of the CPU's buffers have filled up and
   # older events have been dropped, the kernel
   # emits markers of the form '##### CPU 2 buffer started ####' on
   # the line before the first event in the trace on that CPU.
   #
   # No such headers are emitted if there were no overflows or the trace
   # was captured with non-circular buffers.
   buffer_start_re = re.compile(r'^#+ CPU \d+ buffer started', re.MULTILINE)

   # Find the position of the last marker; 0 means that there is none.
   start_of_full_trace = 0
   for marker in buffer_start_re.finditer(out):
     start_of_full_trace = marker.start()

   if start_of_full_trace <= 0:
     return out

   # Need to keep the header intact to make the importer happy.  The header
   # ends at the first line that does not start with '#'.
   header_end = re.search(r'^[^#]', out, re.MULTILINE)
   if header_end is None:
     # The trace consists of '#' lines only, so there is nothing to cut.
     return out
   return out[:header_end.start()] + out[start_of_full_trace:]

 # Run the tool only when this file is executed as a script, not when it is
 # imported as a module.
 if __name__ == '__main__':
   main()