mirror of
				https://github.com/sqlmapproject/sqlmap.git
				synced 2025-11-04 01:47:37 +03:00 
			
		
		
		
	
		
			
				
	
	
		
			2625 lines
		
	
	
		
			82 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable File
		
	
	
	
	
			
		
		
	
	
			2625 lines
		
	
	
		
			82 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable File
		
	
	
	
	
#!/usr/bin/env python
 | 
						|
#
 | 
						|
# Copyright 2008-2009 Jose Fonseca
 | 
						|
#
 | 
						|
# This program is free software: you can redistribute it and/or modify it
 | 
						|
# under the terms of the GNU Lesser General Public License as published
 | 
						|
# by the Free Software Foundation, either version 3 of the License, or
 | 
						|
# (at your option) any later version.
 | 
						|
#
 | 
						|
# This program is distributed in the hope that it will be useful,
 | 
						|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
						|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
						|
# GNU Lesser General Public License for more details.
 | 
						|
#
 | 
						|
# You should have received a copy of the GNU Lesser General Public License
 | 
						|
# along with this program.  If not, see <http://www.gnu.org/licenses/>.
 | 
						|
#
 | 
						|
 | 
						|
"""Generate a dot graph from the output of several profilers."""
 | 
						|
 | 
						|
__author__ = "Jose Fonseca"
 | 
						|
 | 
						|
__version__ = "1.0"
 | 
						|
 | 
						|
 | 
						|
import sys
 | 
						|
import math
 | 
						|
import os.path
 | 
						|
import re
 | 
						|
import textwrap
 | 
						|
import optparse
 | 
						|
import xml.parsers.expat
 | 
						|
 | 
						|
 | 
						|
try:
 | 
						|
    # Debugging helper module
 | 
						|
    import debug
 | 
						|
except ImportError:
 | 
						|
    pass
 | 
						|
 | 
						|
 | 
						|
def times(x):
 | 
						|
    return u"%u\xd7" % (x,)
 | 
						|
 | 
						|
def percentage(p):
 | 
						|
    return "%.02f%%" % (p*100.0,)
 | 
						|
 | 
						|
def add(a, b):
 | 
						|
    return a + b
 | 
						|
 | 
						|
def equal(a, b):
 | 
						|
    if a == b:
 | 
						|
        return a
 | 
						|
    else:
 | 
						|
        return None
 | 
						|
 | 
						|
def fail(a, b):
 | 
						|
    assert False
 | 
						|
 | 
						|
 | 
						|
tol = 2 ** -23
 | 
						|
 | 
						|
def ratio(numerator, denominator):
 | 
						|
    try:
 | 
						|
        ratio = float(numerator)/float(denominator)
 | 
						|
    except ZeroDivisionError:
 | 
						|
        # 0/0 is undefined, but 1.0 yields more useful results
 | 
						|
        return 1.0
 | 
						|
    if ratio < 0.0:
 | 
						|
        if ratio < -tol:
 | 
						|
            sys.stderr.write('warning: negative ratio (%s/%s)\n' % (numerator, denominator))
 | 
						|
        return 0.0
 | 
						|
    if ratio > 1.0:
 | 
						|
        if ratio > 1.0 + tol:
 | 
						|
            sys.stderr.write('warning: ratio greater than one (%s/%s)\n' % (numerator, denominator))
 | 
						|
        return 1.0
 | 
						|
    return ratio
 | 
						|
 | 
						|
 | 
						|
class UndefinedEvent(Exception):
 | 
						|
    """Raised when attempting to get an event which is undefined."""
 | 
						|
    
 | 
						|
    def __init__(self, event):
 | 
						|
        Exception.__init__(self)
 | 
						|
        self.event = event
 | 
						|
 | 
						|
    def __str__(self):
 | 
						|
        return 'unspecified event %s' % self.event.name
 | 
						|
 | 
						|
 | 
						|
class Event(object):
 | 
						|
    """Describe a kind of event, and its basic operations."""
 | 
						|
 | 
						|
    def __init__(self, name, null, aggregator, formatter = str):
 | 
						|
        self.name = name
 | 
						|
        self._null = null
 | 
						|
        self._aggregator = aggregator
 | 
						|
        self._formatter = formatter
 | 
						|
 | 
						|
    def __eq__(self, other):
 | 
						|
        return self is other
 | 
						|
 | 
						|
    def __hash__(self):
 | 
						|
        return id(self)
 | 
						|
 | 
						|
    def null(self):
 | 
						|
        return self._null
 | 
						|
 | 
						|
    def aggregate(self, val1, val2):
 | 
						|
        """Aggregate two event values."""
 | 
						|
        assert val1 is not None
 | 
						|
        assert val2 is not None
 | 
						|
        return self._aggregator(val1, val2)
 | 
						|
    
 | 
						|
    def format(self, val):
 | 
						|
        """Format an event value."""
 | 
						|
        assert val is not None
 | 
						|
        return self._formatter(val)
 | 
						|
 | 
						|
 | 
						|
CALLS = Event("Calls", 0, add, times)
 | 
						|
SAMPLES = Event("Samples", 0, add)
 | 
						|
SAMPLES2 = Event("Samples", 0, add)
 | 
						|
 | 
						|
TIME = Event("Time", 0.0, add, lambda x: '(' + str(x) + ')')
 | 
						|
TIME_RATIO = Event("Time ratio", 0.0, add, lambda x: '(' + percentage(x) + ')')
 | 
						|
TOTAL_TIME = Event("Total time", 0.0, fail)
 | 
						|
TOTAL_TIME_RATIO = Event("Total time ratio", 0.0, fail, percentage)
 | 
						|
 | 
						|
 | 
						|
class Object(object):
 | 
						|
    """Base class for all objects in profile which can store events."""
 | 
						|
 | 
						|
    def __init__(self, events=None):
 | 
						|
        if events is None:
 | 
						|
            self.events = {}
 | 
						|
        else:
 | 
						|
            self.events = events
 | 
						|
 | 
						|
    def __hash__(self):
 | 
						|
        return id(self)
 | 
						|
 | 
						|
    def __eq__(self, other):
 | 
						|
        return self is other
 | 
						|
 | 
						|
    def __contains__(self, event):
 | 
						|
        return event in self.events
 | 
						|
    
 | 
						|
    def __getitem__(self, event):
 | 
						|
        try:
 | 
						|
            return self.events[event]
 | 
						|
        except KeyError:
 | 
						|
            raise UndefinedEvent(event)
 | 
						|
    
 | 
						|
    def __setitem__(self, event, value):
 | 
						|
        if value is None:
 | 
						|
            if event in self.events:
 | 
						|
                del self.events[event]
 | 
						|
        else:
 | 
						|
            self.events[event] = value
 | 
						|
 | 
						|
 | 
						|
class Call(Object):
 | 
						|
    """A call between functions.
 | 
						|
    
 | 
						|
    There should be at most one call object for every pair of functions.
 | 
						|
    """
 | 
						|
 | 
						|
    def __init__(self, callee_id):
 | 
						|
        Object.__init__(self)
 | 
						|
        self.callee_id = callee_id
 | 
						|
        self.ratio = None
 | 
						|
        self.weight = None
 | 
						|
 | 
						|
 | 
						|
class Function(Object):
 | 
						|
    """A function."""
 | 
						|
 | 
						|
    def __init__(self, id, name):
 | 
						|
        Object.__init__(self)
 | 
						|
        self.id = id
 | 
						|
        self.name = name
 | 
						|
        self.module = None
 | 
						|
        self.process = None
 | 
						|
        self.calls = {}
 | 
						|
        self.called = None
 | 
						|
        self.weight = None
 | 
						|
        self.cycle = None
 | 
						|
    
 | 
						|
    def add_call(self, call):
 | 
						|
        if call.callee_id in self.calls:
 | 
						|
            sys.stderr.write('warning: overwriting call from function %s to %s\n' % (str(self.id), str(call.callee_id)))
 | 
						|
        self.calls[call.callee_id] = call
 | 
						|
 | 
						|
    # TODO: write utility functions
 | 
						|
 | 
						|
    def __repr__(self):
 | 
						|
        return self.name
 | 
						|
 | 
						|
 | 
						|
class Cycle(Object):
 | 
						|
    """A cycle made from recursive function calls."""
 | 
						|
 | 
						|
    def __init__(self):
 | 
						|
        Object.__init__(self)
 | 
						|
        # XXX: Do cycles need an id?
 | 
						|
        self.functions = set()
 | 
						|
 | 
						|
    def add_function(self, function):
 | 
						|
        assert function not in self.functions
 | 
						|
        self.functions.add(function)
 | 
						|
        # XXX: Aggregate events?
 | 
						|
        if function.cycle is not None:
 | 
						|
            for other in function.cycle.functions:
 | 
						|
                if function not in self.functions:
 | 
						|
                    self.add_function(other)
 | 
						|
        function.cycle = self
 | 
						|
 | 
						|
 | 
						|
class Profile(Object):
 | 
						|
    """The whole profile."""
 | 
						|
 | 
						|
    def __init__(self):
 | 
						|
        Object.__init__(self)
 | 
						|
        self.functions = {}
 | 
						|
        self.cycles = []
 | 
						|
 | 
						|
    def add_function(self, function):
 | 
						|
        if function.id in self.functions:
 | 
						|
            sys.stderr.write('warning: overwriting function %s (id %s)\n' % (function.name, str(function.id)))
 | 
						|
        self.functions[function.id] = function
 | 
						|
 | 
						|
    def add_cycle(self, cycle):
 | 
						|
        self.cycles.append(cycle)
 | 
						|
 | 
						|
    def validate(self):
 | 
						|
        """Validate the edges."""
 | 
						|
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            for callee_id in function.calls.keys():
 | 
						|
                assert function.calls[callee_id].callee_id == callee_id
 | 
						|
                if callee_id not in self.functions:
 | 
						|
                    sys.stderr.write('warning: call to undefined function %s from function %s\n' % (str(callee_id), function.name))
 | 
						|
                    del function.calls[callee_id]
 | 
						|
 | 
						|
    def find_cycles(self):
 | 
						|
        """Find cycles using Tarjan's strongly connected components algorithm."""
 | 
						|
 | 
						|
        # Apply the Tarjan's algorithm successively until all functions are visited
 | 
						|
        visited = set()
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            if function not in visited:
 | 
						|
                self._tarjan(function, 0, [], {}, {}, visited)
 | 
						|
        cycles = []
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            if function.cycle is not None and function.cycle not in cycles:
 | 
						|
                cycles.append(function.cycle)
 | 
						|
        self.cycles = cycles
 | 
						|
        if 0:
 | 
						|
            for cycle in cycles:
 | 
						|
                sys.stderr.write("Cycle:\n")
 | 
						|
                for member in cycle.functions:
 | 
						|
                    sys.stderr.write("\tFunction %s\n" % member.name)
 | 
						|
    
 | 
						|
    def _tarjan(self, function, order, stack, orders, lowlinks, visited):
 | 
						|
        """Tarjan's strongly connected components algorithm.
 | 
						|
 | 
						|
        See also:
 | 
						|
        - http://en.wikipedia.org/wiki/Tarjan's_strongly_connected_components_algorithm
 | 
						|
        """
 | 
						|
 | 
						|
        visited.add(function)
 | 
						|
        orders[function] = order
 | 
						|
        lowlinks[function] = order
 | 
						|
        order += 1
 | 
						|
        pos = len(stack)
 | 
						|
        stack.append(function)
 | 
						|
        for call in function.calls.itervalues():
 | 
						|
            callee = self.functions[call.callee_id]
 | 
						|
            # TODO: use a set to optimize lookup
 | 
						|
            if callee not in orders:
 | 
						|
                order = self._tarjan(callee, order, stack, orders, lowlinks, visited)
 | 
						|
                lowlinks[function] = min(lowlinks[function], lowlinks[callee])
 | 
						|
            elif callee in stack:
 | 
						|
                lowlinks[function] = min(lowlinks[function], orders[callee])
 | 
						|
        if lowlinks[function] == orders[function]:
 | 
						|
            # Strongly connected component found
 | 
						|
            members = stack[pos:]
 | 
						|
            del stack[pos:]
 | 
						|
            if len(members) > 1:
 | 
						|
                cycle = Cycle()
 | 
						|
                for member in members:
 | 
						|
                    cycle.add_function(member)
 | 
						|
        return order
 | 
						|
 | 
						|
    def call_ratios(self, event):
 | 
						|
        # Aggregate for incoming calls
 | 
						|
        cycle_totals = {}
 | 
						|
        for cycle in self.cycles:
 | 
						|
            cycle_totals[cycle] = 0.0
 | 
						|
        function_totals = {}
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            function_totals[function] = 0.0
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            for call in function.calls.itervalues():
 | 
						|
                if call.callee_id != function.id:
 | 
						|
                    callee = self.functions[call.callee_id]
 | 
						|
                    function_totals[callee] += call[event]
 | 
						|
                    if callee.cycle is not None and callee.cycle is not function.cycle:
 | 
						|
                        cycle_totals[callee.cycle] += call[event]
 | 
						|
 | 
						|
        # Compute the ratios
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            for call in function.calls.itervalues():
 | 
						|
                assert call.ratio is None
 | 
						|
                if call.callee_id != function.id:
 | 
						|
                    callee = self.functions[call.callee_id]
 | 
						|
                    if callee.cycle is not None and callee.cycle is not function.cycle:
 | 
						|
                        total = cycle_totals[callee.cycle]
 | 
						|
                    else:
 | 
						|
                        total = function_totals[callee]
 | 
						|
                    call.ratio = ratio(call[event], total)
 | 
						|
 | 
						|
    def integrate(self, outevent, inevent):
 | 
						|
        """Propagate function time ratio allong the function calls.
 | 
						|
 | 
						|
        Must be called after finding the cycles.
 | 
						|
 | 
						|
        See also:
 | 
						|
        - http://citeseer.ist.psu.edu/graham82gprof.html
 | 
						|
        """
 | 
						|
 | 
						|
        # Sanity checking
 | 
						|
        assert outevent not in self
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            assert outevent not in function
 | 
						|
            assert inevent in function
 | 
						|
            for call in function.calls.itervalues():
 | 
						|
                assert outevent not in call
 | 
						|
                if call.callee_id != function.id:
 | 
						|
                    assert call.ratio is not None
 | 
						|
 | 
						|
        # Aggregate the input for each cycle 
 | 
						|
        for cycle in self.cycles:
 | 
						|
            total = inevent.null()
 | 
						|
            for function in self.functions.itervalues():
 | 
						|
                total = inevent.aggregate(total, function[inevent])
 | 
						|
            self[inevent] = total
 | 
						|
 | 
						|
        # Integrate along the edges
 | 
						|
        total = inevent.null()
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            total = inevent.aggregate(total, function[inevent])
 | 
						|
            self._integrate_function(function, outevent, inevent)
 | 
						|
        self[outevent] = total
 | 
						|
 | 
						|
    def _integrate_function(self, function, outevent, inevent):
 | 
						|
        if function.cycle is not None:
 | 
						|
            return self._integrate_cycle(function.cycle, outevent, inevent)
 | 
						|
        else:
 | 
						|
            if outevent not in function:
 | 
						|
                total = function[inevent]
 | 
						|
                for call in function.calls.itervalues():
 | 
						|
                    if call.callee_id != function.id:
 | 
						|
                        total += self._integrate_call(call, outevent, inevent)
 | 
						|
                function[outevent] = total
 | 
						|
            return function[outevent]
 | 
						|
    
 | 
						|
    def _integrate_call(self, call, outevent, inevent):
 | 
						|
        assert outevent not in call
 | 
						|
        assert call.ratio is not None
 | 
						|
        callee = self.functions[call.callee_id]
 | 
						|
        subtotal = call.ratio *self._integrate_function(callee, outevent, inevent)
 | 
						|
        call[outevent] = subtotal
 | 
						|
        return subtotal
 | 
						|
 | 
						|
    def _integrate_cycle(self, cycle, outevent, inevent):
 | 
						|
        if outevent not in cycle:
 | 
						|
 | 
						|
            # Compute the outevent for the whole cycle
 | 
						|
            total = inevent.null()
 | 
						|
            for member in cycle.functions:
 | 
						|
                subtotal = member[inevent]
 | 
						|
                for call in member.calls.itervalues():
 | 
						|
                    callee = self.functions[call.callee_id]
 | 
						|
                    if callee.cycle is not cycle:
 | 
						|
                        subtotal += self._integrate_call(call, outevent, inevent)
 | 
						|
                total += subtotal
 | 
						|
            cycle[outevent] = total
 | 
						|
            
 | 
						|
            # Compute the time propagated to callers of this cycle
 | 
						|
            callees = {}
 | 
						|
            for function in self.functions.itervalues():
 | 
						|
                if function.cycle is not cycle:
 | 
						|
                    for call in function.calls.itervalues():
 | 
						|
                        callee = self.functions[call.callee_id]
 | 
						|
                        if callee.cycle is cycle:
 | 
						|
                            try:
 | 
						|
                                callees[callee] += call.ratio
 | 
						|
                            except KeyError:
 | 
						|
                                callees[callee] = call.ratio
 | 
						|
            
 | 
						|
            for member in cycle.functions:
 | 
						|
                member[outevent] = outevent.null()
 | 
						|
 | 
						|
            for callee, call_ratio in callees.iteritems():
 | 
						|
                ranks = {}
 | 
						|
                call_ratios = {}
 | 
						|
                partials = {}
 | 
						|
                self._rank_cycle_function(cycle, callee, 0, ranks)
 | 
						|
                self._call_ratios_cycle(cycle, callee, ranks, call_ratios, set())
 | 
						|
                partial = self._integrate_cycle_function(cycle, callee, call_ratio, partials, ranks, call_ratios, outevent, inevent)
 | 
						|
                assert partial == max(partials.values())
 | 
						|
                assert not total or abs(1.0 - partial/(call_ratio*total)) <= 0.001
 | 
						|
 | 
						|
        return cycle[outevent]
 | 
						|
 | 
						|
    def _rank_cycle_function(self, cycle, function, rank, ranks):
 | 
						|
        if function not in ranks or ranks[function] > rank:
 | 
						|
            ranks[function] = rank
 | 
						|
            for call in function.calls.itervalues():
 | 
						|
                if call.callee_id != function.id:
 | 
						|
                    callee = self.functions[call.callee_id]
 | 
						|
                    if callee.cycle is cycle:
 | 
						|
                        self._rank_cycle_function(cycle, callee, rank + 1, ranks)
 | 
						|
 | 
						|
    def _call_ratios_cycle(self, cycle, function, ranks, call_ratios, visited):
 | 
						|
        if function not in visited:
 | 
						|
            visited.add(function)
 | 
						|
            for call in function.calls.itervalues():
 | 
						|
                if call.callee_id != function.id:
 | 
						|
                    callee = self.functions[call.callee_id]
 | 
						|
                    if callee.cycle is cycle:
 | 
						|
                        if ranks[callee] > ranks[function]:
 | 
						|
                            call_ratios[callee] = call_ratios.get(callee, 0.0) + call.ratio
 | 
						|
                            self._call_ratios_cycle(cycle, callee, ranks, call_ratios, visited)
 | 
						|
 | 
						|
    def _integrate_cycle_function(self, cycle, function, partial_ratio, partials, ranks, call_ratios, outevent, inevent):
 | 
						|
        if function not in partials:
 | 
						|
            partial = partial_ratio*function[inevent]
 | 
						|
            for call in function.calls.itervalues():
 | 
						|
                if call.callee_id != function.id:
 | 
						|
                    callee = self.functions[call.callee_id]
 | 
						|
                    if callee.cycle is not cycle:
 | 
						|
                        assert outevent in call
 | 
						|
                        partial += partial_ratio*call[outevent]
 | 
						|
                    else:
 | 
						|
                        if ranks[callee] > ranks[function]:
 | 
						|
                            callee_partial = self._integrate_cycle_function(cycle, callee, partial_ratio, partials, ranks, call_ratios, outevent, inevent)
 | 
						|
                            call_ratio = ratio(call.ratio, call_ratios[callee])
 | 
						|
                            call_partial = call_ratio*callee_partial
 | 
						|
                            try:
 | 
						|
                                call[outevent] += call_partial
 | 
						|
                            except UndefinedEvent:
 | 
						|
                                call[outevent] = call_partial
 | 
						|
                            partial += call_partial
 | 
						|
            partials[function] = partial
 | 
						|
            try:
 | 
						|
                function[outevent] += partial
 | 
						|
            except UndefinedEvent:
 | 
						|
                function[outevent] = partial
 | 
						|
        return partials[function]
 | 
						|
 | 
						|
    def aggregate(self, event):
 | 
						|
        """Aggregate an event for the whole profile."""
 | 
						|
 | 
						|
        total = event.null()
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            try:
 | 
						|
                total = event.aggregate(total, function[event])
 | 
						|
            except UndefinedEvent:
 | 
						|
                return
 | 
						|
        self[event] = total
 | 
						|
 | 
						|
    def ratio(self, outevent, inevent):
 | 
						|
        assert outevent not in self
 | 
						|
        assert inevent in self
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            assert outevent not in function
 | 
						|
            assert inevent in function
 | 
						|
            function[outevent] = ratio(function[inevent], self[inevent])
 | 
						|
            for call in function.calls.itervalues():
 | 
						|
                assert outevent not in call
 | 
						|
                if inevent in call:
 | 
						|
                    call[outevent] = ratio(call[inevent], self[inevent])
 | 
						|
        self[outevent] = 1.0
 | 
						|
 | 
						|
    def prune(self, node_thres, edge_thres):
 | 
						|
        """Prune the profile"""
 | 
						|
 | 
						|
        # compute the prune ratios
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            try:
 | 
						|
                function.weight = function[TOTAL_TIME_RATIO]
 | 
						|
            except UndefinedEvent:
 | 
						|
                pass
 | 
						|
 | 
						|
            for call in function.calls.itervalues():
 | 
						|
                callee = self.functions[call.callee_id]
 | 
						|
 | 
						|
                if TOTAL_TIME_RATIO in call:
 | 
						|
                    # handle exact cases first
 | 
						|
                    call.weight = call[TOTAL_TIME_RATIO] 
 | 
						|
                else:
 | 
						|
                    try:
 | 
						|
                        # make a safe estimate
 | 
						|
                        call.weight = min(function[TOTAL_TIME_RATIO], callee[TOTAL_TIME_RATIO]) 
 | 
						|
                    except UndefinedEvent:
 | 
						|
                        pass
 | 
						|
 | 
						|
        # prune the nodes
 | 
						|
        for function_id in self.functions.keys():
 | 
						|
            function = self.functions[function_id]
 | 
						|
            if function.weight is not None:
 | 
						|
                if function.weight < node_thres:
 | 
						|
                    del self.functions[function_id]
 | 
						|
 | 
						|
        # prune the egdes
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            for callee_id in function.calls.keys():
 | 
						|
                call = function.calls[callee_id]
 | 
						|
                if callee_id not in self.functions or call.weight is not None and call.weight < edge_thres:
 | 
						|
                    del function.calls[callee_id]
 | 
						|
    
 | 
						|
    def dump(self):
 | 
						|
        for function in self.functions.itervalues():
 | 
						|
            sys.stderr.write('Function %s:\n' % (function.name,))
 | 
						|
            self._dump_events(function.events)
 | 
						|
            for call in function.calls.itervalues():
 | 
						|
                callee = self.functions[call.callee_id]
 | 
						|
                sys.stderr.write('  Call %s:\n' % (callee.name,))
 | 
						|
                self._dump_events(call.events)
 | 
						|
        for cycle in self.cycles:
 | 
						|
            sys.stderr.write('Cycle:\n')
 | 
						|
            self._dump_events(cycle.events)
 | 
						|
            for function in cycle.functions:
 | 
						|
                sys.stderr.write('  Function %s\n' % (function.name,))
 | 
						|
 | 
						|
    def _dump_events(self, events):
 | 
						|
        for event, value in events.iteritems():
 | 
						|
            sys.stderr.write('    %s: %s\n' % (event.name, event.format(value)))
 | 
						|
 | 
						|
 | 
						|
class Struct:
 | 
						|
    """Masquerade a dictionary with a structure-like behavior."""
 | 
						|
 | 
						|
    def __init__(self, attrs = None):
 | 
						|
        if attrs is None:
 | 
						|
            attrs = {}
 | 
						|
        self.__dict__['_attrs'] = attrs
 | 
						|
    
 | 
						|
    def __getattr__(self, name):
 | 
						|
        try:
 | 
						|
            return self._attrs[name]
 | 
						|
        except KeyError:
 | 
						|
            raise AttributeError(name)
 | 
						|
 | 
						|
    def __setattr__(self, name, value):
 | 
						|
        self._attrs[name] = value
 | 
						|
 | 
						|
    def __str__(self):
 | 
						|
        return str(self._attrs)
 | 
						|
 | 
						|
    def __repr__(self):
 | 
						|
        return repr(self._attrs)
 | 
						|
    
 | 
						|
 | 
						|
class ParseError(Exception):
 | 
						|
    """Raised when parsing to signal mismatches."""
 | 
						|
 | 
						|
    def __init__(self, msg, line):
 | 
						|
        self.msg = msg
 | 
						|
        # TODO: store more source line information
 | 
						|
        self.line = line
 | 
						|
 | 
						|
    def __str__(self):
 | 
						|
        return '%s: %r' % (self.msg, self.line)
 | 
						|
 | 
						|
 | 
						|
class Parser:
 | 
						|
    """Parser interface."""
 | 
						|
 | 
						|
    def __init__(self):
 | 
						|
        pass
 | 
						|
 | 
						|
    def parse(self):
 | 
						|
        raise NotImplementedError
 | 
						|
 | 
						|
    
 | 
						|
class LineParser(Parser):
 | 
						|
    """Base class for parsers that read line-based formats."""
 | 
						|
 | 
						|
    def __init__(self, file):
 | 
						|
        Parser.__init__(self)
 | 
						|
        self._file = file
 | 
						|
        self.__line = None
 | 
						|
        self.__eof = False
 | 
						|
 | 
						|
    def readline(self):
 | 
						|
        line = self._file.readline()
 | 
						|
        if not line:
 | 
						|
            self.__line = ''
 | 
						|
            self.__eof = True
 | 
						|
        self.__line = line.rstrip('\r\n')
 | 
						|
 | 
						|
    def lookahead(self):
 | 
						|
        assert self.__line is not None
 | 
						|
        return self.__line
 | 
						|
 | 
						|
    def consume(self):
 | 
						|
        assert self.__line is not None
 | 
						|
        line = self.__line
 | 
						|
        self.readline()
 | 
						|
        return line
 | 
						|
 | 
						|
    def eof(self):
 | 
						|
        assert self.__line is not None
 | 
						|
        return self.__eof
 | 
						|
 | 
						|
 | 
						|
XML_ELEMENT_START, XML_ELEMENT_END, XML_CHARACTER_DATA, XML_EOF = range(4)
 | 
						|
 | 
						|
 | 
						|
class XmlToken:
 | 
						|
 | 
						|
    def __init__(self, type, name_or_data, attrs = None, line = None, column = None):
 | 
						|
        assert type in (XML_ELEMENT_START, XML_ELEMENT_END, XML_CHARACTER_DATA, XML_EOF)
 | 
						|
        self.type = type
 | 
						|
        self.name_or_data = name_or_data
 | 
						|
        self.attrs = attrs
 | 
						|
        self.line = line
 | 
						|
        self.column = column
 | 
						|
 | 
						|
    def __str__(self):
 | 
						|
        if self.type == XML_ELEMENT_START:
 | 
						|
            return '<' + self.name_or_data + ' ...>'
 | 
						|
        if self.type == XML_ELEMENT_END:
 | 
						|
            return '</' + self.name_or_data + '>'
 | 
						|
        if self.type == XML_CHARACTER_DATA:
 | 
						|
            return self.name_or_data
 | 
						|
        if self.type == XML_EOF:
 | 
						|
            return 'end of file'
 | 
						|
        assert 0
 | 
						|
 | 
						|
 | 
						|
class XmlTokenizer:
 | 
						|
    """Expat based XML tokenizer."""
 | 
						|
 | 
						|
    def __init__(self, fp, skip_ws = True):
 | 
						|
        self.fp = fp
 | 
						|
        self.tokens = []
 | 
						|
        self.index = 0
 | 
						|
        self.final = False
 | 
						|
        self.skip_ws = skip_ws
 | 
						|
        
 | 
						|
        self.character_pos = 0, 0
 | 
						|
        self.character_data = ''
 | 
						|
        
 | 
						|
        self.parser = xml.parsers.expat.ParserCreate()
 | 
						|
        self.parser.StartElementHandler  = self.handle_element_start
 | 
						|
        self.parser.EndElementHandler    = self.handle_element_end
 | 
						|
        self.parser.CharacterDataHandler = self.handle_character_data
 | 
						|
    
 | 
						|
    def handle_element_start(self, name, attributes):
 | 
						|
        self.finish_character_data()
 | 
						|
        line, column = self.pos()
 | 
						|
        token = XmlToken(XML_ELEMENT_START, name, attributes, line, column)
 | 
						|
        self.tokens.append(token)
 | 
						|
    
 | 
						|
    def handle_element_end(self, name):
 | 
						|
        self.finish_character_data()
 | 
						|
        line, column = self.pos()
 | 
						|
        token = XmlToken(XML_ELEMENT_END, name, None, line, column)
 | 
						|
        self.tokens.append(token)
 | 
						|
 | 
						|
    def handle_character_data(self, data):
 | 
						|
        if not self.character_data:
 | 
						|
            self.character_pos = self.pos()
 | 
						|
        self.character_data += data
 | 
						|
    
 | 
						|
    def finish_character_data(self):
 | 
						|
        if self.character_data:
 | 
						|
            if not self.skip_ws or not self.character_data.isspace(): 
 | 
						|
                line, column = self.character_pos
 | 
						|
                token = XmlToken(XML_CHARACTER_DATA, self.character_data, None, line, column)
 | 
						|
                self.tokens.append(token)
 | 
						|
            self.character_data = ''
 | 
						|
    
 | 
						|
    def next(self):
 | 
						|
        size = 16*1024
 | 
						|
        while self.index >= len(self.tokens) and not self.final:
 | 
						|
            self.tokens = []
 | 
						|
            self.index = 0
 | 
						|
            data = self.fp.read(size)
 | 
						|
            self.final = len(data) < size
 | 
						|
            try:
 | 
						|
                self.parser.Parse(data, self.final)
 | 
						|
            except xml.parsers.expat.ExpatError, e:
 | 
						|
                #if e.code == xml.parsers.expat.errors.XML_ERROR_NO_ELEMENTS:
 | 
						|
                if e.code == 3:
 | 
						|
                    pass
 | 
						|
                else:
 | 
						|
                    raise e
 | 
						|
        if self.index >= len(self.tokens):
 | 
						|
            line, column = self.pos()
 | 
						|
            token = XmlToken(XML_EOF, None, None, line, column)
 | 
						|
        else:
 | 
						|
            token = self.tokens[self.index]
 | 
						|
            self.index += 1
 | 
						|
        return token
 | 
						|
 | 
						|
    def pos(self):
 | 
						|
        return self.parser.CurrentLineNumber, self.parser.CurrentColumnNumber
 | 
						|
 | 
						|
 | 
						|
class XmlTokenMismatch(Exception):
 | 
						|
 | 
						|
    def __init__(self, expected, found):
 | 
						|
        self.expected = expected
 | 
						|
        self.found = found
 | 
						|
 | 
						|
    def __str__(self):
 | 
						|
        return '%u:%u: %s expected, %s found' % (self.found.line, self.found.column, str(self.expected), str(self.found))
 | 
						|
 | 
						|
 | 
						|
class XmlParser(Parser):
 | 
						|
    """Base XML document parser."""
 | 
						|
 | 
						|
    def __init__(self, fp):
 | 
						|
        Parser.__init__(self)
 | 
						|
        self.tokenizer = XmlTokenizer(fp)
 | 
						|
        self.consume()
 | 
						|
    
 | 
						|
    def consume(self):
 | 
						|
        self.token = self.tokenizer.next()
 | 
						|
 | 
						|
    def match_element_start(self, name):
 | 
						|
        return self.token.type == XML_ELEMENT_START and self.token.name_or_data == name
 | 
						|
    
 | 
						|
    def match_element_end(self, name):
 | 
						|
        return self.token.type == XML_ELEMENT_END and self.token.name_or_data == name
 | 
						|
 | 
						|
    def element_start(self, name):
 | 
						|
        while self.token.type == XML_CHARACTER_DATA:
 | 
						|
            self.consume()
 | 
						|
        if self.token.type != XML_ELEMENT_START:
 | 
						|
            raise XmlTokenMismatch(XmlToken(XML_ELEMENT_START, name), self.token)
 | 
						|
        if self.token.name_or_data != name:
 | 
						|
            raise XmlTokenMismatch(XmlToken(XML_ELEMENT_START, name), self.token)
 | 
						|
        attrs = self.token.attrs
 | 
						|
        self.consume()
 | 
						|
        return attrs
 | 
						|
    
 | 
						|
    def element_end(self, name):
 | 
						|
        while self.token.type == XML_CHARACTER_DATA:
 | 
						|
            self.consume()
 | 
						|
        if self.token.type != XML_ELEMENT_END:
 | 
						|
            raise XmlTokenMismatch(XmlToken(XML_ELEMENT_END, name), self.token)
 | 
						|
        if self.token.name_or_data != name:
 | 
						|
            raise XmlTokenMismatch(XmlToken(XML_ELEMENT_END, name), self.token)
 | 
						|
        self.consume()
 | 
						|
 | 
						|
    def character_data(self, strip = True):
 | 
						|
        data = ''
 | 
						|
        while self.token.type == XML_CHARACTER_DATA:
 | 
						|
            data += self.token.name_or_data
 | 
						|
            self.consume()
 | 
						|
        if strip:
 | 
						|
            data = data.strip()
 | 
						|
        return data
 | 
						|
 | 
						|
 | 
						|
class GprofParser(Parser):
 | 
						|
    """Parser for GNU gprof output.
 | 
						|
 | 
						|
    See also:
 | 
						|
    - Chapter "Interpreting gprof's Output" from the GNU gprof manual
 | 
						|
      http://sourceware.org/binutils/docs-2.18/gprof/Call-Graph.html#Call-Graph
 | 
						|
    - File "cg_print.c" from the GNU gprof source code
 | 
						|
      http://sourceware.org/cgi-bin/cvsweb.cgi/~checkout~/src/gprof/cg_print.c?rev=1.12&cvsroot=src
 | 
						|
    """
 | 
						|
 | 
						|
    def __init__(self, fp):
 | 
						|
        Parser.__init__(self)
 | 
						|
        self.fp = fp
 | 
						|
        self.functions = {}
 | 
						|
        self.cycles = {}
 | 
						|
 | 
						|
    def readline(self):
 | 
						|
        line = self.fp.readline()
 | 
						|
        if not line:
 | 
						|
            sys.stderr.write('error: unexpected end of file\n')
 | 
						|
            sys.exit(1)
 | 
						|
        line = line.rstrip('\r\n')
 | 
						|
        return line
 | 
						|
 | 
						|
    _int_re = re.compile(r'^\d+$')
 | 
						|
    _float_re = re.compile(r'^\d+\.\d+$')
 | 
						|
 | 
						|
    def translate(self, mo):
 | 
						|
        """Extract a structure from a match object, while translating the types in the process."""
 | 
						|
        attrs = {}
 | 
						|
        groupdict = mo.groupdict()
 | 
						|
        for name, value in groupdict.iteritems():
 | 
						|
            if value is None:
 | 
						|
                value = None
 | 
						|
            elif self._int_re.match(value):
 | 
						|
                value = int(value)
 | 
						|
            elif self._float_re.match(value):
 | 
						|
                value = float(value)
 | 
						|
            attrs[name] = (value)
 | 
						|
        return Struct(attrs)
 | 
						|
 | 
						|
    _cg_header_re = re.compile(
 | 
						|
        # original gprof header
 | 
						|
        r'^\s+called/total\s+parents\s*$|' +
 | 
						|
        r'^index\s+%time\s+self\s+descendents\s+called\+self\s+name\s+index\s*$|' +
 | 
						|
        r'^\s+called/total\s+children\s*$|' +
 | 
						|
        # GNU gprof header
 | 
						|
        r'^index\s+%\s+time\s+self\s+children\s+called\s+name\s*$'
 | 
						|
    )
 | 
						|
 | 
						|
    _cg_ignore_re = re.compile(
 | 
						|
        # spontaneous
 | 
						|
        r'^\s+<spontaneous>\s*$|'
 | 
						|
        # internal calls (such as "mcount")
 | 
						|
        r'^.*\((\d+)\)$'
 | 
						|
    )
 | 
						|
 | 
						|
    _cg_primary_re = re.compile(
 | 
						|
        r'^\[(?P<index>\d+)\]?' + 
 | 
						|
        r'\s+(?P<percentage_time>\d+\.\d+)' + 
 | 
						|
        r'\s+(?P<self>\d+\.\d+)' + 
 | 
						|
        r'\s+(?P<descendants>\d+\.\d+)' + 
 | 
						|
        r'\s+(?:(?P<called>\d+)(?:\+(?P<called_self>\d+))?)?' + 
 | 
						|
        r'\s+(?P<name>\S.*?)' +
 | 
						|
        r'(?:\s+<cycle\s(?P<cycle>\d+)>)?' +
 | 
						|
        r'\s\[(\d+)\]$'
 | 
						|
    )
 | 
						|
 | 
						|
    _cg_parent_re = re.compile(
 | 
						|
        r'^\s+(?P<self>\d+\.\d+)?' + 
 | 
						|
        r'\s+(?P<descendants>\d+\.\d+)?' + 
 | 
						|
        r'\s+(?P<called>\d+)(?:/(?P<called_total>\d+))?' + 
 | 
						|
        r'\s+(?P<name>\S.*?)' +
 | 
						|
        r'(?:\s+<cycle\s(?P<cycle>\d+)>)?' +
 | 
						|
        r'\s\[(?P<index>\d+)\]$'
 | 
						|
    )
 | 
						|
 | 
						|
    _cg_child_re = _cg_parent_re
 | 
						|
 | 
						|
    _cg_cycle_header_re = re.compile(
 | 
						|
        r'^\[(?P<index>\d+)\]?' + 
 | 
						|
        r'\s+(?P<percentage_time>\d+\.\d+)' + 
 | 
						|
        r'\s+(?P<self>\d+\.\d+)' + 
 | 
						|
        r'\s+(?P<descendants>\d+\.\d+)' + 
 | 
						|
        r'\s+(?:(?P<called>\d+)(?:\+(?P<called_self>\d+))?)?' + 
 | 
						|
        r'\s+<cycle\s(?P<cycle>\d+)\sas\sa\swhole>' +
 | 
						|
        r'\s\[(\d+)\]$'
 | 
						|
    )
 | 
						|
 | 
						|
    _cg_cycle_member_re = re.compile(
 | 
						|
        r'^\s+(?P<self>\d+\.\d+)?' + 
 | 
						|
        r'\s+(?P<descendants>\d+\.\d+)?' + 
 | 
						|
        r'\s+(?P<called>\d+)(?:\+(?P<called_self>\d+))?' + 
 | 
						|
        r'\s+(?P<name>\S.*?)' +
 | 
						|
        r'(?:\s+<cycle\s(?P<cycle>\d+)>)?' +
 | 
						|
        r'\s\[(?P<index>\d+)\]$'
 | 
						|
    )
 | 
						|
 | 
						|
    _cg_sep_re = re.compile(r'^--+$')
 | 
						|
 | 
						|
    def parse_function_entry(self, lines):
 | 
						|
        parents = []
 | 
						|
        children = []
 | 
						|
 | 
						|
        while True:
 | 
						|
            if not lines:
 | 
						|
                sys.stderr.write('warning: unexpected end of entry\n')
 | 
						|
            line = lines.pop(0)
 | 
						|
            if line.startswith('['):
 | 
						|
                break
 | 
						|
        
 | 
						|
            # read function parent line
 | 
						|
            mo = self._cg_parent_re.match(line)
 | 
						|
            if not mo:
 | 
						|
                if self._cg_ignore_re.match(line):
 | 
						|
                    continue
 | 
						|
                sys.stderr.write('warning: unrecognized call graph entry: %r\n' % line)
 | 
						|
            else:
 | 
						|
                parent = self.translate(mo)
 | 
						|
                parents.append(parent)
 | 
						|
 | 
						|
        # read primary line
 | 
						|
        mo = self._cg_primary_re.match(line)
 | 
						|
        if not mo:
 | 
						|
            sys.stderr.write('warning: unrecognized call graph entry: %r\n' % line)
 | 
						|
            return
 | 
						|
        else:
 | 
						|
            function = self.translate(mo)
 | 
						|
 | 
						|
        while lines:
 | 
						|
            line = lines.pop(0)
 | 
						|
            
 | 
						|
            # read function subroutine line
 | 
						|
            mo = self._cg_child_re.match(line)
 | 
						|
            if not mo:
 | 
						|
                if self._cg_ignore_re.match(line):
 | 
						|
                    continue
 | 
						|
                sys.stderr.write('warning: unrecognized call graph entry: %r\n' % line)
 | 
						|
            else:
 | 
						|
                child = self.translate(mo)
 | 
						|
                children.append(child)
 | 
						|
        
 | 
						|
        function.parents = parents
 | 
						|
        function.children = children
 | 
						|
 | 
						|
        self.functions[function.index] = function
 | 
						|
 | 
						|
    def parse_cycle_entry(self, lines):
 | 
						|
 | 
						|
        # read cycle header line
 | 
						|
        line = lines[0]
 | 
						|
        mo = self._cg_cycle_header_re.match(line)
 | 
						|
        if not mo:
 | 
						|
            sys.stderr.write('warning: unrecognized call graph entry: %r\n' % line)
 | 
						|
            return
 | 
						|
        cycle = self.translate(mo)
 | 
						|
 | 
						|
        # read cycle member lines
 | 
						|
        cycle.functions = []
 | 
						|
        for line in lines[1:]:
 | 
						|
            mo = self._cg_cycle_member_re.match(line)
 | 
						|
            if not mo:
 | 
						|
                sys.stderr.write('warning: unrecognized call graph entry: %r\n' % line)
 | 
						|
                continue
 | 
						|
            call = self.translate(mo)
 | 
						|
            cycle.functions.append(call)
 | 
						|
        
 | 
						|
        self.cycles[cycle.cycle] = cycle
 | 
						|
 | 
						|
    def parse_cg_entry(self, lines):
 | 
						|
        if lines[0].startswith("["):
 | 
						|
            self.parse_cycle_entry(lines)
 | 
						|
        else:
 | 
						|
            self.parse_function_entry(lines)
 | 
						|
 | 
						|
    def parse_cg(self):
 | 
						|
        """Parse the call graph."""
 | 
						|
 | 
						|
        # skip call graph header
 | 
						|
        while not self._cg_header_re.match(self.readline()):
 | 
						|
            pass
 | 
						|
        line = self.readline()
 | 
						|
        while self._cg_header_re.match(line):
 | 
						|
            line = self.readline()
 | 
						|
 | 
						|
        # process call graph entries
 | 
						|
        entry_lines = []
 | 
						|
        while line != '\014': # form feed
 | 
						|
            if line and not line.isspace():
 | 
						|
                if self._cg_sep_re.match(line):
 | 
						|
                    self.parse_cg_entry(entry_lines)
 | 
						|
                    entry_lines = []
 | 
						|
                else:
 | 
						|
                    entry_lines.append(line)            
 | 
						|
            line = self.readline()
 | 
						|
    
 | 
						|
    def parse(self):
 | 
						|
        self.parse_cg()
 | 
						|
        self.fp.close()
 | 
						|
 | 
						|
        profile = Profile()
 | 
						|
        profile[TIME] = 0.0
 | 
						|
        
 | 
						|
        cycles = {}
 | 
						|
        for index in self.cycles.iterkeys():
 | 
						|
            cycles[index] = Cycle()
 | 
						|
 | 
						|
        for entry in self.functions.itervalues():
 | 
						|
            # populate the function
 | 
						|
            function = Function(entry.index, entry.name)
 | 
						|
            function[TIME] = entry.self
 | 
						|
            if entry.called is not None:
 | 
						|
                function.called = entry.called
 | 
						|
            if entry.called_self is not None:
 | 
						|
                call = Call(entry.index)
 | 
						|
                call[CALLS] = entry.called_self
 | 
						|
                function.called += entry.called_self
 | 
						|
            
 | 
						|
            # populate the function calls
 | 
						|
            for child in entry.children:
 | 
						|
                call = Call(child.index)
 | 
						|
                
 | 
						|
                assert child.called is not None
 | 
						|
                call[CALLS] = child.called
 | 
						|
 | 
						|
                if child.index not in self.functions:
 | 
						|
                    # NOTE: functions that were never called but were discovered by gprof's 
 | 
						|
                    # static call graph analysis dont have a call graph entry so we need
 | 
						|
                    # to add them here
 | 
						|
                    missing = Function(child.index, child.name)
 | 
						|
                    function[TIME] = 0.0
 | 
						|
                    function.called = 0
 | 
						|
                    profile.add_function(missing)
 | 
						|
 | 
						|
                function.add_call(call)
 | 
						|
 | 
						|
            profile.add_function(function)
 | 
						|
 | 
						|
            if entry.cycle is not None:
 | 
						|
                try:
 | 
						|
                    cycle = cycles[entry.cycle]
 | 
						|
                except KeyError:
 | 
						|
                    sys.stderr.write('warning: <cycle %u as a whole> entry missing\n' % entry.cycle) 
 | 
						|
                    cycle = Cycle()
 | 
						|
                    cycles[entry.cycle] = cycle
 | 
						|
                cycle.add_function(function)
 | 
						|
 | 
						|
            profile[TIME] = profile[TIME] + function[TIME]
 | 
						|
 | 
						|
        for cycle in cycles.itervalues():
 | 
						|
            profile.add_cycle(cycle)
 | 
						|
 | 
						|
        # Compute derived events
 | 
						|
        profile.validate()
 | 
						|
        profile.ratio(TIME_RATIO, TIME)
 | 
						|
        profile.call_ratios(CALLS)
 | 
						|
        profile.integrate(TOTAL_TIME, TIME)
 | 
						|
        profile.ratio(TOTAL_TIME_RATIO, TOTAL_TIME)
 | 
						|
 | 
						|
        return profile
 | 
						|
 | 
						|
 | 
						|
class CallgrindParser(LineParser):
 | 
						|
    """Parser for valgrind's callgrind tool.
 | 
						|
    
 | 
						|
    See also:
 | 
						|
    - http://valgrind.org/docs/manual/cl-format.html
 | 
						|
    """
 | 
						|
 | 
						|
    _call_re = re.compile('^calls=\s*(\d+)\s+((\d+|\+\d+|-\d+|\*)\s+)+$')
 | 
						|
 | 
						|
    def __init__(self, infile):
 | 
						|
        LineParser.__init__(self, infile)
 | 
						|
 | 
						|
        # Textual positions
 | 
						|
        self.position_ids = {}
 | 
						|
        self.positions = {}
 | 
						|
 | 
						|
        # Numeric positions
 | 
						|
        self.num_positions = 1
 | 
						|
        self.cost_positions = ['line']
 | 
						|
        self.last_positions = [0]
 | 
						|
 | 
						|
        # Events
 | 
						|
        self.num_events = 0
 | 
						|
        self.cost_events = []
 | 
						|
 | 
						|
        self.profile = Profile()
 | 
						|
        self.profile[SAMPLES] = 0
 | 
						|
 | 
						|
    def parse(self):
 | 
						|
        # read lookahead
 | 
						|
        self.readline()
 | 
						|
 | 
						|
        self.parse_key('version')
 | 
						|
        self.parse_key('creator')
 | 
						|
        self.parse_part()
 | 
						|
 | 
						|
        # compute derived data
 | 
						|
        self.profile.validate()
 | 
						|
        self.profile.find_cycles()
 | 
						|
        self.profile.ratio(TIME_RATIO, SAMPLES)
 | 
						|
        self.profile.call_ratios(CALLS)
 | 
						|
        self.profile.integrate(TOTAL_TIME_RATIO, TIME_RATIO)
 | 
						|
 | 
						|
        return self.profile
 | 
						|
 | 
						|
    def parse_part(self):
 | 
						|
        while self.parse_header_line():
 | 
						|
            pass
 | 
						|
        while self.parse_body_line():
 | 
						|
            pass
 | 
						|
        return True
 | 
						|
 | 
						|
    def parse_header_line(self):
 | 
						|
        return \
 | 
						|
            self.parse_empty() or \
 | 
						|
            self.parse_comment() or \
 | 
						|
            self.parse_part_detail() or \
 | 
						|
            self.parse_description() or \
 | 
						|
            self.parse_event_specification() or \
 | 
						|
            self.parse_cost_line_def() or \
 | 
						|
            self.parse_cost_summary()
 | 
						|
 | 
						|
    _detail_keys = set(('cmd', 'pid', 'thread', 'part'))
 | 
						|
 | 
						|
    def parse_part_detail(self):
 | 
						|
        return self.parse_keys(self._detail_keys)
 | 
						|
 | 
						|
    def parse_description(self):
 | 
						|
        return self.parse_key('desc') is not None
 | 
						|
 | 
						|
    def parse_event_specification(self):
 | 
						|
        event = self.parse_key('event')
 | 
						|
        if event is None:
 | 
						|
            return False
 | 
						|
        return True
 | 
						|
 | 
						|
    def parse_cost_line_def(self):
 | 
						|
        pair = self.parse_keys(('events', 'positions'))
 | 
						|
        if pair is None:
 | 
						|
            return False
 | 
						|
        key, value = pair
 | 
						|
        items = value.split()
 | 
						|
        if key == 'events':
 | 
						|
            self.num_events = len(items)
 | 
						|
            self.cost_events = items
 | 
						|
        if key == 'positions':
 | 
						|
            self.num_positions = len(items)
 | 
						|
            self.cost_positions = items
 | 
						|
            self.last_positions = [0]*self.num_positions
 | 
						|
        return True
 | 
						|
 | 
						|
    def parse_cost_summary(self):
 | 
						|
        pair = self.parse_keys(('summary', 'totals'))
 | 
						|
        if pair is None:
 | 
						|
            return False
 | 
						|
        return True
 | 
						|
 | 
						|
    def parse_body_line(self):
 | 
						|
        return \
 | 
						|
            self.parse_empty() or \
 | 
						|
            self.parse_comment() or \
 | 
						|
            self.parse_cost_line() or \
 | 
						|
            self.parse_position_spec() or \
 | 
						|
            self.parse_association_spec()
 | 
						|
 | 
						|
    _cost_re = re.compile(r'^(\d+|\+\d+|-\d+|\*)( \d+)+$')
 | 
						|
 | 
						|
    def parse_cost_line(self, calls=None):
 | 
						|
        line = self.lookahead()
 | 
						|
        mo = self._cost_re.match(line)
 | 
						|
        if not mo:
 | 
						|
            return False
 | 
						|
 | 
						|
        function = self.get_function()
 | 
						|
 | 
						|
        values = line.split(' ')
 | 
						|
        assert len(values) == self.num_positions + self.num_events
 | 
						|
 | 
						|
        positions = values[0 : self.num_positions]
 | 
						|
        events = values[self.num_positions : ]
 | 
						|
 | 
						|
        for i in range(self.num_positions):
 | 
						|
            position = positions[i]
 | 
						|
            if position == '*':
 | 
						|
                position = self.last_positions[i]
 | 
						|
            elif position[0] in '-+':
 | 
						|
                position = self.last_positions[i] + int(position)
 | 
						|
            else:
 | 
						|
                position = int(position)
 | 
						|
            self.last_positions[i] = position
 | 
						|
 | 
						|
        events = map(float, events)
 | 
						|
 | 
						|
        if calls is None:
 | 
						|
            function[SAMPLES] += events[0] 
 | 
						|
            self.profile[SAMPLES] += events[0]
 | 
						|
        else:
 | 
						|
            callee = self.get_callee()
 | 
						|
            callee.called += calls
 | 
						|
    
 | 
						|
            try:
 | 
						|
                call = function.calls[callee.id]
 | 
						|
            except KeyError:
 | 
						|
                call = Call(callee.id)
 | 
						|
                call[CALLS] = calls
 | 
						|
                call[SAMPLES] = events[0]
 | 
						|
                function.add_call(call)
 | 
						|
            else:
 | 
						|
                call[CALLS] += calls
 | 
						|
                call[SAMPLES] += events[0]
 | 
						|
 | 
						|
        self.consume()
 | 
						|
        return True
 | 
						|
 | 
						|
    def parse_association_spec(self):
 | 
						|
        line = self.lookahead()
 | 
						|
        if not line.startswith('calls='):
 | 
						|
            return False
 | 
						|
 | 
						|
        _, values = line.split('=', 1)
 | 
						|
        values = values.strip().split()
 | 
						|
        calls = int(values[0])
 | 
						|
        call_position = values[1:]
 | 
						|
        self.consume()
 | 
						|
 | 
						|
        self.parse_cost_line(calls)
 | 
						|
 | 
						|
        return True
 | 
						|
 | 
						|
    _position_re = re.compile('^(?P<position>c?(?:ob|fl|fi|fe|fn))=\s*(?:\((?P<id>\d+)\))?(?:\s*(?P<name>.+))?')
 | 
						|
 | 
						|
    _position_table_map = {
 | 
						|
        'ob': 'ob',
 | 
						|
        'fl': 'fl',
 | 
						|
        'fi': 'fl',
 | 
						|
        'fe': 'fl',
 | 
						|
        'fn': 'fn',
 | 
						|
        'cob': 'ob',
 | 
						|
        'cfl': 'fl',
 | 
						|
        'cfi': 'fl',
 | 
						|
        'cfe': 'fl',
 | 
						|
        'cfn': 'fn',
 | 
						|
    }
 | 
						|
 | 
						|
    _position_map = {
 | 
						|
        'ob': 'ob',
 | 
						|
        'fl': 'fl',
 | 
						|
        'fi': 'fl',
 | 
						|
        'fe': 'fl',
 | 
						|
        'fn': 'fn',
 | 
						|
        'cob': 'cob',
 | 
						|
        'cfl': 'cfl',
 | 
						|
        'cfi': 'cfl',
 | 
						|
        'cfe': 'cfl',
 | 
						|
        'cfn': 'cfn',
 | 
						|
    }
 | 
						|
 | 
						|
    def parse_position_spec(self):
 | 
						|
        line = self.lookahead()
 | 
						|
        mo = self._position_re.match(line)
 | 
						|
        if not mo:
 | 
						|
            return False
 | 
						|
 | 
						|
        position, id, name = mo.groups()
 | 
						|
        if id:
 | 
						|
            table = self._position_table_map[position]
 | 
						|
            if name:
 | 
						|
                self.position_ids[(table, id)] = name
 | 
						|
            else:
 | 
						|
                name = self.position_ids.get((table, id), '')
 | 
						|
        self.positions[self._position_map[position]] = name
 | 
						|
        self.consume()
 | 
						|
        return True
 | 
						|
 | 
						|
    def parse_empty(self):
 | 
						|
        line = self.lookahead()
 | 
						|
        if line.strip():
 | 
						|
            return False
 | 
						|
        self.consume()
 | 
						|
        return True
 | 
						|
 | 
						|
    def parse_comment(self):
 | 
						|
        line = self.lookahead()
 | 
						|
        if not line.startswith('#'):
 | 
						|
            return False
 | 
						|
        self.consume()
 | 
						|
        return True
 | 
						|
 | 
						|
    _key_re = re.compile(r'^(\w+):')
 | 
						|
 | 
						|
    def parse_key(self, key):
 | 
						|
        pair = self.parse_keys((key,))
 | 
						|
        if not pair:
 | 
						|
            return None
 | 
						|
        key, value = pair
 | 
						|
        return value
 | 
						|
        line = self.lookahead()
 | 
						|
        mo = self._key_re.match(line)
 | 
						|
        if not mo:
 | 
						|
            return None
 | 
						|
        key, value = line.split(':', 1)
 | 
						|
        if key not in keys:
 | 
						|
            return None
 | 
						|
        value = value.strip()
 | 
						|
        self.consume()
 | 
						|
        return key, value
 | 
						|
 | 
						|
    def parse_keys(self, keys):
 | 
						|
        line = self.lookahead()
 | 
						|
        mo = self._key_re.match(line)
 | 
						|
        if not mo:
 | 
						|
            return None
 | 
						|
        key, value = line.split(':', 1)
 | 
						|
        if key not in keys:
 | 
						|
            return None
 | 
						|
        value = value.strip()
 | 
						|
        self.consume()
 | 
						|
        return key, value
 | 
						|
 | 
						|
    def make_function(self, module, filename, name):
 | 
						|
        # FIXME: module and filename are not being tracked reliably
 | 
						|
        #id = '|'.join((module, filename, name))
 | 
						|
        id = name
 | 
						|
        try:
 | 
						|
            function = self.profile.functions[id]
 | 
						|
        except KeyError:
 | 
						|
            function = Function(id, name)
 | 
						|
            function[SAMPLES] = 0
 | 
						|
            function.called = 0
 | 
						|
            self.profile.add_function(function)
 | 
						|
        return function
 | 
						|
 | 
						|
    def get_function(self):
 | 
						|
        module = self.positions.get('ob', '')
 | 
						|
        filename = self.positions.get('fl', '') 
 | 
						|
        function = self.positions.get('fn', '') 
 | 
						|
        return self.make_function(module, filename, function)
 | 
						|
 | 
						|
    def get_callee(self):
 | 
						|
        module = self.positions.get('cob', '')
 | 
						|
        filename = self.positions.get('cfi', '') 
 | 
						|
        function = self.positions.get('cfn', '') 
 | 
						|
        return self.make_function(module, filename, function)
 | 
						|
 | 
						|
 | 
						|
class OprofileParser(LineParser):
 | 
						|
    """Parser for oprofile callgraph output.
 | 
						|
    
 | 
						|
    See also:
 | 
						|
    - http://oprofile.sourceforge.net/doc/opreport.html#opreport-callgraph
 | 
						|
    """
 | 
						|
 | 
						|
    _fields_re = {
 | 
						|
        'samples': r'(\d+)',
 | 
						|
        '%': r'(\S+)',
 | 
						|
        'linenr info': r'(?P<source>\(no location information\)|\S+:\d+)',
 | 
						|
        'image name': r'(?P<image>\S+(?:\s\(tgid:[^)]*\))?)',
 | 
						|
        'app name': r'(?P<application>\S+)',
 | 
						|
        'symbol name': r'(?P<symbol>\(no symbols\)|.+?)',
 | 
						|
    }
 | 
						|
 | 
						|
    def __init__(self, infile):
 | 
						|
        LineParser.__init__(self, infile)
 | 
						|
        self.entries = {}
 | 
						|
        self.entry_re = None
 | 
						|
 | 
						|
    def add_entry(self, callers, function, callees):
 | 
						|
        try:
 | 
						|
            entry = self.entries[function.id]
 | 
						|
        except KeyError:
 | 
						|
            self.entries[function.id] = (callers, function, callees)
 | 
						|
        else:
 | 
						|
            callers_total, function_total, callees_total = entry
 | 
						|
            self.update_subentries_dict(callers_total, callers)
 | 
						|
            function_total.samples += function.samples
 | 
						|
            self.update_subentries_dict(callees_total, callees)
 | 
						|
    
 | 
						|
    def update_subentries_dict(self, totals, partials):
 | 
						|
        for partial in partials.itervalues():
 | 
						|
            try:
 | 
						|
                total = totals[partial.id]
 | 
						|
            except KeyError:
 | 
						|
                totals[partial.id] = partial
 | 
						|
            else:
 | 
						|
                total.samples += partial.samples
 | 
						|
        
 | 
						|
    def parse(self):
 | 
						|
        # read lookahead
 | 
						|
        self.readline()
 | 
						|
 | 
						|
        self.parse_header()
 | 
						|
        while self.lookahead():
 | 
						|
            self.parse_entry()
 | 
						|
 | 
						|
        profile = Profile()
 | 
						|
 | 
						|
        reverse_call_samples = {}
 | 
						|
        
 | 
						|
        # populate the profile
 | 
						|
        profile[SAMPLES] = 0
 | 
						|
        for _callers, _function, _callees in self.entries.itervalues():
 | 
						|
            function = Function(_function.id, _function.name)
 | 
						|
            function[SAMPLES] = _function.samples
 | 
						|
            profile.add_function(function)
 | 
						|
            profile[SAMPLES] += _function.samples
 | 
						|
 | 
						|
            if _function.application:
 | 
						|
                function.process = os.path.basename(_function.application)
 | 
						|
            if _function.image:
 | 
						|
                function.module = os.path.basename(_function.image)
 | 
						|
 | 
						|
            total_callee_samples = 0
 | 
						|
            for _callee in _callees.itervalues():
 | 
						|
                total_callee_samples += _callee.samples
 | 
						|
 | 
						|
            for _callee in _callees.itervalues():
 | 
						|
                if not _callee.self:
 | 
						|
                    call = Call(_callee.id)
 | 
						|
                    call[SAMPLES2] = _callee.samples
 | 
						|
                    function.add_call(call)
 | 
						|
                
 | 
						|
        # compute derived data
 | 
						|
        profile.validate()
 | 
						|
        profile.find_cycles()
 | 
						|
        profile.ratio(TIME_RATIO, SAMPLES)
 | 
						|
        profile.call_ratios(SAMPLES2)
 | 
						|
        profile.integrate(TOTAL_TIME_RATIO, TIME_RATIO)
 | 
						|
 | 
						|
        return profile
 | 
						|
 | 
						|
    def parse_header(self):
 | 
						|
        while not self.match_header():
 | 
						|
            self.consume()
 | 
						|
        line = self.lookahead()
 | 
						|
        fields = re.split(r'\s\s+', line)
 | 
						|
        entry_re = r'^\s*' + r'\s+'.join([self._fields_re[field] for field in fields]) + r'(?P<self>\s+\[self\])?$'
 | 
						|
        self.entry_re = re.compile(entry_re)
 | 
						|
        self.skip_separator()
 | 
						|
 | 
						|
    def parse_entry(self):
 | 
						|
        callers = self.parse_subentries()
 | 
						|
        if self.match_primary():
 | 
						|
            function = self.parse_subentry()
 | 
						|
            if function is not None:
 | 
						|
                callees = self.parse_subentries()
 | 
						|
                self.add_entry(callers, function, callees)
 | 
						|
        self.skip_separator()
 | 
						|
 | 
						|
    def parse_subentries(self):
 | 
						|
        subentries = {}
 | 
						|
        while self.match_secondary():
 | 
						|
            subentry = self.parse_subentry()
 | 
						|
            subentries[subentry.id] = subentry
 | 
						|
        return subentries
 | 
						|
 | 
						|
    def parse_subentry(self):
 | 
						|
        entry = Struct()
 | 
						|
        line = self.consume()
 | 
						|
        mo = self.entry_re.match(line)
 | 
						|
        if not mo:
 | 
						|
            raise ParseError('failed to parse', line)
 | 
						|
        fields = mo.groupdict()
 | 
						|
        entry.samples = int(mo.group(1))
 | 
						|
        if 'source' in fields and fields['source'] != '(no location information)':
 | 
						|
            source = fields['source']
 | 
						|
            filename, lineno = source.split(':')
 | 
						|
            entry.filename = filename
 | 
						|
            entry.lineno = int(lineno)
 | 
						|
        else:
 | 
						|
            source = ''
 | 
						|
            entry.filename = None
 | 
						|
            entry.lineno = None
 | 
						|
        entry.image = fields.get('image', '')
 | 
						|
        entry.application = fields.get('application', '')
 | 
						|
        if 'symbol' in fields and fields['symbol'] != '(no symbols)':
 | 
						|
            entry.symbol = fields['symbol']
 | 
						|
        else:
 | 
						|
            entry.symbol = ''
 | 
						|
        if entry.symbol.startswith('"') and entry.symbol.endswith('"'):
 | 
						|
            entry.symbol = entry.symbol[1:-1]
 | 
						|
        entry.id = ':'.join((entry.application, entry.image, source, entry.symbol))
 | 
						|
        entry.self = fields.get('self', None) != None
 | 
						|
        if entry.self:
 | 
						|
            entry.id += ':self'
 | 
						|
        if entry.symbol:
 | 
						|
            entry.name = entry.symbol
 | 
						|
        else:
 | 
						|
            entry.name = entry.image
 | 
						|
        return entry
 | 
						|
 | 
						|
    def skip_separator(self):
 | 
						|
        while not self.match_separator():
 | 
						|
            self.consume()
 | 
						|
        self.consume()
 | 
						|
 | 
						|
    def match_header(self):
 | 
						|
        line = self.lookahead()
 | 
						|
        return line.startswith('samples')
 | 
						|
 | 
						|
    def match_separator(self):
 | 
						|
        line = self.lookahead()
 | 
						|
        return line == '-'*len(line)
 | 
						|
 | 
						|
    def match_primary(self):
 | 
						|
        line = self.lookahead()
 | 
						|
        return not line[:1].isspace()
 | 
						|
    
 | 
						|
    def match_secondary(self):
 | 
						|
        line = self.lookahead()
 | 
						|
        return line[:1].isspace()
 | 
						|
 | 
						|
 | 
						|
class SysprofParser(XmlParser):
 | 
						|
 | 
						|
    def __init__(self, stream):
 | 
						|
        XmlParser.__init__(self, stream)
 | 
						|
 | 
						|
    def parse(self):
 | 
						|
        objects = {}
 | 
						|
        nodes = {}
 | 
						|
 | 
						|
        self.element_start('profile')
 | 
						|
        while self.token.type == XML_ELEMENT_START:
 | 
						|
            if self.token.name_or_data == 'objects':
 | 
						|
                assert not objects
 | 
						|
                objects = self.parse_items('objects')
 | 
						|
            elif self.token.name_or_data == 'nodes':
 | 
						|
                assert not nodes
 | 
						|
                nodes = self.parse_items('nodes')
 | 
						|
            else:
 | 
						|
                self.parse_value(self.token.name_or_data)
 | 
						|
        self.element_end('profile')
 | 
						|
 | 
						|
        return self.build_profile(objects, nodes)
 | 
						|
 | 
						|
    def parse_items(self, name):
 | 
						|
        assert name[-1] == 's'
 | 
						|
        items = {}
 | 
						|
        self.element_start(name)
 | 
						|
        while self.token.type == XML_ELEMENT_START:
 | 
						|
            id, values = self.parse_item(name[:-1])
 | 
						|
            assert id not in items
 | 
						|
            items[id] = values
 | 
						|
        self.element_end(name)
 | 
						|
        return items
 | 
						|
 | 
						|
    def parse_item(self, name):
 | 
						|
        attrs = self.element_start(name)
 | 
						|
        id = int(attrs['id'])
 | 
						|
        values = self.parse_values()
 | 
						|
        self.element_end(name)
 | 
						|
        return id, values
 | 
						|
 | 
						|
    def parse_values(self):
 | 
						|
        values = {}
 | 
						|
        while self.token.type == XML_ELEMENT_START:
 | 
						|
            name = self.token.name_or_data
 | 
						|
            value = self.parse_value(name)
 | 
						|
            assert name not in values
 | 
						|
            values[name] = value
 | 
						|
        return values
 | 
						|
 | 
						|
    def parse_value(self, tag):
 | 
						|
        self.element_start(tag)
 | 
						|
        value = self.character_data()
 | 
						|
        self.element_end(tag)
 | 
						|
        if value.isdigit():
 | 
						|
            return int(value)
 | 
						|
        if value.startswith('"') and value.endswith('"'):
 | 
						|
            return value[1:-1]
 | 
						|
        return value
 | 
						|
 | 
						|
    def build_profile(self, objects, nodes):
 | 
						|
        profile = Profile()
 | 
						|
        
 | 
						|
        profile[SAMPLES] = 0
 | 
						|
        for id, object in objects.iteritems():
 | 
						|
            # Ignore fake objects (process names, modules, "Everything", "kernel", etc.)
 | 
						|
            if object['self'] == 0:
 | 
						|
                continue
 | 
						|
 | 
						|
            function = Function(id, object['name'])
 | 
						|
            function[SAMPLES] = object['self']
 | 
						|
            profile.add_function(function)
 | 
						|
            profile[SAMPLES] += function[SAMPLES]
 | 
						|
 | 
						|
        for id, node in nodes.iteritems():
 | 
						|
            # Ignore fake calls
 | 
						|
            if node['self'] == 0:
 | 
						|
                continue
 | 
						|
 | 
						|
            # Find a non-ignored parent
 | 
						|
            parent_id = node['parent']
 | 
						|
            while parent_id != 0:
 | 
						|
                parent = nodes[parent_id]
 | 
						|
                caller_id = parent['object']
 | 
						|
                if objects[caller_id]['self'] != 0:
 | 
						|
                    break
 | 
						|
                parent_id = parent['parent']
 | 
						|
            if parent_id == 0:
 | 
						|
                continue
 | 
						|
 | 
						|
            callee_id = node['object']
 | 
						|
 | 
						|
            assert objects[caller_id]['self']
 | 
						|
            assert objects[callee_id]['self']
 | 
						|
 | 
						|
            function = profile.functions[caller_id]
 | 
						|
 | 
						|
            samples = node['self']
 | 
						|
            try:
 | 
						|
                call = function.calls[callee_id]
 | 
						|
            except KeyError:
 | 
						|
                call = Call(callee_id)
 | 
						|
                call[SAMPLES2] = samples
 | 
						|
                function.add_call(call)
 | 
						|
            else:
 | 
						|
                call[SAMPLES2] += samples
 | 
						|
 | 
						|
        # Compute derived events
 | 
						|
        profile.validate()
 | 
						|
        profile.find_cycles()
 | 
						|
        profile.ratio(TIME_RATIO, SAMPLES)
 | 
						|
        profile.call_ratios(SAMPLES2)
 | 
						|
        profile.integrate(TOTAL_TIME_RATIO, TIME_RATIO)
 | 
						|
 | 
						|
        return profile
 | 
						|
 | 
						|
 | 
						|
class SharkParser(LineParser):
 | 
						|
    """Parser for MacOSX Shark output.
 | 
						|
 | 
						|
    Author: tom@dbservice.com
 | 
						|
    """
 | 
						|
 | 
						|
    def __init__(self, infile):
 | 
						|
        LineParser.__init__(self, infile)
 | 
						|
        self.stack = []
 | 
						|
        self.entries = {}
 | 
						|
 | 
						|
    def add_entry(self, function):
 | 
						|
        try:
 | 
						|
            entry = self.entries[function.id]
 | 
						|
        except KeyError:
 | 
						|
            self.entries[function.id] = (function, { })
 | 
						|
        else:
 | 
						|
            function_total, callees_total = entry
 | 
						|
            function_total.samples += function.samples
 | 
						|
    
 | 
						|
    def add_callee(self, function, callee):
 | 
						|
        func, callees = self.entries[function.id]
 | 
						|
        try:
 | 
						|
            entry = callees[callee.id]
 | 
						|
        except KeyError:
 | 
						|
            callees[callee.id] = callee
 | 
						|
        else:
 | 
						|
            entry.samples += callee.samples
 | 
						|
        
 | 
						|
    def parse(self):
 | 
						|
        self.readline()
 | 
						|
        self.readline()
 | 
						|
        self.readline()
 | 
						|
        self.readline()
 | 
						|
 | 
						|
        match = re.compile(r'(?P<prefix>[|+ ]*)(?P<samples>\d+), (?P<symbol>[^,]+), (?P<image>.*)')
 | 
						|
 | 
						|
        while self.lookahead():
 | 
						|
            line = self.consume()
 | 
						|
            mo = match.match(line)
 | 
						|
            if not mo:
 | 
						|
                raise ParseError('failed to parse', line)
 | 
						|
 | 
						|
            fields = mo.groupdict()
 | 
						|
            prefix = len(fields.get('prefix', 0)) / 2 - 1
 | 
						|
 | 
						|
            symbol = str(fields.get('symbol', 0))
 | 
						|
            image = str(fields.get('image', 0))
 | 
						|
 | 
						|
            entry = Struct()
 | 
						|
            entry.id = ':'.join([symbol, image])
 | 
						|
            entry.samples = int(fields.get('samples', 0))
 | 
						|
 | 
						|
            entry.name = symbol
 | 
						|
            entry.image = image
 | 
						|
 | 
						|
            # adjust the callstack
 | 
						|
            if prefix < len(self.stack):
 | 
						|
                del self.stack[prefix:]
 | 
						|
 | 
						|
            if prefix == len(self.stack):
 | 
						|
                self.stack.append(entry)
 | 
						|
 | 
						|
            # if the callstack has had an entry, it's this functions caller
 | 
						|
            if prefix > 0:
 | 
						|
                self.add_callee(self.stack[prefix - 1], entry)
 | 
						|
                
 | 
						|
            self.add_entry(entry)
 | 
						|
                
 | 
						|
        profile = Profile()
 | 
						|
        profile[SAMPLES] = 0
 | 
						|
        for _function, _callees in self.entries.itervalues():
 | 
						|
            function = Function(_function.id, _function.name)
 | 
						|
            function[SAMPLES] = _function.samples
 | 
						|
            profile.add_function(function)
 | 
						|
            profile[SAMPLES] += _function.samples
 | 
						|
 | 
						|
            if _function.image:
 | 
						|
                function.module = os.path.basename(_function.image)
 | 
						|
 | 
						|
            for _callee in _callees.itervalues():
 | 
						|
                call = Call(_callee.id)
 | 
						|
                call[SAMPLES] = _callee.samples
 | 
						|
                function.add_call(call)
 | 
						|
                
 | 
						|
        # compute derived data
 | 
						|
        profile.validate()
 | 
						|
        profile.find_cycles()
 | 
						|
        profile.ratio(TIME_RATIO, SAMPLES)
 | 
						|
        profile.call_ratios(SAMPLES)
 | 
						|
        profile.integrate(TOTAL_TIME_RATIO, TIME_RATIO)
 | 
						|
 | 
						|
        return profile
 | 
						|
 | 
						|
 | 
						|
class XPerfParser(Parser):
 | 
						|
    """Parser for CSVs generted by XPerf, from Microsoft Windows Performance Tools.
 | 
						|
    """
 | 
						|
 | 
						|
    def __init__(self, stream):
 | 
						|
        Parser.__init__(self)
 | 
						|
        self.stream = stream
 | 
						|
        self.profile = Profile()
 | 
						|
        self.profile[SAMPLES] = 0
 | 
						|
        self.column = {}
 | 
						|
 | 
						|
    def parse(self):
 | 
						|
        import csv
 | 
						|
        reader = csv.reader(
 | 
						|
            self.stream, 
 | 
						|
            delimiter = ',',
 | 
						|
            quotechar = None,
 | 
						|
            escapechar = None,
 | 
						|
            doublequote = False,
 | 
						|
            skipinitialspace = True,
 | 
						|
            lineterminator = '\r\n',
 | 
						|
            quoting = csv.QUOTE_NONE)
 | 
						|
        it = iter(reader)
 | 
						|
        row = reader.next()
 | 
						|
        self.parse_header(row)
 | 
						|
        for row in it:
 | 
						|
            self.parse_row(row)
 | 
						|
                
 | 
						|
        # compute derived data
 | 
						|
        self.profile.validate()
 | 
						|
        self.profile.find_cycles()
 | 
						|
        self.profile.ratio(TIME_RATIO, SAMPLES)
 | 
						|
        self.profile.call_ratios(SAMPLES2)
 | 
						|
        self.profile.integrate(TOTAL_TIME_RATIO, TIME_RATIO)
 | 
						|
 | 
						|
        return self.profile
 | 
						|
 | 
						|
    def parse_header(self, row):
 | 
						|
        for column in range(len(row)):
 | 
						|
            name = row[column]
 | 
						|
            assert name not in self.column
 | 
						|
            self.column[name] = column
 | 
						|
 | 
						|
    def parse_row(self, row):
 | 
						|
        fields = {}
 | 
						|
        for name, column in self.column.iteritems():
 | 
						|
            value = row[column]
 | 
						|
            for factory in int, float:
 | 
						|
                try:
 | 
						|
                    value = factory(value)
 | 
						|
                except ValueError:
 | 
						|
                    pass
 | 
						|
                else:
 | 
						|
                    break
 | 
						|
            fields[name] = value
 | 
						|
        
 | 
						|
        process = fields['Process Name']
 | 
						|
        symbol = fields['Module'] + '!' + fields['Function']
 | 
						|
        weight = fields['Weight']
 | 
						|
        count = fields['Count']
 | 
						|
 | 
						|
        function = self.get_function(process, symbol)
 | 
						|
        function[SAMPLES] += weight * count
 | 
						|
        self.profile[SAMPLES] += weight * count
 | 
						|
 | 
						|
        stack = fields['Stack']
 | 
						|
        if stack != '?':
 | 
						|
            stack = stack.split('/')
 | 
						|
            assert stack[0] == '[Root]'
 | 
						|
            if stack[-1] != symbol:
 | 
						|
                # XXX: some cases the sampled function does not appear in the stack
 | 
						|
                stack.append(symbol)
 | 
						|
            caller = None
 | 
						|
            for symbol in stack[1:]:
 | 
						|
                callee = self.get_function(process, symbol)
 | 
						|
                if caller is not None:
 | 
						|
                    try:
 | 
						|
                        call = caller.calls[callee.id]
 | 
						|
                    except KeyError:
 | 
						|
                        call = Call(callee.id)
 | 
						|
                        call[SAMPLES2] = count
 | 
						|
                        caller.add_call(call)
 | 
						|
                    else:
 | 
						|
                        call[SAMPLES2] += count
 | 
						|
                caller = callee
 | 
						|
 | 
						|
    def get_function(self, process, symbol):
 | 
						|
        function_id = process + '!' + symbol
 | 
						|
 | 
						|
        try:
 | 
						|
            function = self.profile.functions[function_id]
 | 
						|
        except KeyError:
 | 
						|
            module, name = symbol.split('!')
 | 
						|
            function = Function(function_id, name)
 | 
						|
            function.process = process
 | 
						|
            function.module = module
 | 
						|
            function[SAMPLES] = 0
 | 
						|
            self.profile.add_function(function)
 | 
						|
 | 
						|
        return function
 | 
						|
 | 
						|
 | 
						|
class SleepyParser(Parser):
 | 
						|
    """Parser for GNU gprof output.
 | 
						|
 | 
						|
    See also:
 | 
						|
    - http://www.codersnotes.com/sleepy/
 | 
						|
    - http://sleepygraph.sourceforge.net/
 | 
						|
    """
 | 
						|
 | 
						|
    def __init__(self, filename):
 | 
						|
        Parser.__init__(self)
 | 
						|
 | 
						|
        from zipfile import ZipFile
 | 
						|
 | 
						|
        self.database = ZipFile(filename)
 | 
						|
 | 
						|
        self.symbols = {}
 | 
						|
        self.calls = {}
 | 
						|
 | 
						|
        self.profile = Profile()
 | 
						|
    
 | 
						|
    _symbol_re = re.compile(
 | 
						|
        r'^(?P<id>\w+)' + 
 | 
						|
        r'\s+"(?P<module>[^"]*)"' + 
 | 
						|
        r'\s+"(?P<procname>[^"]*)"' + 
 | 
						|
        r'\s+"(?P<sourcefile>[^"]*)"' + 
 | 
						|
        r'\s+(?P<sourceline>\d+)$'
 | 
						|
    )
 | 
						|
 | 
						|
    def parse_symbols(self):
 | 
						|
        lines = self.database.read('symbols.txt').splitlines()
 | 
						|
        for line in lines:
 | 
						|
            mo = self._symbol_re.match(line)
 | 
						|
            if mo:
 | 
						|
                symbol_id, module, procname, sourcefile, sourceline = mo.groups()
 | 
						|
    
 | 
						|
                function_id = ':'.join([module, procname])
 | 
						|
 | 
						|
                try:
 | 
						|
                    function = self.profile.functions[function_id]
 | 
						|
                except KeyError:
 | 
						|
                    function = Function(function_id, procname)
 | 
						|
                    function.module = module
 | 
						|
                    function[SAMPLES] = 0
 | 
						|
                    self.profile.add_function(function)
 | 
						|
 | 
						|
                self.symbols[symbol_id] = function
 | 
						|
 | 
						|
    def parse_callstacks(self):
 | 
						|
        lines = self.database.read("callstacks.txt").splitlines()
 | 
						|
        for line in lines:
 | 
						|
            fields = line.split()
 | 
						|
            samples = int(fields[0])
 | 
						|
            callstack = fields[1:]
 | 
						|
 | 
						|
            callstack = [self.symbols[symbol_id] for symbol_id in callstack]
 | 
						|
 | 
						|
            callee = callstack[0]
 | 
						|
 | 
						|
            callee[SAMPLES] += samples
 | 
						|
            self.profile[SAMPLES] += samples
 | 
						|
            
 | 
						|
            for caller in callstack[1:]:
 | 
						|
                try:
 | 
						|
                    call = caller.calls[callee.id]
 | 
						|
                except KeyError:
 | 
						|
                    call = Call(callee.id)
 | 
						|
                    call[SAMPLES2] = samples
 | 
						|
                    caller.add_call(call)
 | 
						|
                else:
 | 
						|
                    call[SAMPLES2] += samples
 | 
						|
 | 
						|
                callee = caller
 | 
						|
 | 
						|
    def parse(self):
 | 
						|
        profile = self.profile
 | 
						|
        profile[SAMPLES] = 0
 | 
						|
 | 
						|
        self.parse_symbols()
 | 
						|
        self.parse_callstacks()
 | 
						|
 | 
						|
        # Compute derived events
 | 
						|
        profile.validate()
 | 
						|
        profile.find_cycles()
 | 
						|
        profile.ratio(TIME_RATIO, SAMPLES)
 | 
						|
        profile.call_ratios(SAMPLES2)
 | 
						|
        profile.integrate(TOTAL_TIME_RATIO, TIME_RATIO)
 | 
						|
 | 
						|
        return profile
 | 
						|
 | 
						|
 | 
						|
class AQtimeTable:
 | 
						|
 | 
						|
    def __init__(self, name, fields):
 | 
						|
        self.name = name
 | 
						|
 | 
						|
        self.fields = fields
 | 
						|
        self.field_column = {}
 | 
						|
        for column in range(len(fields)):
 | 
						|
            self.field_column[fields[column]] = column
 | 
						|
        self.rows = []
 | 
						|
 | 
						|
    def __len__(self):
 | 
						|
        return len(self.rows)
 | 
						|
 | 
						|
    def __iter__(self):
 | 
						|
        for values, children in self.rows:
 | 
						|
            fields = {}
 | 
						|
            for name, value in zip(self.fields, values):
 | 
						|
                fields[name] = value
 | 
						|
            children = dict([(child.name, child) for child in children])
 | 
						|
            yield fields, children
 | 
						|
        raise StopIteration
 | 
						|
 | 
						|
    def add_row(self, values, children=()):
 | 
						|
        self.rows.append((values, children))
 | 
						|
 | 
						|
 | 
						|
class AQtimeParser(XmlParser):
 | 
						|
 | 
						|
    def __init__(self, stream):
 | 
						|
        XmlParser.__init__(self, stream)
 | 
						|
        self.tables = {}
 | 
						|
 | 
						|
    def parse(self):
 | 
						|
        self.element_start('AQtime_Results')
 | 
						|
        self.parse_headers()
 | 
						|
        results = self.parse_results()
 | 
						|
        self.element_end('AQtime_Results')
 | 
						|
        return self.build_profile(results) 
 | 
						|
 | 
						|
    def parse_headers(self):
 | 
						|
        self.element_start('HEADERS')
 | 
						|
        while self.token.type == XML_ELEMENT_START:
 | 
						|
            self.parse_table_header()
 | 
						|
        self.element_end('HEADERS')
 | 
						|
 | 
						|
    def parse_table_header(self):
 | 
						|
        attrs = self.element_start('TABLE_HEADER')
 | 
						|
        name = attrs['NAME']
 | 
						|
        id = int(attrs['ID'])
 | 
						|
        field_types = []
 | 
						|
        field_names = []
 | 
						|
        while self.token.type == XML_ELEMENT_START:
 | 
						|
            field_type, field_name = self.parse_table_field()
 | 
						|
            field_types.append(field_type)
 | 
						|
            field_names.append(field_name)
 | 
						|
        self.element_end('TABLE_HEADER')
 | 
						|
        self.tables[id] = name, field_types, field_names
 | 
						|
 | 
						|
    def parse_table_field(self):
 | 
						|
        attrs = self.element_start('TABLE_FIELD')
 | 
						|
        type = attrs['TYPE']
 | 
						|
        name = self.character_data()
 | 
						|
        self.element_end('TABLE_FIELD')
 | 
						|
        return type, name
 | 
						|
 | 
						|
    def parse_results(self):
 | 
						|
        self.element_start('RESULTS')
 | 
						|
        table = self.parse_data()
 | 
						|
        self.element_end('RESULTS')
 | 
						|
        return table
 | 
						|
 | 
						|
    def parse_data(self):
 | 
						|
        rows = []
 | 
						|
        attrs = self.element_start('DATA')
 | 
						|
        table_id = int(attrs['TABLE_ID'])
 | 
						|
        table_name, field_types, field_names = self.tables[table_id]
 | 
						|
        table = AQtimeTable(table_name, field_names)
 | 
						|
        while self.token.type == XML_ELEMENT_START:
 | 
						|
            row, children = self.parse_row(field_types)
 | 
						|
            table.add_row(row, children)
 | 
						|
        self.element_end('DATA')
 | 
						|
        return table
 | 
						|
 | 
						|
    def parse_row(self, field_types):
 | 
						|
        row = [None]*len(field_types)
 | 
						|
        children = []
 | 
						|
        self.element_start('ROW')
 | 
						|
        while self.token.type == XML_ELEMENT_START:
 | 
						|
            if self.token.name_or_data == 'FIELD':
 | 
						|
                field_id, field_value = self.parse_field(field_types)
 | 
						|
                row[field_id] = field_value
 | 
						|
            elif self.token.name_or_data == 'CHILDREN':
 | 
						|
                children = self.parse_children()
 | 
						|
            else:
 | 
						|
                raise XmlTokenMismatch("<FIELD ...> or <CHILDREN ...>", self.token)
 | 
						|
        self.element_end('ROW')
 | 
						|
        return row, children
 | 
						|
 | 
						|
    def parse_field(self, field_types):
 | 
						|
        attrs = self.element_start('FIELD')
 | 
						|
        id = int(attrs['ID'])
 | 
						|
        type = field_types[id]
 | 
						|
        value = self.character_data()
 | 
						|
        if type == 'Integer':
 | 
						|
            value = int(value)
 | 
						|
        elif type == 'Float':
 | 
						|
            value = float(value)
 | 
						|
        elif type == 'Address':
 | 
						|
            value = int(value)
 | 
						|
        elif type == 'String':
 | 
						|
            pass
 | 
						|
        else:
 | 
						|
            assert False
 | 
						|
        self.element_end('FIELD')
 | 
						|
        return id, value
 | 
						|
 | 
						|
    def parse_children(self):
 | 
						|
        children = []
 | 
						|
        self.element_start('CHILDREN')
 | 
						|
        while self.token.type == XML_ELEMENT_START:
 | 
						|
            table = self.parse_data()
 | 
						|
            assert table.name not in children
 | 
						|
            children.append(table)
 | 
						|
        self.element_end('CHILDREN')
 | 
						|
        return children
 | 
						|
 | 
						|
    def build_profile(self, results):
 | 
						|
        assert results.name == 'Routines'
 | 
						|
        profile = Profile()
 | 
						|
        profile[TIME] = 0.0
 | 
						|
        for fields, tables in results:
 | 
						|
            function = self.build_function(fields)
 | 
						|
            children = tables['Children']
 | 
						|
            for fields, _ in children:
 | 
						|
                call = self.build_call(fields)
 | 
						|
                function.add_call(call)
 | 
						|
            profile.add_function(function)
 | 
						|
            profile[TIME] = profile[TIME] + function[TIME]
 | 
						|
        profile[TOTAL_TIME] = profile[TIME]
 | 
						|
        profile.ratio(TOTAL_TIME_RATIO, TOTAL_TIME)
 | 
						|
        return profile
 | 
						|
    
 | 
						|
    def build_function(self, fields):
 | 
						|
        function = Function(self.build_id(fields), self.build_name(fields))
 | 
						|
        function[TIME] = fields['Time']
 | 
						|
        function[TOTAL_TIME] = fields['Time with Children']
 | 
						|
        #function[TIME_RATIO] = fields['% Time']/100.0
 | 
						|
        #function[TOTAL_TIME_RATIO] = fields['% with Children']/100.0
 | 
						|
        return function
 | 
						|
 | 
						|
    def build_call(self, fields):
 | 
						|
        call = Call(self.build_id(fields))
 | 
						|
        call[TIME] = fields['Time']
 | 
						|
        call[TOTAL_TIME] = fields['Time with Children']
 | 
						|
        #call[TIME_RATIO] = fields['% Time']/100.0
 | 
						|
        #call[TOTAL_TIME_RATIO] = fields['% with Children']/100.0
 | 
						|
        return call
 | 
						|
 | 
						|
    def build_id(self, fields):
 | 
						|
        return ':'.join([fields['Module Name'], fields['Unit Name'], fields['Routine Name']])
 | 
						|
 | 
						|
    def build_name(self, fields):
 | 
						|
        # TODO: use more fields
 | 
						|
        return fields['Routine Name']
 | 
						|
 | 
						|
 | 
						|
class PstatsParser:
 | 
						|
    """Parser python profiling statistics saved with te pstats module."""
 | 
						|
 | 
						|
    def __init__(self, *filename):
 | 
						|
        import pstats
 | 
						|
        try:
 | 
						|
            self.stats = pstats.Stats(*filename)
 | 
						|
        except ValueError:
 | 
						|
            import hotshot.stats
 | 
						|
            self.stats = hotshot.stats.load(filename[0])
 | 
						|
        self.profile = Profile()
 | 
						|
        self.function_ids = {}
 | 
						|
 | 
						|
    def get_function_name(self, (filename, line, name)):
 | 
						|
        module = os.path.splitext(filename)[0]
 | 
						|
        module = os.path.basename(module)
 | 
						|
        return "%s:%d:%s" % (module, line, name)
 | 
						|
 | 
						|
    def get_function(self, key):
 | 
						|
        try:
 | 
						|
            id = self.function_ids[key]
 | 
						|
        except KeyError:
 | 
						|
            id = len(self.function_ids)
 | 
						|
            name = self.get_function_name(key)
 | 
						|
            function = Function(id, name)
 | 
						|
            self.profile.functions[id] = function
 | 
						|
            self.function_ids[key] = id
 | 
						|
        else:
 | 
						|
            function = self.profile.functions[id]
 | 
						|
        return function
 | 
						|
 | 
						|
    def parse(self):
 | 
						|
        self.profile[TIME] = 0.0
 | 
						|
        self.profile[TOTAL_TIME] = self.stats.total_tt
 | 
						|
        for fn, (cc, nc, tt, ct, callers) in self.stats.stats.iteritems():
 | 
						|
            callee = self.get_function(fn)
 | 
						|
            callee.called = nc
 | 
						|
            callee[TOTAL_TIME] = ct
 | 
						|
            callee[TIME] = tt
 | 
						|
            self.profile[TIME] += tt
 | 
						|
            self.profile[TOTAL_TIME] = max(self.profile[TOTAL_TIME], ct)
 | 
						|
            for fn, value in callers.iteritems():
 | 
						|
                caller = self.get_function(fn)
 | 
						|
                call = Call(callee.id)
 | 
						|
                if isinstance(value, tuple):
 | 
						|
                    for i in xrange(0, len(value), 4):
 | 
						|
                        nc, cc, tt, ct = value[i:i+4]
 | 
						|
                        if CALLS in call:
 | 
						|
                            call[CALLS] += cc
 | 
						|
                        else:
 | 
						|
                            call[CALLS] = cc
 | 
						|
 | 
						|
                        if TOTAL_TIME in call:
 | 
						|
                            call[TOTAL_TIME] += ct
 | 
						|
                        else:
 | 
						|
                            call[TOTAL_TIME] = ct
 | 
						|
 | 
						|
                else:
 | 
						|
                    call[CALLS] = value
 | 
						|
                    call[TOTAL_TIME] = ratio(value, nc)*ct
 | 
						|
 | 
						|
                caller.add_call(call)
 | 
						|
        #self.stats.print_stats()
 | 
						|
        #self.stats.print_callees()
 | 
						|
 | 
						|
        # Compute derived events
 | 
						|
        self.profile.validate()
 | 
						|
        self.profile.ratio(TIME_RATIO, TIME)
 | 
						|
        self.profile.ratio(TOTAL_TIME_RATIO, TOTAL_TIME)
 | 
						|
 | 
						|
        return self.profile
 | 
						|
 | 
						|
 | 
						|
class Theme:
 | 
						|
 | 
						|
    def __init__(self, 
 | 
						|
            bgcolor = (0.0, 0.0, 1.0),
 | 
						|
            mincolor = (0.0, 0.0, 0.0),
 | 
						|
            maxcolor = (0.0, 0.0, 1.0),
 | 
						|
            fontname = "Arial",
 | 
						|
            minfontsize = 10.0,
 | 
						|
            maxfontsize = 10.0,
 | 
						|
            minpenwidth = 0.5,
 | 
						|
            maxpenwidth = 4.0,
 | 
						|
            gamma = 2.2,
 | 
						|
            skew = 1.0):
 | 
						|
        self.bgcolor = bgcolor
 | 
						|
        self.mincolor = mincolor
 | 
						|
        self.maxcolor = maxcolor
 | 
						|
        self.fontname = fontname
 | 
						|
        self.minfontsize = minfontsize
 | 
						|
        self.maxfontsize = maxfontsize
 | 
						|
        self.minpenwidth = minpenwidth
 | 
						|
        self.maxpenwidth = maxpenwidth
 | 
						|
        self.gamma = gamma
 | 
						|
        self.skew = skew
 | 
						|
 | 
						|
    def graph_bgcolor(self):
 | 
						|
        return self.hsl_to_rgb(*self.bgcolor)
 | 
						|
 | 
						|
    def graph_fontname(self):
 | 
						|
        return self.fontname
 | 
						|
 | 
						|
    def graph_fontsize(self):
 | 
						|
        return self.minfontsize
 | 
						|
 | 
						|
    def node_bgcolor(self, weight):
 | 
						|
        return self.color(weight)
 | 
						|
 | 
						|
    def node_fgcolor(self, weight):
 | 
						|
        return self.graph_bgcolor()
 | 
						|
 | 
						|
    def node_fontsize(self, weight):
 | 
						|
        return self.fontsize(weight)
 | 
						|
 | 
						|
    def edge_color(self, weight):
 | 
						|
        return self.color(weight)
 | 
						|
 | 
						|
    def edge_fontsize(self, weight):
 | 
						|
        return self.fontsize(weight)
 | 
						|
 | 
						|
    def edge_penwidth(self, weight):
 | 
						|
        return max(weight*self.maxpenwidth, self.minpenwidth)
 | 
						|
 | 
						|
    def edge_arrowsize(self, weight):
 | 
						|
        return 0.5 * math.sqrt(self.edge_penwidth(weight))
 | 
						|
 | 
						|
    def fontsize(self, weight):
 | 
						|
        return max(weight**2 * self.maxfontsize, self.minfontsize)
 | 
						|
 | 
						|
    def color(self, weight):
 | 
						|
        weight = min(max(weight, 0.0), 1.0)
 | 
						|
    
 | 
						|
        hmin, smin, lmin = self.mincolor
 | 
						|
        hmax, smax, lmax = self.maxcolor
 | 
						|
        
 | 
						|
        if self.skew < 0:
 | 
						|
            raise ValueError("Skew must be greater than 0")
 | 
						|
        elif self.skew == 1.0:
 | 
						|
            h = hmin + weight*(hmax - hmin)
 | 
						|
            s = smin + weight*(smax - smin)
 | 
						|
            l = lmin + weight*(lmax - lmin)
 | 
						|
        else:
 | 
						|
            base = self.skew
 | 
						|
            h = hmin + ((hmax-hmin)*(-1.0 + (base ** weight)) / (base - 1.0))
 | 
						|
            s = smin + ((smax-smin)*(-1.0 + (base ** weight)) / (base - 1.0))
 | 
						|
            l = lmin + ((lmax-lmin)*(-1.0 + (base ** weight)) / (base - 1.0))
 | 
						|
 | 
						|
        return self.hsl_to_rgb(h, s, l)
 | 
						|
 | 
						|
    def hsl_to_rgb(self, h, s, l):
 | 
						|
        """Convert a color from HSL color-model to RGB.
 | 
						|
 | 
						|
        See also:
 | 
						|
        - http://www.w3.org/TR/css3-color/#hsl-color
 | 
						|
        """
 | 
						|
 | 
						|
        h = h % 1.0
 | 
						|
        s = min(max(s, 0.0), 1.0)
 | 
						|
        l = min(max(l, 0.0), 1.0)
 | 
						|
 | 
						|
        if l <= 0.5:
 | 
						|
            m2 = l*(s + 1.0)
 | 
						|
        else:
 | 
						|
            m2 = l + s - l*s
 | 
						|
        m1 = l*2.0 - m2
 | 
						|
        r = self._hue_to_rgb(m1, m2, h + 1.0/3.0)
 | 
						|
        g = self._hue_to_rgb(m1, m2, h)
 | 
						|
        b = self._hue_to_rgb(m1, m2, h - 1.0/3.0)
 | 
						|
 | 
						|
        # Apply gamma correction
 | 
						|
        r **= self.gamma
 | 
						|
        g **= self.gamma
 | 
						|
        b **= self.gamma
 | 
						|
 | 
						|
        return (r, g, b)
 | 
						|
 | 
						|
    def _hue_to_rgb(self, m1, m2, h):
 | 
						|
        if h < 0.0:
 | 
						|
            h += 1.0
 | 
						|
        elif h > 1.0:
 | 
						|
            h -= 1.0
 | 
						|
        if h*6 < 1.0:
 | 
						|
            return m1 + (m2 - m1)*h*6.0
 | 
						|
        elif h*2 < 1.0:
 | 
						|
            return m2
 | 
						|
        elif h*3 < 2.0:
 | 
						|
            return m1 + (m2 - m1)*(2.0/3.0 - h)*6.0
 | 
						|
        else:
 | 
						|
            return m1
 | 
						|
 | 
						|
 | 
						|
TEMPERATURE_COLORMAP = Theme(
 | 
						|
    mincolor = (2.0/3.0, 0.80, 0.25), # dark blue
 | 
						|
    maxcolor = (0.0, 1.0, 0.5), # satured red
 | 
						|
    gamma = 1.0
 | 
						|
)
 | 
						|
 | 
						|
PINK_COLORMAP = Theme(
 | 
						|
    mincolor = (0.0, 1.0, 0.90), # pink
 | 
						|
    maxcolor = (0.0, 1.0, 0.5), # satured red
 | 
						|
)
 | 
						|
 | 
						|
GRAY_COLORMAP = Theme(
 | 
						|
    mincolor = (0.0, 0.0, 0.85), # light gray
 | 
						|
    maxcolor = (0.0, 0.0, 0.0), # black
 | 
						|
)
 | 
						|
 | 
						|
BW_COLORMAP = Theme(
 | 
						|
    minfontsize = 8.0,
 | 
						|
    maxfontsize = 24.0,
 | 
						|
    mincolor = (0.0, 0.0, 0.0), # black
 | 
						|
    maxcolor = (0.0, 0.0, 0.0), # black
 | 
						|
    minpenwidth = 0.1,
 | 
						|
    maxpenwidth = 8.0,
 | 
						|
)
 | 
						|
 | 
						|
 | 
						|
class DotWriter:
 | 
						|
    """Writer for the DOT language.
 | 
						|
 | 
						|
    See also:
 | 
						|
    - "The DOT Language" specification
 | 
						|
      http://www.graphviz.org/doc/info/lang.html
 | 
						|
    """
 | 
						|
 | 
						|
    def __init__(self, fp):
 | 
						|
        self.fp = fp
 | 
						|
 | 
						|
    def graph(self, profile, theme):
 | 
						|
        self.begin_graph()
 | 
						|
 | 
						|
        fontname = theme.graph_fontname()
 | 
						|
 | 
						|
        self.attr('graph', fontname=fontname, ranksep=0.25, nodesep=0.125)
 | 
						|
        self.attr('node', fontname=fontname, shape="box", style="filled", fontcolor="white", width=0, height=0)
 | 
						|
        self.attr('edge', fontname=fontname)
 | 
						|
 | 
						|
        for function in profile.functions.itervalues():
 | 
						|
            labels = []
 | 
						|
            if function.process is not None:
 | 
						|
                labels.append(function.process)
 | 
						|
            if function.module is not None:
 | 
						|
                labels.append(function.module)
 | 
						|
            labels.append(function.name)
 | 
						|
            for event in TOTAL_TIME_RATIO, TIME_RATIO:
 | 
						|
                if event in function.events:
 | 
						|
                    label = event.format(function[event])
 | 
						|
                    labels.append(label)
 | 
						|
            if function.called is not None:
 | 
						|
                labels.append(u"%u\xd7" % (function.called,))
 | 
						|
 | 
						|
            if function.weight is not None:
 | 
						|
                weight = function.weight
 | 
						|
            else:
 | 
						|
                weight = 0.0
 | 
						|
 | 
						|
            label = '\n'.join(labels)
 | 
						|
            self.node(function.id, 
 | 
						|
                label = label, 
 | 
						|
                color = self.color(theme.node_bgcolor(weight)), 
 | 
						|
                fontcolor = self.color(theme.node_fgcolor(weight)), 
 | 
						|
                fontsize = "%.2f" % theme.node_fontsize(weight),
 | 
						|
            )
 | 
						|
 | 
						|
            for call in function.calls.itervalues():
 | 
						|
                callee = profile.functions[call.callee_id]
 | 
						|
 | 
						|
                labels = []
 | 
						|
                for event in TOTAL_TIME_RATIO, CALLS:
 | 
						|
                    if event in call.events:
 | 
						|
                        label = event.format(call[event])
 | 
						|
                        labels.append(label)
 | 
						|
 | 
						|
                if call.weight is not None:
 | 
						|
                    weight = call.weight
 | 
						|
                elif callee.weight is not None:
 | 
						|
                    weight = callee.weight
 | 
						|
                else:
 | 
						|
                    weight = 0.0
 | 
						|
 | 
						|
                label = '\n'.join(labels)
 | 
						|
 | 
						|
                self.edge(function.id, call.callee_id, 
 | 
						|
                    label = label, 
 | 
						|
                    color = self.color(theme.edge_color(weight)), 
 | 
						|
                    fontcolor = self.color(theme.edge_color(weight)),
 | 
						|
                    fontsize = "%.2f" % theme.edge_fontsize(weight), 
 | 
						|
                    penwidth = "%.2f" % theme.edge_penwidth(weight), 
 | 
						|
                    labeldistance = "%.2f" % theme.edge_penwidth(weight), 
 | 
						|
                    arrowsize = "%.2f" % theme.edge_arrowsize(weight),
 | 
						|
                )
 | 
						|
 | 
						|
        self.end_graph()
 | 
						|
 | 
						|
    def begin_graph(self):
 | 
						|
        self.write('digraph {\n')
 | 
						|
 | 
						|
    def end_graph(self):
 | 
						|
        self.write('}\n')
 | 
						|
 | 
						|
    def attr(self, what, **attrs):
 | 
						|
        self.write("\t")
 | 
						|
        self.write(what)
 | 
						|
        self.attr_list(attrs)
 | 
						|
        self.write(";\n")
 | 
						|
 | 
						|
    def node(self, node, **attrs):
 | 
						|
        self.write("\t")
 | 
						|
        self.id(node)
 | 
						|
        self.attr_list(attrs)
 | 
						|
        self.write(";\n")
 | 
						|
 | 
						|
    def edge(self, src, dst, **attrs):
 | 
						|
        self.write("\t")
 | 
						|
        self.id(src)
 | 
						|
        self.write(" -> ")
 | 
						|
        self.id(dst)
 | 
						|
        self.attr_list(attrs)
 | 
						|
        self.write(";\n")
 | 
						|
 | 
						|
    def attr_list(self, attrs):
 | 
						|
        if not attrs:
 | 
						|
            return
 | 
						|
        self.write(' [')
 | 
						|
        first = True
 | 
						|
        for name, value in attrs.iteritems():
 | 
						|
            if first:
 | 
						|
                first = False
 | 
						|
            else:
 | 
						|
                self.write(", ")
 | 
						|
            self.id(name)
 | 
						|
            self.write('=')
 | 
						|
            self.id(value)
 | 
						|
        self.write(']')
 | 
						|
 | 
						|
    def id(self, id):
 | 
						|
        if isinstance(id, (int, float)):
 | 
						|
            s = str(id)
 | 
						|
        elif isinstance(id, basestring):
 | 
						|
            if id.isalnum() and not id.startswith('0x'):
 | 
						|
                s = id
 | 
						|
            else:
 | 
						|
                s = self.escape(id)
 | 
						|
        else:
 | 
						|
            raise TypeError
 | 
						|
        self.write(s)
 | 
						|
 | 
						|
    def color(self, (r, g, b)):
 | 
						|
 | 
						|
        def float2int(f):
 | 
						|
            if f <= 0.0:
 | 
						|
                return 0
 | 
						|
            if f >= 1.0:
 | 
						|
                return 255
 | 
						|
            return int(255.0*f + 0.5)
 | 
						|
 | 
						|
        return "#" + "".join(["%02x" % float2int(c) for c in (r, g, b)])
 | 
						|
 | 
						|
    def escape(self, s):
 | 
						|
        s = s.encode('utf-8')
 | 
						|
        s = s.replace('\\', r'\\')
 | 
						|
        s = s.replace('\n', r'\n')
 | 
						|
        s = s.replace('\t', r'\t')
 | 
						|
        s = s.replace('"', r'\"')
 | 
						|
        return '"' + s + '"'
 | 
						|
 | 
						|
    def write(self, s):
 | 
						|
        self.fp.write(s)
 | 
						|
 | 
						|
 | 
						|
class Main:
 | 
						|
    """Main program."""
 | 
						|
 | 
						|
    themes = {
 | 
						|
            "color": TEMPERATURE_COLORMAP,
 | 
						|
            "pink": PINK_COLORMAP,
 | 
						|
            "gray": GRAY_COLORMAP,
 | 
						|
            "bw": BW_COLORMAP,
 | 
						|
    }
 | 
						|
 | 
						|
    def main(self):
 | 
						|
        """Main program."""
 | 
						|
 | 
						|
        parser = optparse.OptionParser(
 | 
						|
            usage="\n\t%prog [options] [file] ...",
 | 
						|
            version="%%prog %s" % __version__)
 | 
						|
        parser.add_option(
 | 
						|
            '-o', '--output', metavar='FILE',
 | 
						|
            type="string", dest="output",
 | 
						|
            help="output filename [stdout]")
 | 
						|
        parser.add_option(
 | 
						|
            '-n', '--node-thres', metavar='PERCENTAGE',
 | 
						|
            type="float", dest="node_thres", default=0.5,
 | 
						|
            help="eliminate nodes below this threshold [default: %default]")
 | 
						|
        parser.add_option(
 | 
						|
            '-e', '--edge-thres', metavar='PERCENTAGE',
 | 
						|
            type="float", dest="edge_thres", default=0.1,
 | 
						|
            help="eliminate edges below this threshold [default: %default]")
 | 
						|
        parser.add_option(
 | 
						|
            '-f', '--format',
 | 
						|
            type="choice", choices=('prof', 'callgrind', 'oprofile', 'sysprof', 'pstats', 'shark', 'sleepy', 'aqtime', 'xperf'),
 | 
						|
            dest="format", default="prof",
 | 
						|
            help="profile format: prof, callgrind, oprofile, sysprof, shark, sleepy, aqtime, pstats, or xperf [default: %default]")
 | 
						|
        parser.add_option(
 | 
						|
            '-c', '--colormap',
 | 
						|
            type="choice", choices=('color', 'pink', 'gray', 'bw'),
 | 
						|
            dest="theme", default="color",
 | 
						|
            help="color map: color, pink, gray, or bw [default: %default]")
 | 
						|
        parser.add_option(
 | 
						|
            '-s', '--strip',
 | 
						|
            action="store_true",
 | 
						|
            dest="strip", default=False,
 | 
						|
            help="strip function parameters, template parameters, and const modifiers from demangled C++ function names")
 | 
						|
        parser.add_option(
 | 
						|
            '-w', '--wrap',
 | 
						|
            action="store_true",
 | 
						|
            dest="wrap", default=False,
 | 
						|
            help="wrap function names")
 | 
						|
        # add a new option to control skew of the colorization curve
 | 
						|
        parser.add_option(
 | 
						|
            '--skew',
 | 
						|
            type="float", dest="theme_skew", default=1.0,
 | 
						|
            help="skew the colorization curve.  Values < 1.0 give more variety to lower percentages.  Value > 1.0 give less variety to lower percentages")
 | 
						|
        (self.options, self.args) = parser.parse_args(sys.argv[1:])
 | 
						|
 | 
						|
        if len(self.args) > 1 and self.options.format != 'pstats':
 | 
						|
            parser.error('incorrect number of arguments')
 | 
						|
 | 
						|
        try:
 | 
						|
            self.theme = self.themes[self.options.theme]
 | 
						|
        except KeyError:
 | 
						|
            parser.error('invalid colormap \'%s\'' % self.options.theme)
 | 
						|
        
 | 
						|
        # set skew on the theme now that it has been picked.
 | 
						|
        if self.options.theme_skew:
 | 
						|
            self.theme.skew = self.options.theme_skew
 | 
						|
 | 
						|
        if self.options.format == 'prof':
 | 
						|
            if not self.args:
 | 
						|
                fp = sys.stdin
 | 
						|
            else:
 | 
						|
                fp = open(self.args[0], 'rt')
 | 
						|
            parser = GprofParser(fp)
 | 
						|
        elif self.options.format == 'callgrind':
 | 
						|
            if not self.args:
 | 
						|
                fp = sys.stdin
 | 
						|
            else:
 | 
						|
                fp = open(self.args[0], 'rt')
 | 
						|
            parser = CallgrindParser(fp)
 | 
						|
        elif self.options.format == 'oprofile':
 | 
						|
            if not self.args:
 | 
						|
                fp = sys.stdin
 | 
						|
            else:
 | 
						|
                fp = open(self.args[0], 'rt')
 | 
						|
            parser = OprofileParser(fp)
 | 
						|
        elif self.options.format == 'sysprof':
 | 
						|
            if not self.args:
 | 
						|
                fp = sys.stdin
 | 
						|
            else:
 | 
						|
                fp = open(self.args[0], 'rt')
 | 
						|
            parser = SysprofParser(fp)
 | 
						|
        elif self.options.format == 'pstats':
 | 
						|
            if not self.args:
 | 
						|
                parser.error('at least a file must be specified for pstats input')
 | 
						|
            parser = PstatsParser(*self.args)
 | 
						|
        elif self.options.format == 'xperf':
 | 
						|
            if not self.args:
 | 
						|
                fp = sys.stdin
 | 
						|
            else:
 | 
						|
                fp = open(self.args[0], 'rt')
 | 
						|
            parser = XPerfParser(fp)
 | 
						|
        elif self.options.format == 'shark':
 | 
						|
            if not self.args:
 | 
						|
                fp = sys.stdin
 | 
						|
            else:
 | 
						|
                fp = open(self.args[0], 'rt')
 | 
						|
            parser = SharkParser(fp)
 | 
						|
        elif self.options.format == 'sleepy':
 | 
						|
            if len(self.args) != 1:
 | 
						|
                parser.error('exactly one file must be specified for sleepy input')
 | 
						|
            parser = SleepyParser(self.args[0])
 | 
						|
        elif self.options.format == 'aqtime':
 | 
						|
            if not self.args:
 | 
						|
                fp = sys.stdin
 | 
						|
            else:
 | 
						|
                fp = open(self.args[0], 'rt')
 | 
						|
            parser = AQtimeParser(fp)
 | 
						|
        else:
 | 
						|
            parser.error('invalid format \'%s\'' % self.options.format)
 | 
						|
 | 
						|
        self.profile = parser.parse()
 | 
						|
        
 | 
						|
        if self.options.output is None:
 | 
						|
            self.output = sys.stdout
 | 
						|
        else:
 | 
						|
            self.output = open(self.options.output, 'wt')
 | 
						|
 | 
						|
        self.write_graph()
 | 
						|
 | 
						|
    _parenthesis_re = re.compile(r'\([^()]*\)')
 | 
						|
    _angles_re = re.compile(r'<[^<>]*>')
 | 
						|
    _const_re = re.compile(r'\s+const$')
 | 
						|
 | 
						|
    def strip_function_name(self, name):
 | 
						|
        """Remove extraneous information from C++ demangled function names."""
 | 
						|
 | 
						|
        # Strip function parameters from name by recursively removing paired parenthesis
 | 
						|
        while True:
 | 
						|
            name, n = self._parenthesis_re.subn('', name)
 | 
						|
            if not n:
 | 
						|
                break
 | 
						|
 | 
						|
        # Strip const qualifier
 | 
						|
        name = self._const_re.sub('', name)
 | 
						|
 | 
						|
        # Strip template parameters from name by recursively removing paired angles
 | 
						|
        while True:
 | 
						|
            name, n = self._angles_re.subn('', name)
 | 
						|
            if not n:
 | 
						|
                break
 | 
						|
 | 
						|
        return name
 | 
						|
 | 
						|
    def wrap_function_name(self, name):
 | 
						|
        """Split the function name on multiple lines."""
 | 
						|
 | 
						|
        if len(name) > 32:
 | 
						|
            ratio = 2.0/3.0
 | 
						|
            height = max(int(len(name)/(1.0 - ratio) + 0.5), 1)
 | 
						|
            width = max(len(name)/height, 32)
 | 
						|
            # TODO: break lines in symbols
 | 
						|
            name = textwrap.fill(name, width, break_long_words=False)
 | 
						|
 | 
						|
        # Take away spaces
 | 
						|
        name = name.replace(", ", ",")
 | 
						|
        name = name.replace("> >", ">>")
 | 
						|
        name = name.replace("> >", ">>") # catch consecutive
 | 
						|
 | 
						|
        return name
 | 
						|
 | 
						|
    def compress_function_name(self, name):
 | 
						|
        """Compress function name according to the user preferences."""
 | 
						|
 | 
						|
        if self.options.strip:
 | 
						|
            name = self.strip_function_name(name)
 | 
						|
 | 
						|
        if self.options.wrap:
 | 
						|
            name = self.wrap_function_name(name)
 | 
						|
 | 
						|
        # TODO: merge functions with same resulting name
 | 
						|
 | 
						|
        return name
 | 
						|
 | 
						|
    def write_graph(self):
 | 
						|
        dot = DotWriter(self.output)
 | 
						|
        profile = self.profile
 | 
						|
        profile.prune(self.options.node_thres/100.0, self.options.edge_thres/100.0)
 | 
						|
 | 
						|
        for function in profile.functions.itervalues():
 | 
						|
            function.name = self.compress_function_name(function.name)
 | 
						|
 | 
						|
        dot.graph(profile, self.theme)
 | 
						|
 | 
						|
 | 
						|
if __name__ == '__main__':
 | 
						|
    Main().main()
 |