1
# this is copied from the lsprof distro because somehow
2
# it is not installed by distutils
3
# I made one modification to profile so that it returns a pair
4
# instead of just the Stats object
8
import cPickle as pickle
16
from _lsprof import Profiler, profiler_entry
20
__all__ = ['profile', 'Stats']
23
def profile(f, *args, **kwds):
    """Run a function under the profiler.

    Exceptions are not caught: If you need stats even when exceptions are to be
    raised, pass in a closure that will catch the exceptions and transform them
    appropriately for your driver function.

    Important caveat: only one profile can execute at a time. See BzrProfiler
    for details.

    :param f: the callable to profile.
    :param args: positional arguments passed through to ``f``.
    :param kwds: keyword arguments passed through to ``f``.
    :return: The functions return value and a stats object.
    """
    profiler = BzrProfiler()
    profiler.start()
    try:
        ret = f(*args, **kwds)
    finally:
        # Always stop, even if f() raises, so the profiling hooks are removed
        # and the global profiler lock is released.
        stats = profiler.stop()
    return ret, stats
44
class BzrProfiler(object):
    """Bzr utility wrapper around Profiler.

    For most uses the module level 'profile()' function will be suitable.
    However profiling when a simple wrapped function isn't available may
    be easier to accomplish using this class.

    To use it, create a BzrProfiler and call start() on it. Some arbitrary
    time later call stop() to stop profiling and retrieve the statistics
    from the code executed in the interim.

    Note that profiling involves a threading.Lock around the actual profiling.
    This is needed because profiling involves global manipulation of the python
    interpreter state. As such you cannot perform multiple profiles at once.
    Trying to do so will lock out the second profiler unless the global
    breezy.lsprof.BzrProfiler.profiler_block is set to 0. Setting it to 0 will
    cause profiling to fail rather than blocking.
    """

    # Serialise rather than failing to profile concurrent profile requests.
    # This value is passed as the "blocking" argument when the lock is taken.
    profiler_block = 1

    # Global lock used to serialise profiles.
    profiler_lock = threading.Lock()

    def start(self):
        """Start profiling.

        This hooks into threading and will record all calls made until
        stop() is called.

        :raises errors.InternalBzrError: if the profiler lock could not be
            acquired (only possible when profiler_block is false).
        """
        self._g_threadmap = {}
        self.p = Profiler()
        permitted = self.__class__.profiler_lock.acquire(
            self.__class__.profiler_block)
        if not permitted:
            raise errors.InternalBzrError(msg="Already profiling something")
        try:
            self.p.enable(subcalls=True)
            threading.setprofile(self._thread_profile)
        except BaseException:
            # Never leave the global lock held if the hooks failed to install.
            self.__class__.profiler_lock.release()
            raise

    def stop(self):
        """Stop profiling.

        This unhooks from threading and cleans up the profiler, returning
        the gathered Stats object.

        :return: A breezy.lsprof.Stats object.
        """
        try:
            self.p.disable()
            for pp in self._g_threadmap.values():
                pp.disable()
            threading.setprofile(None)
            p = self.p
            self.p = None
            # One nested Stats per thread seen by _thread_profile.
            threads = {}
            for tid, pp in self._g_threadmap.items():
                threads[tid] = Stats(pp.getstats(), {})
            self._g_threadmap = None
            return Stats(p.getstats(), threads)
        finally:
            # Released on every path so a failed stop cannot block the next
            # profile.
            self.__class__.profiler_lock.release()

    def _thread_profile(self, f, *args, **kwds):
        """Profile hook installed through threading.setprofile().

        Creates a Profiler for the calling thread and records it in the
        thread map under the thread's identifier.
        """
        # we lose the first profile point for a new thread in order to
        # trampoline a new Profile object into place
        thr = _thread.get_ident()
        self._g_threadmap[thr] = p = Profiler()
        # this overrides our sys.setprofile hook:
        p.enable(subcalls=True, builtins=True)
class Stats(object):
    """Wrapper around the collected data.

    A Stats instance is created when the profiler finishes. Normal
    usage is to use save() to write out the data to a file, or pprint()
    to write human-readable information to the command line.
    """

    def __init__(self, data, threads):
        """Create a Stats object.

        :param data: list of profiler entries as returned by getstats().
        :param threads: dict mapping a thread identifier to the Stats
            gathered for that thread.
        """
        self.data = data
        self.threads = threads

    def sort(self, crit="inlinetime", reverse=True):
        """Sort the data by the supplied critera.

        Both the top-level entries and each entry's sub-calls are sorted
        in place.

        :param crit: the data attribute used as the sort key.
        :param reverse: sort in descending order when true.
        :raises ValueError: if crit is not a profiler_entry attribute, or
            is 'code'.
        """
        if crit not in profiler_entry.__dict__ or crit == 'code':
            raise ValueError("Can't sort by %s" % crit)

        key_func = operator.attrgetter(crit)
        self.data.sort(key=key_func, reverse=reverse)

        for e in self.data:
            if e.calls:
                e.calls.sort(key=key_func, reverse=reverse)

    def pprint(self, top=None, file=None):
        """Pretty-print the data as plain text for human consumption.

        :param top: only output the top n entries.
            The default value of None means output all data.
        :param file: the output file; if None, output will
            default to stdout.
        """
        if file is None:
            file = sys.stdout
        d = self.data
        if top is not None:
            d = d[:top]
        cols = "% 12s %12s %11.4f %11.4f %s\n"
        hcols = "% 12s %12s %12s %12s %s\n"
        file.write(hcols % ("CallCount", "Recursive", "Total(ms)",
                            "Inline(ms)", "module:lineno(function)"))
        for e in d:
            file.write(cols % (e.callcount, e.reccallcount, e.totaltime,
                               e.inlinetime, label(e.code)))
            if e.calls:
                # Sub-calls are listed under their caller, marked with "+".
                for se in e.calls:
                    file.write(cols % ("+%s" % se.callcount, se.reccallcount,
                                       se.totaltime, se.inlinetime,
                                       "+%s" % label(se.code)))

    def freeze(self):
        """Replace all references to code objects with string
        descriptions; this makes it possible to pickle the instance."""
        for i, e in enumerate(self.data):
            if not isinstance(e.code, str):
                self.data[i] = type(e)((label(e.code),) + e[1:])
            if e.calls:
                # The rebuilt entry shares this list, so it is fixed in place.
                for j, se in enumerate(e.calls):
                    if not isinstance(se.code, str):
                        e.calls[j] = type(se)((label(se.code),) + se[1:])
        for s in self.threads.values():
            s.freeze()

    def calltree(self, file):
        """Output profiling data in calltree format (for KCacheGrind)."""
        _CallTreeFilter(self.data).output(file)

    def save(self, filename, format=None):
        """Save profiling data to a file.

        :param filename: the name of the output file
        :param format: 'txt' for a text representation;
            'callgrind' for calltree format;
            otherwise a pickled Python object. A format of None indicates
            that the format to use is to be found from the filename. If
            the name starts with callgrind.out, callgrind format is used
            otherwise the format is given by the filename extension.
        """
        if format is None:
            basename = os.path.basename(filename)
            if basename.startswith('callgrind.out'):
                format = "callgrind"
            else:
                ext = os.path.splitext(filename)[1]
                if len(ext) > 1:
                    # Drop the leading dot of the extension.
                    format = ext[1:]
        with open(filename, 'wb') as outfile:
            if format == "callgrind":
                # The callgrind format states it is 'ASCII based':
                # <http://valgrind.org/docs/manual/cl-format.html>
                # But includes filenames so lets ignore and use UTF-8.
                self.calltree(codecs.getwriter('utf-8')(outfile))
            elif format == "txt":
                self.pprint(file=codecs.getwriter('utf-8')(outfile))
            else:
                # Code objects cannot be pickled; turn them into labels first.
                self.freeze()
                pickle.dump(self, outfile, 2)
224
class _CallTreeFilter(object):
    """Converter of a Stats object to input suitable for KCacheGrind.

    This code is taken from http://ddaa.net/blog/python/lsprof-calltree
    with the changes made by J.P. Calderone and Itamar applied. Note that
    isinstance(code, str) needs to be used at times to determine if the code
    object is actually an external code object (with a filename, etc.) or
    a Python built-in.
    """

    def __init__(self, data):
        """Remember the profiler entries to convert.

        :param data: iterable of profiler entries.
        """
        self.data = data
        self.out_file = None

    def output(self, out_file):
        """Write the header, the summary and every entry to out_file.

        :param out_file: a text file-like object with a write() method.
        """
        self.out_file = out_file
        out_file.write('events: Ticks\n')
        self._print_summary()
        for entry in self.data:
            self._entry(entry)

    def _print_summary(self):
        """Write the 'summary:' line holding the largest total cost."""
        max_cost = 0
        for entry in self.data:
            totaltime = int(entry.totaltime * 1000)
            max_cost = max(max_cost, totaltime)
        self.out_file.write('summary: %d\n' % (max_cost,))

    def _entry(self, entry):
        """Write one function record followed by its sub-call records."""
        out_file = self.out_file
        code = entry.code
        inlinetime = int(entry.inlinetime * 1000)
        if isinstance(code, str):
            out_file.write('fi=~\n')
        else:
            out_file.write('fi=%s\n' % (code.co_filename,))
        out_file.write('fn=%s\n' % (label(code, True),))
        if isinstance(code, str):
            out_file.write('0 %s\n' % (inlinetime,))
        else:
            out_file.write('%d %d\n' % (code.co_firstlineno, inlinetime))
        # recursive calls are counted in entry.calls
        if entry.calls:
            calls = entry.calls
        else:
            calls = []
        if isinstance(code, str):
            # String codes carry no line information.
            lineno = 0
        else:
            lineno = code.co_firstlineno
        for subentry in calls:
            self._subentry(lineno, subentry)
        # A blank line terminates this function's record.
        out_file.write('\n')

    def _subentry(self, lineno, subentry):
        """Write the call record for one callee of the current entry.

        :param lineno: first line number of the calling function, or 0.
        :param subentry: the profiler sub-entry describing the callee.
        """
        out_file = self.out_file
        code = subentry.code
        totaltime = int(subentry.totaltime * 1000)
        if isinstance(code, str):
            out_file.write('cfi=~\n')
            out_file.write('cfn=%s\n' % (label(code, True),))
            out_file.write('calls=%d 0\n' % (subentry.callcount,))
        else:
            out_file.write('cfi=%s\n' % (code.co_filename,))
            out_file.write('cfn=%s\n' % (label(code, True),))
            out_file.write('calls=%d %d\n' % (
                subentry.callcount, code.co_firstlineno))
        out_file.write('%d %d\n' % (lineno, totaltime))
297
def label(code, calltree=False):
    """Return a printable label for a profiled code object.

    :param code: a code object, or a string. Strings are returned
        unchanged.
    :param calltree: if true, format the label as ``name module:lineno``;
        otherwise as ``module:lineno(name)``.
    :return: the label string.
    """
    if isinstance(code, str):
        return code
    try:
        mname = _fn2mod[code.co_filename]
    except KeyError:
        # Iterate over a snapshot: an import in another thread would
        # otherwise change sys.modules during iteration and raise
        # RuntimeError.
        for k, v in list(sys.modules.items()):
            if getattr(v, '__file__', None) is None:
                continue
            if not isinstance(v.__file__, str):
                continue
            if v.__file__.startswith(code.co_filename):
                mname = _fn2mod[code.co_filename] = k
                break
        else:
            # No loaded module matches; fall back to the bare filename.
            mname = _fn2mod[code.co_filename] = '<%s>' % code.co_filename
    if calltree:
        return '%s %s:%d' % (code.co_name, mname, code.co_firstlineno)
    else:
        return '%s:%d(%s)' % (mname, code.co_firstlineno, code.co_name)
322
def main():
    """Profile the script named on the command line and print the stats.

    The first command-line argument is the script to run; the remaining
    arguments are left in sys.argv for that script. With no script given, a
    usage message is written to stderr and the process exits with status 2.
    """
    # Drop our own name so the profiled script sees itself as argv[0].
    sys.argv = sys.argv[1:]
    if not sys.argv:
        sys.stderr.write("usage: lsprof.py <script> <arguments...>\n")
        sys.exit(2)
    import runpy
    result, stats = profile(runpy.run_path, sys.argv[0], run_name='__main__')
    stats.sort()
    stats.pprint()
332
if __name__ == '__main__':