#!/usr/bin/python3 # -*- tab-width: 4; indent-tabs-mode: nil; py-indent-offset: 4 -*- # # This file is part of the LibreOffice project. # # This Source Code Form is subject to the terms of the Mozilla Public # License, v. 2.0. If a copy of the MPL was not distributed with this # file, You can obtain one at http://mozilla.org/MPL/2.0/. # ### script to help debug leaks of reference counted objects ## I. to use it, first override acquire() and release() # Foo * g_pTrackedFoo = 0; # Foo::Foo() # static int nFoos = 0; # if (++nFoos == 42) // track instance #42 # g_pTrackedFoo = this; # void Foo::acquire() # if (this == g_pTrackedFoo) # ; // set gdb breakpoint here # Foo_Base::acquire() # void Foo::release() # if (this == g_pTrackedFoo) # ; // set gdb breakpoint here # Foo_Base::release() ## II. run test/soffice in gdb and set breakpoints in acquire/release ## with a command to print the backtrace # set logging on # break foo.cxx:123 # break foo.cxx:234 # command 1 2 # bt # c # end # run ## III. now feed logfile gdb.txt into this script # bin/refcount_leak.py < gdb.txt ### from operator import itemgetter import re import sys threshold = 2 class Trace: clock = 0 # global counter # frames: list of stack frames, beginning with outermost def __init__(self, lines): lines.reverse() self.frames = lines Trace.clock += 1 self.clock = Trace.clock def addTrace(traces, lines): if not(traces is None) and len(lines) > 0: traces.append(Trace(lines)) def readGdbLog(infile): traces_acquire = [] traces_release = [] current = None lines = [] apattern = re.compile("^Breakpoint.*::acquire") rpattern = re.compile("^Breakpoint.*::release") for line in infile: if apattern.match(line): addTrace(current, lines) lines = [] current = traces_acquire if rpattern.match(line): addTrace(current, lines) lines = [] current = traces_release if line.startswith("#"): # strip #123 stack frame number, and newline lines.append(line[line.index("0x"):-1]) addTrace(current, lines) print("# parsed traces acquire: ", len(traces_acquire)) print("# parsed traces release: ", len(traces_release)) return (traces_acquire, traces_release) def getFunction(frame): start = frame.index(" in ") + len(" in ") try: end = frame.index(" at ", start) except ValueError as e: # argh... stack frames may be split across multiple lines if # a parameter has a fancy pretty printer return frame[start:] return frame[start:end] def matchStack(trace_acquire, trace_release): if trace_release.clock < trace_acquire.clock: return None # acquire must precede release common = 0 refpattern = re.compile(r"::Reference<.*>::Reference\(") for (frame1, frame2) in zip(trace_release.frames, trace_acquire.frames): if frame1 == frame2: common += 1 else: if getFunction(frame1) == getFunction(frame2): common += 1 acquireframes = len(trace_acquire.frames) # there is sometimes a dozen frames of UNO type related junk # on the stack where the acquire() happens, which breaks the # matching; try to avoid that for i in range(common, acquireframes): if refpattern.search(trace_acquire.frames[i]): acquireframes = i+1 # cut off junk above Reference ctor break score = max(len(trace_release.frames), acquireframes) - common # smaller score is better return (score, trace_release.clock - trace_acquire.clock) # brute force greedy n^2 matching def matchStacks(traces_acquire, traces_release): matches = [] for release in traces_release: for acquire in traces_acquire: score = matchStack(acquire, release) if score is not None: matches.append((score, acquire, release)) matches.sort(key=itemgetter(0)) return matches def bestMatches(traces_acquire, traces_release, matches): traces_aunmatched = traces_acquire traces_runmatched = traces_release bestmatches = [] for (score,acquire,release) in matches: if not(acquire in traces_aunmatched and release in traces_runmatched): continue traces_aunmatched.remove(acquire) traces_runmatched.remove(release) bestmatches.append((score,acquire,release)) print("# unmatched acquire: ", len(traces_aunmatched)) print("# unmatched release: ", len(traces_runmatched)) return (bestmatches,traces_aunmatched,traces_runmatched) def printTrace(trace): for frame in reversed(trace.frames): print(" ", frame) def printMatched(bestmatches): for (score,acquire,release) in reversed(bestmatches): print("\n*** Matched trace with score: ", score) print(" acquire: ") printTrace(acquire) print(" release: ") printTrace(release) def printUnmatched(traces, prefix): for trace in traces: print("\n*** Unmatched trace (", prefix, "):") printTrace(trace) if __name__ == "__main__": (traces_acquire, traces_release) = readGdbLog(sys.stdin) matches = matchStacks(traces_acquire, traces_release) (bestmatches,traces_au,traces_ru) = bestMatches(traces_acquire, traces_release, matches) # print output, sorted with the most suspicious stuff first: printUnmatched(traces_au, "acquire") printUnmatched(traces_ru, "release") printMatched(bestmatches) # vim:set shiftwidth=4 softtabstop=4 expandtab: