elements for result summaries that # look like this: #

# # # # #

File:	gstmodule.c
Function:	init_gst
Error:	ob_refcnt of new ref from (unknown) pygobject_init is 1 too high

if not soup.html: # broken file: error during output of HTML? return for div in soup.html.body.findAll('div'): table = div.table if not table: continue #print div['id'] #print 'div: %r' % div rows = table('tr') def get_second_col(row): return row('td')[1].b.string # Capture the marked up source code and notes from the report: htmlpre = div.div.pre errmsg = get_second_col(rows[2]) if not errmsg: continue yield ErrorReport(htmlpath=htmlpath, htmlid=div['id'], filename=get_second_col(rows[0]), function = get_second_col(rows[1]), errmsg = errmsg, htmlpre = htmlpre) class Severity(namedtuple('Severity', ('priority', 'title', 'description'))): """ priority: the int values are in asending severity (so that e.g. priority 5 is more severe than severity 4). This should give us a useful sort order for Severity instances """ (PRIORITY__RETURNING_NULL_WITHOUT_SETTING_EXCEPTION, PRIORITY__POSSIBLE_REFERENCE_LEAK, PRIORITY__REFERENCE_LEAK_OF_SINGLETON, PRIORITY__SEGFAULT_IN_ERROR_HANDLING, PRIORITY__REFERENCE_LEAK_IN_INITIALIZATION, PRIORITY__REFERENCE_COUNT_TOO_LOW_IN_INITIALIZATION, PRIORITY__REFERENCE_LEAK_IN_NORMAL_USE, PRIORITY__REFERENCE_COUNT_TOO_LOW_IN_NORMAL_USE, PRIORITY__SEGFAULT_IN_NORMAL_USE, PRIORITY__UNCLASSIFIED, ) = range(10) class Triager: """ Classify ErrorReport instances into various severity levels, identified by Severity instances """ def _classify_segfault(self, report): if report.contains_failure(): return Severity(priority=PRIORITY__SEGFAULT_IN_ERROR_HANDLING, title='Segfaults within error-handling paths', description='

Code paths in error-handling that will lead to a segmentatation fault (e.g. under low memory conditions)

') else: return Severity(priority=PRIORITY__SEGFAULT_IN_NORMAL_USE, title='Segfaults in normal paths', description='

Code paths that will lead to a segmentatation fault

') def classify(self, report): #print('report: %r' % (dir(report), )) #print('report.errmsg: %r' % report.errmsg) if report.errmsg is None: return Severity(priority=PRIORITY__UNCLASSIFIED, title='Unclassified errors', description='''

The triager didn't know how to classify these ones

''') m = re.match('ob_refcnt of (.+) too high', report.errmsg) if m: if report.might_be_borrowed_ref(): return Severity(priority=PRIORITY__POSSIBLE_REFERENCE_LEAK, title='Possible reference leaks', description=("""

Code paths in which the reference count of an object might too large - but in which the reference in question came from a function not known to the analyzer.

The analyzer assumes such references are new references, but if the function returns a borrowed reference instead, it's probably not a bug

""" )) if 'PyBool_FromLong' in report.errmsg: is_singleton = True else: is_singleton = False if is_singleton: return Severity(priority=PRIORITY__REFERENCE_LEAK_OF_SINGLETON, title='Reference leaks of a singleton', description=('''

Code paths in which the reference count of a singleton object will be left too large.

Technically incorrect, but unlikely to cause problems

''' )) else: if report.is_within_initialization(): return Severity(priority=PRIORITY__REFERENCE_LEAK_IN_INITIALIZATION, title='Reference leak within initialization', description='''

Code paths in which the reference count of an object is left too high, but within an initialization routine, and thus likely to only happen once

''') else: return Severity(priority=PRIORITY__REFERENCE_LEAK_IN_NORMAL_USE, title='Reference leaks', description='''

Code paths in which the reference count of an object is left too high, leading to memory leaks

''') m = re.match('ob_refcnt of (.+) too low', report.errmsg) if m: if report.is_within_initialization(): return Severity(priority=PRIORITY__REFERENCE_COUNT_TOO_LOW_IN_INITIALIZATION, title='Reference count too low within an initialization routine', description='''

Code paths in which the reference count of an object is too low, but within an initialization routine, and thus likely to only happen once

''' ) else: return Severity(priority=PRIORITY__REFERENCE_COUNT_TOO_LOW_IN_NORMAL_USE, title='Reference count too low', description='''

Code paths in which the reference count of an object is left too low. This could lead to the object being deallocated too early, triggering segfaults when later accessed. Over repeated calls, these errors could accumulate, increasing the likelihood of a segfault.

''') if report.errmsg == 'returning (PyObject*)NULL without setting an exception': return Severity(priority=PRIORITY__RETURNING_NULL_WITHOUT_SETTING_EXCEPTION, title='Returning (PyObject*)NULL without setting an exception', description='''

These messages are often false-positives: the analysis tool has no knowledge about internal API calls that can lead to an exception being set''') m = re.match('calling (.+) with NULL as argument (.*)', report.errmsg) if m: return self._classify_segfault(report) m = re.match('dereferencing NULL (.*)', report.errmsg) if m: return self._classify_segfault(report) m = re.match('reading from deallocated memory (.*)', report.errmsg) if m: return self._classify_segfault(report) return Severity(priority=PRIORITY__UNCLASSIFIED, title='Unclassified errors', description='''

The triager didn't know how to classify these ones

''') class BuildLog: # Wrapper around a "build.log" scraped from the mock build def __init__(self, path): self.unimplemented_functions = set() self.cplusplus_failure = False self.seen_rpmbuild = False self.num_tracebacks = 0 buildlog = os.path.join(path, 'build.log') with open(buildlog) as f: for line in f.readlines(): if 0: print(repr(line)) m = re.match('NotImplementedError: not yet implemented: (\S+)', line) if m: self.unimplemented_functions.add(m.group(1)) # Am seeing errors of this form: # The C++ compiler "/usr/bin/c++" is not able to compile a simple test # program. # It fails with the following output: # Change Dir: /builddir/build/BUILD/airrac-0.2.3/CMakeFiles/CMakeTmp # # Run Build Command:/usr/bin/gmake "cmTryCompileExec/fast" # /usr/bin/gmake -f CMakeFiles/cmTryCompileExec.dir/build.make # CMakeFiles/cmTryCompileExec.dir/build # gmake[1]: Entering directory # `/builddir/build/BUILD/airrac-0.2.3/CMakeFiles/CMakeTmp' # /usr/bin/cmake -E cmake_progress_report # /builddir/build/BUILD/airrac-0.2.3/CMakeFiles/CMakeTmp/CMakeFiles 1 # Building CXX object CMakeFiles/cmTryCompileExec.dir/testCXXCompiler.cxx.o # /usr/bin/c++ -O2 -g -pipe -Wall -Wp,-D_FORTIFY_SOURCE=2 -fexceptions # -fstack-protector --param=ssp-buffer-size=4 -m64 -mtune=generic -o # CMakeFiles/cmTryCompileExec.dir/testCXXCompiler.cxx.o -c # /builddir/build/BUILD/airrac-0.2.3/CMakeFiles/CMakeTmp/testCXXCompiler.cxx # Traceback (most recent call last): # File "/usr/bin/the-real-g++", line 53, in # p = subprocess.Popen(args) # File "/usr/lib64/python2.7/subprocess.py", line 679, in __init__ # errread, errwrite) # File "/usr/lib64/python2.7/subprocess.py", line 1130, in _execute_child # self.pid = os.fork() # OSError: [Errno 11] Resource temporarily unavailable if 'The C++ compiler "/usr/bin/c++" is not able to compile a simple test' in line: self.cplusplus_failure = 'The C++ compiler "/usr/bin/c++" is not able to compile a simple test' if not self.cplusplus_failure: if 'OSError: [Errno 11] Resource temporarily unavailable' in line: self.cplusplus_failure = 'OSError: [Errno 11] Resource temporarily unavailable' if 'configure: error: C++ compiler cannot create executables' in line: self.cplusplus_failure = 'configure: error: C++ compiler cannot create executables' if 'rpmbuild -bb' in line: self.seen_rpmbuild = True if line.startswith('Traceback '): self.num_tracebacks += 1 class Index: def __init__(self, path, title): self.reported = False self.seen_SWIG = False self.seen_Cython = False outpath = os.path.join(path, 'index.html') with open(outpath, 'w') as f: f.write('%s\n' % title) f.write(' \n') f.write('

%s

\n' % title) f.write("

This is a summary of errors seen when compiling with an experimental static analysis tool

") f.write('

Raw build logs can be seen here

\n') buildlog = BuildLog(path) if buildlog.cplusplus_failure: f.write('

C++ failure: %s

\n' % buildlog.cplusplus_failure) srpm = Srpm.from_path(path) BugReportDb.add_status(srpm, "FIXME: C++ failure: %s" % buildlog.cplusplus_failure) self.reported = True """ if not buildlog.seen_rpmbuild: f.write('

Did not see rpmbuild -bb in build.log

\n') srpm = Srpm.from_path(path) BugReportDb.add_status(srpm, "FIXME: did not see rpmbuild -bb in build.log") self.reported = True return """ # Gather the ErrorReport by severity triager = Triager() # mapping from Severity to list of ErrorReport self.severities = {} self.num_reports = 0 for dirpath, dirnames, filenames in os.walk(path): #print dirpath, dirnames, filenames for filename in filenames: if filename.endswith('-refcount-errors.html'): #print ' ', os.path.join(dirpath, filename) htmlpath = os.path.join(dirpath, filename) for er in get_errors_from_file(htmlpath): if er is None: continue #print(er.filename) #print(er.function) #print(er.errmsg) sev = triager.classify(er) #print(sev) if sev in self.severities: self.severities[sev].append(er) else: self.severities[sev] = [er] for sev, issues in self.iter_severities(): f.write('

%s

\n' % sev.title) f.write(' %s\n' % sev.description) f.write(' \n') for er in issues: self.num_reports += 1 href = os.path.relpath(er.href(), path) f.write(' ' % (href, er.filename, href, er.function, href, er.errmsg)) f.write('

\n') if 'SWIG' in er.function or 'SWIG' in er.errmsg: self.seen_SWIG = True if '__pyx' in er.function or '__pyx' in er.errmsg: self.seen_Cython = True if buildlog.unimplemented_functions: f.write('

Implementation notes for gcc-with-cpychecker

\n') f.write('

The following "Py" functions were used but aren\'t\n' ' yet explicitly handled by gcc-with-cpychecker

\n' '

```
%s
```

\n') if self.num_reports == 0 and not buildlog.unimplemented_functions: f.write('

Nothing was reported; did the plugin run correctly?\n') f.write(' \n') f.write('\n') if self.seen_Cython: if not self.reported: srpm = Srpm.from_path(path) BugReportDb.add_status(srpm, "FIXME: Cython-built") self.reported = True if self.seen_SWIG: if not self.reported: srpm = Srpm.from_path(path) BugReportDb.add_status(srpm, "FIXME: SWIG-built") self.reported = True if buildlog.num_tracebacks >= 5: if not self.reported: srpm = Srpm.from_path(path) BugReportDb.add_status(srpm, ("FIXME: %i tracebacks during build" % buildlog.num_tracebacks)) self.reported = True def iter_severities(self): for sev in sorted(self.severities.keys())[::-1]: yield sev, self.severities[sev] def main(): # locate .html # iterate over toplevel in "LOGS": for resultdir in os.listdir('LOGS'): resultpath = os.path.join('LOGS', resultdir) print(resultpath) index = Index(resultpath, 'Errors seen in %s' % resultdir) if __name__ == '__main__': main()