| 12
 3
 4
 5
 6
 7
 8
 9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
 100
 101
 102
 103
 104
 105
 106
 107
 108
 109
 110
 111
 112
 113
 114
 115
 116
 117
 118
 119
 120
 121
 122
 123
 
 | #!/usr/bin/python3
import re
import io
definitionSet = set()
definitionToSourceLocationMap = dict()
definitionToTypeMap = dict()
touchedMap = dict()
excludeSet = set()
sourceLocationSet = set()
# clang does not always use exactly the same numbers in the type-parameter vars it generates
# so I need to substitute them to ensure we can match correctly.
normalizeTypeParamsRegex = re.compile(r"type-parameter-\d+-\d+")
def normalizeTypeParams( line ):
    return normalizeTypeParamsRegex.sub("type-parameter-?-?", line)
with io.open("workdir/loplugin.fieldcanbelocal.log", "r", buffering=1024*1024) as txt:
    for line in txt:
        tokens = line.strip().split("\t")
        if tokens[0] == "definition:":
            fieldInfo = (normalizeTypeParams(tokens[1]), tokens[2])
            fieldType = tokens[3]
            srcLoc = tokens[4]
            # ignore external source code
            if srcLoc.startswith("external/"):
                continue
            # ignore build folder
            if srcLoc.startswith("workdir/"):
                continue
            definitionSet.add(fieldInfo)
            definitionToTypeMap[fieldInfo] = fieldType
            definitionToSourceLocationMap[fieldInfo] = srcLoc
        elif tokens[0] == "touched:":
            fieldInfo = (normalizeTypeParams(tokens[1]), tokens[2])
            touchedByFunction = normalizeTypeParams(tokens[3])
            touchedByFunctionSrcLoc = tokens[4]
            if fieldInfo in excludeSet:
                continue
            if touchedByFunction == "Negative":
                excludeSet.add(fieldInfo)
                if fieldInfo in touchedMap:
                    touchedMap.pop(fieldInfo)
            elif fieldInfo in touchedMap:
                if touchedMap[fieldInfo] != touchedByFunction:
                    excludeSet.add(fieldInfo)
                    touchedMap.pop(fieldInfo)
            else:
                touchedMap[fieldInfo] = touchedByFunction
        else:
            print( "unknown line: " + line)
outputSet = set()
for d in definitionSet:
    if d not in touchedMap:
        continue
    fieldType = definitionToTypeMap[d]
    # ignore some types that are known false+
    if (fieldType.startswith("std::unique_ptr<")
        or fieldType == "std::mutex"
        or "Mutex" in fieldType
        or "union" in fieldType
        or "anonymous namespace" in fieldType
        or "unnamed struct" in fieldType):
        continue
    # ignore some field names that are known false+
    if (d[1] == "mbDisposing"
        or d[1] == "bInDispose"
        or d[1] == "m_bDisposing"
        or d[1].startswith("m_bIn")):
        continue
    srcLoc = definitionToSourceLocationMap[d]
    # ignore some types in the system libraries we somehow pick up
    if srcLoc.startswith(".") or srcLoc.startswith("/") or srcLoc.startswith("lib/"):
        continue
    # part of the URE
    if srcLoc.startswith("include/cppuhelper/"):
        continue
    # on-disk structures
    if srcLoc.startswith("hwpfilter/"):
        continue
    if srcLoc.startswith("include/osl/"):
        continue
    if srcLoc.startswith("include/sal/"):
        continue
    if srcLoc.startswith("sw/source/filter/ww8/ww8struc.hxx"):
        continue
    if srcLoc.startswith("sd/source/filter/ppt/ppt97animations.hxx"):
        continue
    if srcLoc.startswith("lotuswordpro/"):
        continue
    if srcLoc.startswith("include/filter/msfilter/svdfppt.hxx"):
        continue
    if srcLoc.startswith("filter/source/graphicfilter/icgm/chart.hxx"):
        continue
    # most of this code is only compiled on windows, so we don't have decent results
    if srcLoc.startswith("include/svl/svdde.hxx"):
        continue
    touchedByFunction = touchedMap[d]
    outputSet.add((d[0] + " " + d[1] + " " + definitionToTypeMap[d], srcLoc, touchedByFunction))
# sort the results using a "natural order" so sequences like [item1,item2,item10] sort nicely
def natural_sort_key(s, _nsre=re.compile('([0-9]+)')):
    return [int(text) if text.isdigit() else text.lower()
            for text in re.split(_nsre, s)]
# sort by both the source-line and the datatype, so the output file ordering is stable
# when we have multiple items on the same source line
def v_sort_key(v):
    return natural_sort_key(v[1]) + [v[0]]
# sort results by name and line number
tmp1list = sorted(outputSet, key=lambda v: v_sort_key(v))
# print out the results
with open("compilerplugins/clang/fieldcanbelocal.results", "wt") as f:
    for t in tmp1list:
        f.write( t[1] + "\n" )
        f.write( "    " + t[0] + "\n" )
        f.write( "    " + t[2] + "\n" )
 |