summaryrefslogtreecommitdiffstats
path: root/compilerplugins/clang/fieldcanbelocal.py
blob: 3266574445c5ff320f5ad921e5d3c6aebf5b0abf (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
#!/usr/bin/python3

import re
import io

# Keys used throughout are (normalized tokens[1], field name) tuples taken
# from the log -- presumably (enclosing class, field); verify against the plugin.

# every field definition seen in the log that is not in external/ or workdir/
definitionSet = set()
# field key -> source location of its definition
definitionToSourceLocationMap = {}
# field key -> declared type of the field
definitionToTypeMap = {}
# field key -> the single function seen touching the field so far
touchedMap = {}
# field keys ruled out: touched by "Negative" or by more than one function
excludeSet = set()
# NOTE(review): not referenced by the code visible in this file
sourceLocationSet = set()

# clang does not always number its generated type-parameter names the same way,
# so the numbers are replaced by placeholders to make the names comparable.
normalizeTypeParamsRegex = re.compile(r"type-parameter-\d+-\d+")
def normalizeTypeParams( line ):
    """Return line with every "type-parameter-N-M" rewritten to "type-parameter-?-?"."""
    placeholder = "type-parameter-?-?"
    return re.sub(normalizeTypeParamsRegex, placeholder, line)


# Parse the plugin log, one tab-separated record per line:
#   definition: <tokens[1]> <field name> <field type> <source location>
#   touched:    <tokens[1]> <field name> <touching function, or "Negative"> <one more field, unused here>
# A field stays in touchedMap only while exactly one function has been seen
# touching it; "Negative" or a second, different function moves it to excludeSet.
with io.open("workdir/loplugin.fieldcanbelocal.log", "r", buffering=1024*1024) as txt:
    for line in txt:
        tokens = line.strip().split("\t")
        if tokens[0] == "definition:" and len(tokens) >= 5:
            fieldInfo = (normalizeTypeParams(tokens[1]), tokens[2])
            fieldType = tokens[3]
            srcLoc = tokens[4]
            # ignore external source code
            if srcLoc.startswith("external/"):
                continue
            # ignore build folder
            if srcLoc.startswith("workdir/"):
                continue
            definitionSet.add(fieldInfo)
            definitionToTypeMap[fieldInfo] = fieldType
            definitionToSourceLocationMap[fieldInfo] = srcLoc
        elif tokens[0] == "touched:" and len(tokens) >= 4:
            fieldInfo = (normalizeTypeParams(tokens[1]), tokens[2])
            touchedByFunction = normalizeTypeParams(tokens[3])
            # once excluded, a field never becomes a candidate again
            if fieldInfo in excludeSet:
                continue
            if touchedByFunction == "Negative":
                excludeSet.add(fieldInfo)
                touchedMap.pop(fieldInfo, None)
            elif fieldInfo in touchedMap:
                # touched from a second, different function
                if touchedMap[fieldInfo] != touchedByFunction:
                    excludeSet.add(fieldInfo)
                    touchedMap.pop(fieldInfo)
            else:
                touchedMap[fieldInfo] = touchedByFunction
        else:
            # unrecognised tag, or a record with too few fields: report it
            # rather than aborting the whole run with an IndexError
            print( "unknown line: " + line)

# Build the result set: every defined field that is still in touchedMap
# (i.e. touched by exactly one function), minus the known false positives below.
skippedSrcLocPrefixes = (
    # ignore some types in the system libraries we somehow pick up
    ".", "/", "lib/",
    # part of the URE
    "include/cppuhelper/",
    # on-disk structures
    "hwpfilter/",
    "include/osl/",
    "include/sal/",
    "sw/source/filter/ww8/ww8struc.hxx",
    "sd/source/filter/ppt/ppt97animations.hxx",
    "lotuswordpro/",
    "include/filter/msfilter/svdfppt.hxx",
    "filter/source/graphicfilter/icgm/chart.hxx",
    # most of this code is only compiled on windows, so we don't have decent results
    "include/svl/svdde.hxx",
)

outputSet = set()
for d in definitionSet:
    if d not in touchedMap:
        continue
    fieldType = definitionToTypeMap[d]
    # ignore some types that are known false+
    if fieldType.startswith("std::unique_ptr<") or fieldType == "std::mutex":
        continue
    if any(marker in fieldType
           for marker in ("Mutex", "union", "anonymous namespace", "unnamed struct")):
        continue
    # ignore some field names that are known false+
    fieldName = d[1]
    if fieldName in ("mbDisposing", "bInDispose", "m_bDisposing"):
        continue
    if fieldName.startswith("m_bIn"):
        continue
    srcLoc = definitionToSourceLocationMap[d]
    if srcLoc.startswith(skippedSrcLocPrefixes):
        continue
    touchedByFunction = touchedMap[d]
    # each entry is (description, source location, touching function)
    outputSet.add((" ".join((d[0], fieldName, fieldType)), srcLoc, touchedByFunction))

# sort the results using a "natural order" so sequences like [item1,item2,item10] sort nicely
def natural_sort_key(s, _nsre=re.compile('([0-9]+)')):
    """Return a sort key for s in which embedded numbers compare by value.

    s is split on _nsre; the pieces that the pattern matches become ints,
    all other pieces are lower-cased text.

    The numeric pieces are identified with the same pattern used for the
    split, not with str.isdigit(): isdigit() is also true for characters
    such as superscript digits, which the pattern leaves inside text pieces
    and which int() rejects with ValueError.
    """
    return [int(text) if re.fullmatch(_nsre, text) else text.lower()
            for text in re.split(_nsre, s)]
# sort by both the source-line and the datatype, so the output file ordering is stable
# when we have multiple items on the same source line
def v_sort_key(v):
    """Return the natural-order key of v[1] with v[0] appended as a tie-breaker."""
    key = natural_sort_key(v[1])
    key.append(v[0])
    return key

# order the results by source location (natural order), then by description
tmp1list = list(outputSet)
tmp1list.sort(key=v_sort_key)

# write one three-line record per field: the source location, then the
# indented description and the indented name of the touching function
with open("compilerplugins/clang/fieldcanbelocal.results", "wt") as f:
    for desc, loc, toucher in tmp1list:
        f.write( loc + "\n" + "    " + desc + "\n" + "    " + toucher + "\n" )