summaryrefslogtreecommitdiffstats
path: root/compilerplugins/clang/virtualdead.py
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-15 05:54:39 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-15 05:54:39 +0000
commit267c6f2ac71f92999e969232431ba04678e7437e (patch)
tree358c9467650e1d0a1d7227a21dac2e3d08b622b2 /compilerplugins/clang/virtualdead.py
parentInitial commit. (diff)
downloadlibreoffice-267c6f2ac71f92999e969232431ba04678e7437e.tar.xz
libreoffice-267c6f2ac71f92999e969232431ba04678e7437e.zip
Adding upstream version 4:24.2.0.upstream/4%24.2.0
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'compilerplugins/clang/virtualdead.py')
-rwxr-xr-xcompilerplugins/clang/virtualdead.py128
1 files changed, 128 insertions, 0 deletions
diff --git a/compilerplugins/clang/virtualdead.py b/compilerplugins/clang/virtualdead.py
new file mode 100755
index 0000000000..efb5e2e777
--- /dev/null
+++ b/compilerplugins/clang/virtualdead.py
@@ -0,0 +1,128 @@
+#!/usr/bin/python3
+
+import re
+import io
+
+callDict = dict() # callInfo tuple -> callValue
+definitionToSourceLocationMap = dict()
+paramSet = set() # paraminfo tuple
+
+# clang does not always use exactly the same numbers in the type-parameter vars it generates
+# so I need to substitute them to ensure we can match correctly.
+normalizeTypeParamsRegex = re.compile(r"type-parameter-\d+-\d+")
+def normalizeTypeParams( line ):
+ return normalizeTypeParamsRegex.sub("type-parameter-?-?", line)
+
+# reading as binary (since we known it is pure ascii) is much faster than reading as unicode
+with io.open("workdir/loplugin.virtualdead.log", "r", encoding="ascii", errors="ignore", buffering=1024*1024) as txt:
+ for line in txt:
+ try:
+ tokens = line.strip().split("\t")
+ if tokens[0] == "virtual:":
+ nameAndParams = normalizeTypeParams(tokens[1])
+ sourceLocation = tokens[2]
+ returnValue = tokens[3]
+ callInfo = (nameAndParams, sourceLocation)
+ if not callInfo in callDict:
+ callDict[callInfo] = set()
+ callDict[callInfo].add(returnValue)
+ definitionToSourceLocationMap[nameAndParams] = sourceLocation
+ elif tokens[0] == "param:":
+ name = normalizeTypeParams(tokens[1])
+ if len(tokens)>2:
+ bitfield = tokens[2]
+ paramSet.add((name,bitfield))
+ else:
+ print( "unknown line: " + line)
+ except IndexError:
+ print("problem with line " + line.strip())
+ raise
+
+tmp1list = list()
+for callInfo, callValues in iter(callDict.items()):
+ nameAndParams = callInfo[1]
+ if len(callValues) != 1:
+ continue
+ callValue = next(iter(callValues))
+ if "unknown-stmt" in callValue:
+ continue
+ if "unknown2" in callValue:
+ continue
+ if "unknown3" in callValue:
+ continue
+ if "unknown4" in callValue:
+ continue
+ if "pure" in callValue:
+ continue
+ srcloc = callInfo[1]
+ if srcloc.startswith("workdir/"): continue
+ # ignore Qt stuff
+ if srcloc.startswith("Gui/"): continue
+ if srcloc.startswith("Widgets/"): continue
+ if srcloc.startswith("Core/"): continue
+ if srcloc.startswith("/Qt"): continue
+ if srcloc.startswith("Qt"): continue
+ if srcloc.startswith("64-"): continue
+ functionSig = callInfo[0]
+ tmp1list.append((srcloc, functionSig, callValue))
+
+def merge_bitfield(a, b):
+ if len(a) == 0: return b
+ ret = ""
+ for i, c in enumerate(b):
+ if c == "1" or a[i] == "1":
+ ret += "1"
+ else:
+ ret += "0"
+ return ret;
+tmp2dict = dict()
+tmp2list = list()
+for paramInfo in paramSet:
+ name = paramInfo[0]
+ bitfield = paramInfo[1]
+ if re.match( r"\w+ com::", name): continue
+ if re.match( r"\w+ ooo::vba::", name): continue
+ if re.match( r"\w+ orcus::", name): continue
+ if re.match( r"\w+ std::", name): continue
+ if not name in tmp2dict:
+ tmp2dict[name] = bitfield
+ else:
+ tmp2dict[name] = merge_bitfield(tmp2dict[name], bitfield)
+for name, bitfield in iter(tmp2dict.items()):
+ srcloc = definitionToSourceLocationMap[name]
+ # ignore Qt stuff
+ if srcloc.startswith("Gui/"): continue
+ if srcloc.startswith("Widgets/"): continue
+ if srcloc.startswith("Core/"): continue
+ if srcloc.startswith("/Qt"): continue
+ if srcloc.startswith("Qt"): continue
+ if srcloc.startswith("64-"): continue
+ # ignore external stuff
+ if srcloc.startswith("workdir/"): continue
+ # referenced by generated code in workdir/
+ if srcloc.startswith("writerfilter/source/ooxml/OOXMLFactory.hxx"): continue
+ if "0" in bitfield:
+ tmp2list.append((srcloc, name, bitfield))
+
+# sort results by filename:lineno
+def natural_sort_key(s, _nsre=re.compile('([0-9]+)')):
+ return [int(text) if text.isdigit() else text.lower()
+ for text in re.split(_nsre, s)]
+# sort by both the source-line and the datatype, so the output file ordering is stable
+# when we have multiple items on the same source line
+def v_sort_key(v):
+ return natural_sort_key(v[0]) + [v[1]]
+tmp1list.sort(key=lambda v: v_sort_key(v))
+tmp2list.sort(key=lambda v: v_sort_key(v))
+
+# print out the results
+with open("compilerplugins/clang/virtualdead.results", "wt") as f:
+ for v in tmp1list:
+ f.write(v[0] + "\n")
+ f.write(" " + v[1] + "\n")
+ f.write(" " + v[2] + "\n")
+with open("compilerplugins/clang/virtualdead.unusedparams.results", "wt") as f:
+ for v in tmp2list:
+ f.write(v[0] + "\n")
+ f.write(" " + v[1] + "\n")
+ f.write(" " + v[2] + "\n")