diff options
Diffstat (limited to 'bin/find-most-common-warn-messages.py')
-rwxr-xr-x | bin/find-most-common-warn-messages.py | 39 |
1 files changed, 39 insertions, 0 deletions
diff --git a/bin/find-most-common-warn-messages.py b/bin/find-most-common-warn-messages.py new file mode 100755 index 0000000000..dc2ecf8ab0 --- /dev/null +++ b/bin/find-most-common-warn-messages.py @@ -0,0 +1,39 @@ +#!/usr/bin/python3 + +# A script to search our test logs and sort the messages by how common they are so we can start to +# reduce the noise a little. + +import sys +import re +import io +import subprocess + +# find . -name '*.log' | xargs grep -h 'warn:' | sort | uniq -c | sort -n --field-separator=: --key=5,6 + +process = subprocess.Popen("find workdir -name '*.log' | xargs grep -h 'warn:' | sort", + shell=True, stdout=subprocess.PIPE, universal_newlines=True) + +messages = dict() # dict of sourceAndLine->count +sampleOfMessage = dict() # dict of sourceAndLine->string +for line in process.stdout: + line = line.strip() + # a sample line is: + # warn:sw:18790:1:sw/source/core/doc/DocumentRedlineManager.cxx:98: redline table corrupted: overlapping redlines + tokens = line.split(":") + sourceAndLine = tokens[4] + ":" + tokens[5] + if (sourceAndLine in messages): + messages[sourceAndLine] = messages[sourceAndLine] + 1 + else: + messages[sourceAndLine] = 1 + sampleOfMessage[sourceAndLine] = line[line.find(tokens[6]):] + +tmplist = list() # set of tuple (count, sourceAndLine) +for key, value in messages.items(): + tmplist.append([value,key]) + +print( "The top 20 warnings" ) +print("") +for i in sorted(tmplist, key=lambda v: v[0])[-20:]: + print( "%6d %s %s" % (i[0], i[1], sampleOfMessage[i[1]]) ) + + |