summaryrefslogtreecommitdiffstats
path: root/tools/performance-log-deduce.py
blob: 1c6e059a5ef4222cf4793fc836afee0c61354d1a (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
#!/usr/bin/env python3

"""
performance-log-deduce.py -- Deduce GIMP performance log thread state
Copyright (C) 2018  Ell

This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 3 of the License, or
(at your option) any later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program.  If not, see <https://www.gnu.org/licenses/>.


Usage: performance-log-deduce.py < infile > outfile
"""

# Minimum number of samples in which an address must appear as a thread's
# first frame before a state is deduced for it.
DEDUCE_MIN_N_OCCURRENCES = 10
# Minimum fraction (0-1, despite the name) of those samples that must share
# the most common state for that state to be deduced.
DEDUCE_MIN_PERCENTAGE    = 0.75

from xml.etree import ElementTree
import sys

# Read performance log from STDIN
#
# The input is read as raw bytes and handed to the XML parser undecoded.
raw_log = sys.stdin.buffer.read ()
log     = ElementTree.fromstring (raw_log)

# Childless stand-in for elements that are missing from the log, so that
# iterating over their (non-existent) children is simply a no-op.
empty_element = ElementTree.Element ("")

# Construct state histogram
#
# Maps the address of each thread's first <frame> to a two-element list of
# counters, indexed by the thread's integer "running" attribute: the number
# of times a thread was sampled at that address in each state.
address_states = {}

# Compare the results of find () against None explicitly: testing the truth
# value of an Element is deprecated (it emits a DeprecationWarning as of
# Python 3.12).  A childless element has nothing to iterate over anyway, so
# the outcome is the same as with the former `or empty_element' idiom.
samples = log.find ("samples")

if samples is None:
    samples = empty_element

for sample in samples.iterfind ("sample"):
    backtrace = sample.find ("backtrace")

    if backtrace is None:
        continue

    for thread in backtrace.iterfind ("thread"):
        running = int (thread.get ("running"))

        frame = thread.find ("frame")

        # Threads without any frame don't contribute to the histogram
        if frame is not None:
            address = frame.get ("address")

            states = address_states.setdefault (address, [0, 0])

            states[running] += 1

# Find maximal states
#
# Reduce each histogram entry to the index of its most frequent state, and
# drop the addresses that were seen too rarely, or whose most frequent
# state is not dominant enough.  Iterate over a copy of the items, since
# the dictionary is modified along the way.
for address, counts in list (address_states.items ()):
    total = sum (counts)

    # max () returns the first maximal item, so ties go to the lowest state
    dominant = max (range (len (counts)), key = counts.__getitem__)

    if (total >= DEDUCE_MIN_N_OCCURRENCES and
        counts[dominant] / total >= DEDUCE_MIN_PERCENTAGE):
        address_states[address] = dominant
    else:
        del address_states[address]

# Replace thread states
#
# Overwrite the "running" attribute of every thread whose first <frame>
# address still has an entry in address_states.
#
# The results of find () are compared against None explicitly: testing the
# truth value of an Element is deprecated (it emits a DeprecationWarning as
# of Python 3.12).
samples = log.find ("samples")

if samples is None:
    samples = empty_element

for sample in samples.iterfind ("sample"):
    backtrace = sample.find ("backtrace")

    if backtrace is None:
        continue

    for thread in backtrace.iterfind ("thread"):
        frame = thread.find ("frame")

        if frame is None:
            continue

        running = address_states.get (frame.get ("address"))

        # Addresses without an entry keep their recorded state
        if running is not None:
            thread.set ("running", str (running))

# Write performance log to STDOUT
#
# The tree is serialized to bytes, which are written to the underlying
# binary stream as-is.
serialized_log = ElementTree.tostring (log)

sys.stdout.buffer.write (serialized_log)