summaryrefslogtreecommitdiffstats
path: root/third_party/python/fluent.migrate/fluent/migrate/changesets.py
blob: e68717555038087d0414ad01ca5573f968b27217 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
from __future__ import annotations
from typing import Set, Tuple, TypedDict

import time

from .blame import BlameResult

Changes = Set[Tuple[str, str]]


class Changeset(TypedDict):
    author: str
    first_commit: float
    changes: Changes


def by_first_commit(item: Changeset):
    """Order two changesets by their first commit date."""
    return item["first_commit"]


def convert_blame_to_changesets(blame_json: BlameResult) -> list[Changeset]:
    """Convert a blame dict into a list of changesets.

    The blame information in `blame_json` should be a dict of the following
    structure:

        {
            'authors': [
                'A.N. Author <author@example.com>',
            ],
            'blame': {
                'path/one': {
                    'key1': [0, 1346095921.0],
                },
            }
        }

    It will be transformed into a list of changesets which can be fed into
    `InternalContext.serialize_changeset`:

        [
            {
                'author': 'A.N. Author <author@example.com>',
                'first_commit': 1346095921.0,
                'changes': {
                    ('path/one', 'key1'),
                }
            },
        ]

    """
    now = time.time()
    changesets: list[Changeset] = [
        {"author": author, "first_commit": now, "changes": set()}
        for author in blame_json["authors"]
    ]

    for path, keys_info in blame_json["blame"].items():
        for key, (author_index, timestamp) in keys_info.items():
            changeset = changesets[author_index]
            changeset["changes"].add((path, key))
            if timestamp < changeset["first_commit"]:
                changeset["first_commit"] = timestamp

    return sorted(changesets, key=by_first_commit)