1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
|
#!/usr/bin/env python
from subprocess import check_output as run
from datetime import datetime
from itertools import groupby
from operator import itemgetter
import re
import magic
def authors(filename):
log = run(['git', 'log', '--follow',
'--date=short','--format=%aN%x09%ad', filename],
universal_newlines=True)
for line in log.splitlines():
author, date = line.split('\t')
if author != 'fix-copyright.py':
yield author, datetime.strptime(date, '%Y-%m-%d')
def new_copyright(filename, previous):
def f():
au = list(authors(filename))
alldates = map(itemgetter(1), au)
aup = sorted(au + map(lambda a: (a, None), previous), key=itemgetter(0))
for author, records in groupby(aup, itemgetter(0)):
dates = filter(None, map(itemgetter(1), records))
if not dates: dates = alldates
start = min(dates)
end = max(dates)
fmt = '{0}' if start.year == end.year else '{0}-{1}'
line = 'Copyright ' + fmt.format(start.year, end.year) + ' ' + author
key = (start, author)
yield key, line
return map(itemgetter(1), sorted(f()))
def fix_copyright(filename):
# Find copyright block in original file
prefix = set()
names = []
lines = []
with open(filename, 'r') as f:
content = list(f)
for i, line in enumerate(content[:15]):
m = re.match(r'^(?P<prefix>\W*)(\(c\))?\s*?copyright\s*(\(c\))?\s+\d{4}(\s*-\s*\d{4})?\s+(?P<name>.+?)\s*$', line, re.IGNORECASE)
if m:
d = m.groupdict()
prefix.add(d['prefix'])
lines.append(i)
names.append(d['name'].strip())
if len(prefix) != 1:
print 'Not found:', filename
return
prefix = list(prefix)[0]
print filename
new = iter(new_copyright(filename, names))
with open(filename, 'w') as f:
for i, line in enumerate(content):
if i in lines:
for repl in new:
print >>f, prefix + repl
else:
print >>f, line,
pass
def all_files():
ls = run(['git', 'ls-files'], universal_newlines=True)
for filename in ls.splitlines():
if magic.from_file(filename, mime=True).split('/')[0] == 'text':
yield filename
for f in all_files():
fix_copyright(f)
|