#!/usr/bin/python

import os, re, sys

def list_whence():
    """Yield every name referenced by the WHENCE file in the current directory.

    Three kinds of line contribute names:

    * ``File:`` / ``Source:`` followed by a double-quoted name -- the text
      between the quotes is yielded (so it may contain spaces).
    * ``File:`` / ``Source:`` followed by an unquoted name -- the first
      whitespace-delimited word is yielded.
    * ``Licence:`` / ``License:`` lines.  If the line ends with
      ``See <names> for details`` the names, separated by ``", "`` or
      ``" and "``, are yielded one by one.  Otherwise, if the value is a
      single word that does not contain "unknown" or "distributable"
      (case-insensitive), that word is yielded.

    All other lines are ignored.  Names are yielded in file order and are
    not de-duplicated.

    Raises whatever ``open`` raises if WHENCE cannot be read.
    """
    quoted_entry = re.compile(r'(?:File|Source):\s*"(.*)"')
    bare_entry = re.compile(r'(?:File|Source):\s*(\S*)')
    # Anchored with \s*$ rather than a literal newline so that a licence
    # entry on the last line of a file lacking a final newline (or a line
    # with CRLF / trailing blanks) is still recognised.
    licence_entry = re.compile(
        r'Licen[cs]e: (?:.*\bSee (.*) for details\.?|(\S*))\s*$')
    not_a_filename = re.compile(r'unknown|distributable', re.IGNORECASE)

    with open('WHENCE') as whence:
        for line in whence:
            # The quoted form must be tried first: the bare pattern would
            # also match it, but would keep the opening quote and stop at
            # the first space.
            match = quoted_entry.match(line) or bare_entry.match(line)
            if match:
                yield match.group(1)
                continue

            match = licence_entry.match(line)
            if not match:
                continue
            if match.group(1):
                for name in re.split(r', | and ', match.group(1)):
                    yield name
            elif match.group(2) and not not_a_filename.search(match.group(2)):
                # Just one word - may or may not be a filename
                yield match.group(2)

def list_git():
    """Yield each path printed by ``git ls-files``, one per output line.

    The command is started with ``os.popen`` in the current working
    directory.  The trailing newline is removed from every line, and the
    pipe is closed when the generator finishes.  The command's exit status
    is not inspected.
    """
    pipe = os.popen('git ls-files')
    with pipe:
        for raw_path in pipe:
            yield raw_path.rstrip('\n')

def main():
    """Cross-check the names in WHENCE against the files tracked by git.

    Writes one ``E:`` line to stderr for every name that WHENCE references
    but git does not track, and for every tracked file that WHENCE does not
    account for.  Names from WHENCE that end in ``/`` are treated as
    directory prefixes: any tracked file below such a prefix is accepted.

    Returns 0 when nothing was reported and 1 otherwise, so the result can
    be handed to ``sys.exit``.
    """
    whence_list = list(list_whence())
    known_files = set(name for name in whence_list if not name.endswith('/'))
    # These names are always treated as known, whether or not WHENCE
    # mentions them.
    known_files.update(('check_whence.py', 'configure', 'Makefile',
                        'README', 'copy-firmware.sh', 'WHENCE'))
    # A tuple so it can be passed straight to str.startswith below.
    known_prefixes = tuple(name for name in whence_list if name.endswith('/'))
    git_files = set(list_git())
    status = 0

    for name in sorted(known_files - git_files):
        sys.stderr.write('E: %s listed in WHENCE does not exist\n' % name)
        status = 1

    for name in sorted(git_files - known_files):
        # Ignore subdirectory changelogs
        if name.endswith('/ChangeLog'):
            continue
        # Ignore GPG detached signatures of known files
        if name.endswith('.asc') and name[:-4] in known_files:
            continue
        # Ignore unknown files in known directories
        if name.startswith(known_prefixes):
            continue
        sys.stderr.write('E: %s not listed in WHENCE\n' % name)
        status = 1

    return status


if __name__ == '__main__':
    # Propagate the check result so callers (make, CI) can detect failures.
    sys.exit(main())