summaryrefslogtreecommitdiff
path: root/Meta/check-emoji.py
blob: ae8e7ace85ff285eaba6ea13314c7b91f6f93219 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
#!/usr/bin/env python3

import os
import re
import sys

RE_INVALID_CHAR = re.compile('[^A-FU0-9+_]')
RE_MISSING_UNDERSCORE = re.compile('[^_]U')
RE_MISSING_LETTER_U = re.compile('_(?!U)')
RE_MISSING_SIGN_PLUS = re.compile('U(?!\\+)')


def any_problems_here():
    found_invalid_filenames = False
    for filename in os.listdir():
        if not filename.endswith('.png'):
            print(f'Non-png file {filename} does not belong in the emoji directory')
            found_invalid_filenames = True
            break
        filename = filename[:-len('.png')]
        if RE_INVALID_CHAR.search(filename):
            print(f'Filename {filename}.png contains invalid characters in its filename. Only uppercase letters'
                  ' A-F and U, numbers, +, and _ should be used.')
            found_invalid_filenames = True
            break
        if 'U+0' in filename:
            print(f'Filename {filename}.png contains codepoint(s) with leading zeros. Leading zeros should be'
                  ' removed from codepoint(s).')
            found_invalid_filenames = True
            break
        if '+U' in filename:
            print(f'Filename {filename}.png is incorrectly named. "_" should be used as a separator between'
                  ' codepoints, not "+".')
            found_invalid_filenames = True
            break
        if RE_MISSING_UNDERSCORE.search(filename):
            print(f'Filename {filename}.png is missing an underscore "_" between codepoints.')
            found_invalid_filenames = True
            break
        if RE_MISSING_LETTER_U.search(filename):
            print(f'Filename {filename}.png is either missing a "U" to indicate the start of a codepoint,'
                  ' or has a spurious underscore ("_").')
            found_invalid_filenames = True
            break
        if RE_MISSING_SIGN_PLUS.search(filename):
            print(f'Filename {filename}.png is either missing a "+" after a "U", or has a spurious "U".')
            found_invalid_filenames = True
            break
        if 'U+FE0F' in filename:
            print(f'Filename {filename}.png should not include any emoji presentation selectors. U+FE0F codepoints'
                  ' should be removed from the filename.')
            found_invalid_filenames = True
            break

        code_points = [int(code_point[len('U+'):], 16) for code_point in filename.split('_')]

        if any(code_point > 0x10ffff for code_point in code_points):
            print(f'Filename {filename}.png contains a code point exceeding U+10FFFF')
            found_invalid_filenames = True
            break

    return found_invalid_filenames


if __name__ == '__main__':
    os.chdir(os.path.dirname(__file__) + "/../Base/res/emoji/")
    if any_problems_here():
        sys.exit(1)