# nheko/scripts/emoji_codegen.py
# (web-view residue: 104 lines, 2.8 KiB, Python; Raw / Permalink / Normal View / History)
# blame: 2017-04-23 20:31:08 +02:00
#!/usr/bin/env python3
import sys
# blame: 2020-01-24 04:18:14 +01:00
import re
# blame: 2017-04-23 20:31:08 +02:00
from jinja2 import Template
class Emoji:
    """One emoji entry destined for the generated C++ tables.

    Attributes:
        code: the emoji's UTF-8 encoding written as escaped text (for
            example ``\\xf0\\x9f\\x98\\x80``), ready to be pasted between
            the double quotes of a C++ string literal.
        shortname: the emoji's name, stored unchanged.
    """

    def __init__(self, code, shortname):
        # repr() of a bytes object is always b'<escaped>' or b"<escaped>".
        # Slicing off the two-character prefix and the closing quote keeps
        # only the escaped payload, whichever quote style repr() picked and
        # without touching quote characters that belong to the payload.
        self.code = repr(code.encode('utf-8'))[2:-1]
        self.shortname = shortname
def generate_code(emojis, category):
    """Print the C++ definition of ``emoji::Provider::<category>``.

    Args:
        emojis: iterable of objects exposing ``code`` and ``shortname``
            attributes; one ``Emoji{...}`` initializer is emitted per item.
        category: category name used verbatim as the member name; its
            ``capitalize()``d form is used for the leading comment and the
            ``emoji::EmojiCategory`` enumerator.

    The rendered text is written to stdout; nothing is returned.
    """
    # ``{%-`` strips the whitespace before each tag, so every initializer
    # ends up on its own line without blank lines in between.
    tmpl = Template('''
const std::vector<Emoji> emoji::Provider::{{ category }} = {
// {{ category.capitalize() }}
{%- for e in emoji %}
Emoji{QString::fromUtf8("{{ e.code }}"), "{{ e.shortname }}", emoji::EmojiCategory::{{ category.capitalize() }}},
{%- endfor %}
};
''')
    print(tmpl.render(category=category, emoji=emojis))
def generate_qml_list(**kwargs):
    """Print the C++ definition of the combined ``emoji::Provider::emoji``.

    Args:
        **kwargs: one keyword per category. The keyword name is the
            category name (its ``capitalize()``d form becomes the comment
            and the ``emoji::EmojiCategory`` enumerator); the value is an
            iterable of objects exposing ``code`` and ``shortname``.

    Categories are emitted in the order the keywords were passed. The
    rendered text is written to stdout; nothing is returned.
    """
    tmpl = Template('''
const QVector<Emoji> emoji::Provider::emoji = {
{%- for name, emojis in categories.items() %}
// {{ name.capitalize() }}
{%- for e in emojis %}
Emoji{QString::fromUtf8("{{ e.code }}"), "{{ e.shortname }}", emoji::EmojiCategory::{{ name.capitalize() }}},
{%- endfor %}
{%- endfor %}
};
''')
    print(tmpl.render(categories=kwargs))
# blame: 2017-04-23 20:31:08 +02:00
if __name__ == '__main__':
    # Script entry point: read the emoji test file named on the command
    # line, bucket its entries per category and print the generated C++.
    if len(sys.argv) < 2:
        # stdout carries the generated code, so the usage text goes to stderr.
        print('usage: emoji_codegen.py /path/to/emoji-test.txt',
              file=sys.stderr)
        sys.exit(1)
    filename = sys.argv[1]

    people = []
    nature = []
    food = []
    activity = []
    travel = []
    objects = []
    symbols = []
    flags = []

    # Maps the "# group:" headings of the input file to the output lists.
    # Two headings intentionally share the ``people`` list.
    categories = {
        'Smileys & Emotion': people,
        'People & Body': people,
        'Animals & Nature': nature,
        'Food & Drink': food,
        'Travel & Places': travel,
        'Activities': activity,
        'Objects': objects,
        'Symbols': symbols,
        'Flags': flags,
    }

    # Compiled once instead of on every line.
    field_separator = re.compile(r'\s+[#;] ')
    char_and_name = re.compile(r'^(\S+) E\d+\.\d+ (.*)$')

    current_category = ''
    # Explicit UTF-8 so the emoji characters are read independently of the
    # platform's default encoding; ``with`` guarantees the file is closed.
    with open(filename, 'r', encoding='utf-8') as emoji_test:
        for line in emoji_test:
            # A group heading switches the active category; it is itself a
            # comment line and is skipped by the check below.
            if line.startswith('# group:'):
                current_category = line.split(':', 1)[1].strip()
            if not line or line.startswith('#'):
                continue

            # A data line splits into exactly three fields on " ; " / " # ":
            # code points, qualification, "<char> E<version> <name>".
            segments = field_separator.split(line.strip())
            if len(segments) != 3:
                continue
            code, qualification, charAndName = segments

            # skip fully qualified versions of same unicode
            if code.endswith('FE0F'):
                continue

            if qualification == 'component':
                continue

            parsed = char_and_name.match(charAndName)
            if parsed is None:
                # Report the entry instead of dying with an AttributeError
                # on ``None.groups()``.
                print('warning: skipping unparsable entry: ' + charAndName,
                      file=sys.stderr)
                continue
            char, name = parsed.groups()

            # An unknown group name raises KeyError here on purpose: the
            # ``categories`` table above then needs a new entry.
            categories[current_category].append(Emoji(char, name))

    # Use xclip to pipe the output to clipboard.
    # e.g. ./emoji_codegen.py emoji-test.txt | xclip -sel clip
    generate_code(people, 'people')
    generate_code(nature, 'nature')
    generate_code(food, 'food')
    generate_code(activity, 'activity')
    generate_code(travel, 'travel')
    generate_code(objects, 'objects')
    generate_code(symbols, 'symbols')
    generate_code(flags, 'flags')
    generate_qml_list(
        people=people,
        nature=nature,
        food=food,
        activity=activity,
        travel=travel,
        objects=objects,
        symbols=symbols,
        flags=flags,
    )