anki/ftl/extract-strings.py

33 lines
1.0 KiB
Python
Raw Normal View History

2020-11-19 02:26:09 +01:00
#!/usr/bin/env python3
# -*- coding: UTF-8 -*-
"""
Tool to extract core strings and keys from .ftl files.
"""
import os
import json
import glob
from fluent.syntax import parse
from fluent.syntax.serializer import serialize_element
from fluent.syntax.ast import Junk
root = os.environ["BUILD_WORKSPACE_DIRECTORY"]
ftl_files = glob.glob(os.path.join(root, "ftl", "core", "*.ftl"), recursive=True)
keys_by_value = {}
for path in ftl_files:
obj = parse(open(path).read(), with_spans=False)
for ent in obj.body:
if isinstance(ent, Junk):
raise Exception(f"file had junk! {path} {ent}")
if getattr(ent, "id", None):
key = ent.id.name
val = "".join(serialize_element(elem) for elem in ent.value.elements)
if val in keys_by_value:
print("duplicate found:", keys_by_value[val], key)
keys_by_value.setdefault(val, []).append(key)
json.dump(keys_by_value, open(os.path.join(root, "keys_by_value.json"), "w"))
print("keys:", len(keys_by_value))