diff --git a/json/en.json b/json/en.json
index da7e8a0..756e6dc 100644
--- a/json/en.json
+++ b/json/en.json
@@ -12550,7 +12550,6 @@
         "CatShort": "GAME",
         "Explanations": "Game sounds not fitting another category in this list. Cards would go here. Jenga.",
         "Synonyms": [
-            "a",
             "bag",
             "ball",
             "balloon",
@@ -22234,7 +22233,6 @@
         "CatShort": "VEH",
         "Explanations": "Very old vehicles, such a Model A, Model T. Mainly cars, but possible other very old vehicles, trucks, tractors.",
         "Synonyms": [
-            "a",
             "antique",
             "austin",
             "auto",
@@ -23550,7 +23548,6 @@
         "CatShort": "VOX",
         "Explanations": "A single voice singing, a child singing. For a crowd, use CROWDS-SINGING",
         "Synonyms": [
-            "a",
             "cappella",
             "caroling",
             "chanting",
diff --git a/tools/ucsxls2json.py b/tools/ucsxls2json.py
index cad6dcc..b2f985c 100644
--- a/tools/ucsxls2json.py
+++ b/tools/ucsxls2json.py
@@ -85,6 +85,18 @@ for lang in langs:
         split_pattern = r'\W+'
         syn_list = re.split(split_pattern, syns_raw)
         category['Synonyms'] = [s.lower() for s in syn_list]
+
+        # if the sub-category name is not in the synonym list, include it
+        # if category['SubCategory'].lower() not in category['Synonyms']:
+        #     category['Synonyms'].append(category['SubCategory'].lower())
+
+        if lang == 'en':
+            # Drop the article "a" from the English synonyms. Rebuild the
+            # list instead of deleting while enumerating it: an in-loop
+            # `del` shifts later items left and skips the next element.
+            category['Synonyms'] = [
+                syn for syn in category['Synonyms'] if syn != "a"
+            ]
 
         schedule.append(category)
 