Removing "a" as a synonym from all categories in English

This commit is contained in:
Jamie Hardt
2024-10-31 20:08:10 -07:00
parent 32f17ca7b5
commit daa714a9b4
2 changed files with 9 additions and 3 deletions

View File

@@ -85,6 +85,15 @@ for lang in langs:
# Split the raw synonym text on runs of non-word characters and store the
# lower-cased pieces as this category's synonym list.
split_pattern = r'\W+'
syn_list = re.split(split_pattern, syns_raw)
category['Synonyms'] = [s.lower() for s in syn_list]
# if the sub-category name is not in the synonym list, include it
# if category['SubCategory'].lower() not in category['Synonyms']:
# category['Synonyms'].append(category['SubCategory'].lower())
if lang == 'en':
    # Remove every single-letter "a" entry from English synonym lists.
    # Build a new list instead of deleting while enumerating: an in-place
    # delete shifts the remaining items left, so the loop skips the entry
    # that follows each removal and back-to-back "a" entries would survive.
    category['Synonyms'] = [
        syn for syn in category['Synonyms'] if syn != "a"
    ]
schedule.append(category)