Work on MODELS.md
This commit is contained in:
16
MODELS.md
Normal file
16
MODELS.md
Normal file
@@ -0,0 +1,16 @@
|
|||||||
|
# Models
|
||||||
|
|
||||||
|
## Results for Model paraphrase-multilingual-MiniLM-L12-v2 ##
|
||||||
|
|
||||||
|
(FOLYProp and FOLYFeet have been omitted from the dataset.)
|
||||||
|
|
||||||
|
| | n | pct |
|
||||||
|
|--------------------------------|------|--------|
|
||||||
|
| Total records in sample: | 2335 | |
|
||||||
|
| Top Result: | 415 | 17.77% |
|
||||||
|
| Top 5 Result: | 545 | 23.34% |
|
||||||
|
| Top 10 Result: | 419 | 17.94% |
|
||||||
|
| | | |
|
||||||
|
| UCS category count: | 752 | |
|
||||||
|
| Total categories in sample: | 238 | 31.65% |
|
||||||
|
| Most missed category (BLLTBy): | 140 | 6.00% |
|
32
MODELS.rst
32
MODELS.rst
@@ -1,32 +0,0 @@
|
|||||||
Results for Model paraphrase-multilingual-mpnet-base-v2
|
|
||||||
=====
|
|
||||||
|
|
||||||
================================ ==== ======
|
|
||||||
.. n pct
|
|
||||||
================================ ==== ======
|
|
||||||
Total records in sample: 3445
|
|
||||||
Top Result: 469 13.61%
|
|
||||||
Top 5 Result: 519 15.07%
|
|
||||||
Top 10 Result: 513 14.89%
|
|
||||||
================================ ==== ======
|
|
||||||
UCS category count: 752
|
|
||||||
Total categories in sample: 240 31.91%
|
|
||||||
Most missed category (FOLYProp): 1057 30.68%
|
|
||||||
================================ ==== ======
|
|
||||||
|
|
||||||
|
|
||||||
Results for Model paraphrase-multilingual-MiniLM-L12-v2
|
|
||||||
=====
|
|
||||||
|
|
||||||
================================ ==== ======
|
|
||||||
.. n pct
|
|
||||||
================================ ==== ======
|
|
||||||
Total records in sample: 3445
|
|
||||||
Top Result: 418 12.13%
|
|
||||||
Top 5 Result: 559 16.23%
|
|
||||||
Top 10 Result: 433 12.57%
|
|
||||||
================================ ==== ======
|
|
||||||
UCS category count: 752
|
|
||||||
Total categories in sample: 240 31.91%
|
|
||||||
Most missed category (FOLYProp): 1047 30.39%
|
|
||||||
================================ ==== ======
|
|
@@ -68,7 +68,9 @@ def finetune():
|
|||||||
@ucsinfer.command('evaluate')
|
@ucsinfer.command('evaluate')
|
||||||
@click.option('--offset', type=int, default=0)
|
@click.option('--offset', type=int, default=0)
|
||||||
@click.option('--limit', type=int, default=-1)
|
@click.option('--limit', type=int, default=-1)
|
||||||
@click.option('--no-foley', type=bool, default=False)
|
@click.option('--no-foley', 'no_foley', flag_value=True, default=False,
|
||||||
|
help="Ignore any data in the set with FOLYProp or FOLYFeet "
|
||||||
|
"category")
|
||||||
@click.option('--model', type=str,
|
@click.option('--model', type=str,
|
||||||
default="paraphrase-multilingual-mpnet-base-v2")
|
default="paraphrase-multilingual-mpnet-base-v2")
|
||||||
@click.argument('dataset', type=click.File('r', encoding='utf8'),
|
@click.argument('dataset', type=click.File('r', encoding='utf8'),
|
||||||
@@ -90,6 +92,9 @@ def evaluate(dataset, offset, limit, model, no_foley):
|
|||||||
break
|
break
|
||||||
|
|
||||||
cat_id, description = row
|
cat_id, description = row
|
||||||
|
if no_foley and cat_id in ['FOLYProp', 'FOLYFeet']:
|
||||||
|
continue
|
||||||
|
|
||||||
guesses = ctx.classify_text_ranked(description, limit=10)
|
guesses = ctx.classify_text_ranked(description, limit=10)
|
||||||
if cat_id == guesses[0]:
|
if cat_id == guesses[0]:
|
||||||
results.append({'catid': cat_id, 'result': "TOP"})
|
results.append({'catid': cat_id, 'result': "TOP"})
|
||||||
@@ -116,8 +121,10 @@ def evaluate(dataset, offset, limit, model, no_foley):
|
|||||||
|
|
||||||
miss_counts = sorted(miss_counts, key=lambda x: x[1])
|
miss_counts = sorted(miss_counts, key=lambda x: x[1])
|
||||||
|
|
||||||
print(f"Results for Model {model}")
|
print(f"## Results for Model {model} ##")
|
||||||
print("=====\n")
|
|
||||||
|
if no_foley:
|
||||||
|
print("(FOLYProp and FOLYFeet have been omitted from the dataset.)\n")
|
||||||
|
|
||||||
table = [
|
table = [
|
||||||
["Total records in sample:", f"{total}"],
|
["Total records in sample:", f"{total}"],
|
||||||
@@ -136,7 +143,7 @@ def evaluate(dataset, offset, limit, model, no_foley):
|
|||||||
f"{float(miss_counts[-1][1])/float(total):.2%}"]
|
f"{float(miss_counts[-1][1])/float(total):.2%}"]
|
||||||
]
|
]
|
||||||
|
|
||||||
print(tabulate(table, headers=['', 'n', 'pct'], tablefmt='rst'))
|
print(tabulate(table, headers=['', 'n', 'pct'], tablefmt='github'))
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
|
Reference in New Issue
Block a user