From f2dc0d8a7ba973f7238a7f3dde02616a6b0ea0bb Mon Sep 17 00:00:00 2001 From: Jamie Hardt Date: Sat, 8 Nov 2025 17:09:33 -0800 Subject: [PATCH] csv implementation --- pyproject.toml | 4 +++- ucsinfer/finetune.py | 3 +++ ucsinfer/import_csv.py | 3 ++- 3 files changed, 8 insertions(+), 2 deletions(-) create mode 100644 ucsinfer/finetune.py diff --git a/pyproject.toml b/pyproject.toml index 88ec063..b3bf9cd 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,7 +1,9 @@ [project] name = "ucsinfer" version = "0.1.0" -description = "Tools for applying UCS categories to sounds using large-language models" +description = """ +Tools for applying UCS categories to sounds using large-language models +""" authors = [ {name = "Jamie Hardt", email = "jamiehardt@me.com"} ] diff --git a/ucsinfer/finetune.py b/ucsinfer/finetune.py new file mode 100644 index 0000000..e967bb7 --- /dev/null +++ b/ucsinfer/finetune.py @@ -0,0 +1,3 @@ +from sentence_transformers import SentenceTransformerTrainingArguments + +args = SentenceTransformerTrainingArguments(output_dir="finetuned/") diff --git a/ucsinfer/import_csv.py b/ucsinfer/import_csv.py index 9a21318..01d0151 100644 --- a/ucsinfer/import_csv.py +++ b/ucsinfer/import_csv.py @@ -5,7 +5,8 @@ from typing import Generator from .util import parse_ucs -def csv_to_data(paths, description_key, filename_key, catid_list) -> Generator[tuple[str, str], None, None]: +def csv_to_data(paths, description_key, filename_key, catid_list) \ + -> Generator[tuple[str, str], None, None]: """ Accepts a list of paths and returns an iterator of (sentence, class) tuples.