From a49a2f093373bdea0232507dec37ac426a312f7e Mon Sep 17 00:00:00 2001 From: Joshua Wendland <80349780+joshuawe@users.noreply.github.com> Date: Wed, 6 Mar 2024 08:54:56 +0100 Subject: [PATCH] remove pytest-dependency and associated code --- requirements.txt | 1 - tests/eval/test_token_labelling.py | 19 ++++++++++--------- 2 files changed, 10 insertions(+), 10 deletions(-) diff --git a/requirements.txt b/requirements.txt index 79e0af2a..8130d532 100644 --- a/requirements.txt +++ b/requirements.txt @@ -5,7 +5,6 @@ tqdm==4.66.1 ipywidgets==8.1.1 nbformat==5.9.2 pytest==7.4.4 -pytest-dependency==0.6.0 black==23.12.1 jaxtyping==0.2.25 beartype==0.16.4 diff --git a/tests/eval/test_token_labelling.py b/tests/eval/test_token_labelling.py index e566057b..3f850f74 100644 --- a/tests/eval/test_token_labelling.py +++ b/tests/eval/test_token_labelling.py @@ -141,7 +141,6 @@ def is_valid_structure(obj: dict[int, dict[str, bool]]) -> bool: return True -@pytest.mark.dependency() def test_label_tokens_from_tokenizer(): """ Simple test, checking if download of tokinzer and the labelling of all tokens in its vocabulary works. @@ -159,16 +158,18 @@ def test_label_tokens_from_tokenizer(): assert is_valid_structure(labelled_token_ids_dict) == True -@pytest.mark.dependency(depends=["test_label_tokens_from_tokenizer"]) @pytest.mark.parametrize("path", [Path("temp/token_labels.csv")]) def test_import_token_labels(path: Path): - global labelled_token_ids_dict - assert ( - labelled_token_ids_dict is not None - ), "It should be filled for the test to run. Check test-dependency." - assert ( - labelled_token_ids_dict != {} - ), "It should be filled for the test to run. Check test-dependency." + """ + Simple test, checking if the import of token labels works. + + Note: Because we want to use pure pytest and not install any extra dependencies (e.g. pytest-dependency) we recreate the `labelled_tokens_dict` in this test as we did in `test_label_tokens_from_tokenizer`. 
This duplication is not ideal, but it is the best quick-and-dirty solution for now. + """ + # create the labelled_token_ids_dict + model_name = "delphi-suite/delphi-llama2-100k" + tokenizer = AutoTokenizer.from_pretrained(model_name) + _, labelled_token_ids_dict = tl.label_tokens_from_tokenizer(tokenizer) + # create the path path.parent.mkdir(parents=True, exist_ok=True) # save the file