Skip to content

Commit

Permalink
Increase Exception specificity for invalid model paths
Browse files Browse the repository at this point in the history
Signed-off-by: Khaled Sulayman <[email protected]>
  • Loading branch information
khaledsulayman committed Nov 13, 2024
1 parent cca058f commit 2a1a0cc
Show file tree
Hide file tree
Showing 2 changed files with 8 additions and 7 deletions.
2 changes: 1 addition & 1 deletion src/instructlab/sdg/utils/chunkers.py
Original file line number Diff line number Diff line change
Expand Up @@ -329,7 +329,7 @@ def create_tokenizer(model_name: Optional[str]):
)

else:
raise Exception(f"Received path to invalid model format {model_path}")
raise ValueError(f"Received path to invalid model format {model_path}")

logger.info(f"Successfully loaded tokenizer from: {model_path}")
return tokenizer
Expand Down
13 changes: 7 additions & 6 deletions tests/test_chunkers.py
Original file line number Diff line number Diff line change
Expand Up @@ -98,13 +98,14 @@ def test_create_tokenizer(tokenizer_model_name):


@pytest.mark.parametrize(
"model_name",
"model_name, expected_exception",
[
os.path.join(TEST_DATA_DIR, "models/invalid_gguf.gguf"),
os.path.join(TEST_DATA_DIR, "models/invalid_safetensors_dir/"),
os.path.join(TEST_DATA_DIR, "bad_path)"),
(os.path.join(TEST_DATA_DIR, "models/invalid_gguf.gguf"), ValueError),
(os.path.join(TEST_DATA_DIR, "models/invalid_safetensors_dir/"), ValueError),
(os.path.join(TEST_DATA_DIR, "bad_path)"), FileNotFoundError),
]
)
def test_invalid_tokenizer(model_name):
with pytest.raises(Exception):
def test_invalid_tokenizer(model_name, expected_exception):
# FileNotFoundError is expected for the nonexistent path; ValueError for invalid model formats.
with pytest.raises(expected_exception):
ContextAwareChunker.create_tokenizer(model_name)

0 comments on commit 2a1a0cc

Please sign in to comment.