|
1 | 1 | from pathlib import Path |
2 | 2 |
|
| 3 | +import pytest |
3 | 4 | import torch |
4 | | -from transformers import AutoModelForCausalLM |
| 5 | +from transformers import AutoModelForCausalLM, PreTrainedModel |
5 | 6 |
|
6 | 7 | from modalities.config.config import load_app_config_dict |
7 | 8 | from modalities.conversion.gpt2.conversion_model import check_converted_model |
8 | 9 | from modalities.conversion.gpt2.convert_gpt2 import convert_gpt2 |
| 10 | +from modalities.models.gpt2.gpt2_model import GPT2LLM |
9 | 11 | from modalities.models.utils import ModelTypeEnum, get_model_from_config |
10 | 12 | from tests.conversion.gpt2.helper import check_same_weight_model |
11 | 13 |
|
12 | 14 |
|
def test_converting_gpt2_does_not_change_weights(converted_model: PreTrainedModel, original_model: GPT2LLM):
    """The converted Hugging Face model must carry exactly the same weights as the source model."""
    check_same_weight_model(converted_model, original_model)
20 | 17 |
|
21 | 18 |
|
def test_converting_gpt2_does_not_change_outputs(
    converted_model: PreTrainedModel, original_model: GPT2LLM, vocab_size: int
):
    """A forward pass through the converted model must reproduce the original model's outputs."""
    check_converted_model(
        hf_model=converted_model,
        modalities_model=original_model,
        num_testruns=1,
        vocab_size=vocab_size,
    )
| 25 | + |
| 26 | + |
@pytest.fixture
def converted_model(run_convert_gpt2: None, output_dir: Path) -> PreTrainedModel:
    """Load the converted Hugging Face checkpoint written by the conversion step.

    The `run_convert_gpt2` parameter is a pure ordering dependency: requesting it
    guarantees the conversion has populated `output_dir` before we load from it.
    """
    model = AutoModelForCausalLM.from_pretrained(output_dir, local_files_only=True, trust_remote_code=True)
    # NOTE(review): the bfloat16 cast now applies to the weight-equality test as
    # well, which previously loaded the model in its default dtype — presumably
    # equivalent for this checkpoint; confirm against check_same_weight_model.
    return model.to(dtype=torch.bfloat16)
| 32 | + |
| 33 | + |
@pytest.fixture
def run_convert_gpt2(gpt2_config_path: str, output_dir: Path) -> None:
    """Run the GPT-2 conversion once, writing the HF checkpoint into `output_dir`."""
    convert_gpt2(gpt2_config_path, output_dir)
| 37 | + |
| 38 | + |
@pytest.fixture
def original_model(gpt2_config_path: str) -> GPT2LLM:
    """Instantiate the unconverted modalities GPT-2 model from the test config."""
    app_config = load_app_config_dict(gpt2_config_path)
    return get_model_from_config(app_config, model_type=ModelTypeEnum.CHECKPOINTED_MODEL)
| 43 | + |
| 44 | + |
@pytest.fixture
def vocab_size(gpt2_config_path: str) -> int:
    """Read the vocabulary size from the model section of the test config.

    Configs may name the model section either "model_raw" or "model";
    "model_raw" takes precedence when both are present.
    """
    app_config = load_app_config_dict(gpt2_config_path)
    model_section = "model_raw" if "model_raw" in app_config else "model"
    return app_config[model_section]["config"]["vocab_size"]
| 49 | + |
| 50 | + |
@pytest.fixture
def output_dir(tmp_path: Path) -> Path:
    """Per-test directory that receives the converted checkpoint artifacts."""
    return tmp_path.joinpath("output")
0 commit comments