Add dtype parameter to model tests; rename "float32" dtype key to "float"

vllm-project · WoosukKwon · Sep 1, 2023 · Aug 22, 2023 · Aug 22, 2023 · Aug 22, 2023
commit ac04105cdc88def7247cf81ec983f3449936ded5
diff --git a/tests/conftest.py b/tests/conftest.py
@@ -27,7 +27,7 @@ def example_prompts() -> List[str]:
 _STR_DTYPE_TO_TORCH_DTYPE = {
     "half": torch.half,
     "bfloat16": torch.bfloat16,
-    "float32": torch.float,
+    "float": torch.float,
 }
 
 

@@ -18,19 +18,21 @@
 
 
 @pytest.mark.parametrize("model", MODELS)
+@pytest.mark.parametrize("dtype", ["half"])
 @pytest.mark.parametrize("max_tokens", [128])
 def test_models(
     hf_runner,
     vllm_runner,
     example_prompts,
     model: str,
+    dtype: str,
     max_tokens: int,
 ) -> None:
-    hf_model = hf_runner(model)
+    hf_model = hf_runner(model, dtype=dtype)
     hf_outputs = hf_model.generate_greedy(example_prompts, max_tokens)
     del hf_model
 
-    vllm_model = vllm_runner(model)
+    vllm_model = vllm_runner(model, dtype=dtype)
     vllm_outputs = vllm_model.generate_greedy(example_prompts, max_tokens)
     del vllm_model