
[Quantization] Skip Fp4 Test for compressed-tensors #19217


Merged — 1 commit merged on Jun 5, 2025
1 change: 1 addition & 0 deletions — tests/quantization/test_compressed_tensors.py

@@ -651,6 +651,7 @@ def check_model(model):
assert output


@pytest.mark.skip(reason="Skip until the model config is updated")
Contributor


Severity: medium

The reason for skipping the test is clear at a high level, but could you make it more specific for future maintainability? For example, mentioning which model config is affected, or linking to a tracking issue (e.g., a GitHub issue or JIRA ticket), would make it easier to remember to re-enable this test once the underlying issue is resolved. This would also help someone else (or your future self) understand the context and know when to remove the skip.

Suggested change
@pytest.mark.skip(reason="Skip until the model config is updated")
@pytest.mark.skip(reason="Skip until 'nm-testing/TinyLlama-1.1B-Chat-v1.0-FP4' model config is updated for compatibility with the current compressed-tensors version. See issue #XYZ.")

def test_compressed_tensors_nvfp4a16(vllm_runner):
# run weight only example
model = "nm-testing/TinyLlama-1.1B-Chat-v1.0-FP4"
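For context, here is a minimal sketch (not part of this diff) of how a more specific skip reason surfaces in pytest output. The test name and the tracking-issue URL below are placeholders, not identifiers from this PR:

```python
# Illustrative only; the function name and issue URL are placeholders.
import pytest


@pytest.mark.skip(
    reason="nm-testing/TinyLlama-1.1B-Chat-v1.0-FP4 config incompatible with the "
    "current compressed-tensors release; see tracking issue <placeholder URL>"
)
def test_fp4_weight_only_placeholder():
    # The body never runs while the skip marker is present; pytest records the
    # reason string and reports it alongside the skipped test.
    assert True
```

Running `pytest -rs` prints the skip reason in the short test summary, so a reason that names the affected model and a tracking issue makes a stale skip easy to spot and remove once the config is fixed.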