Skip to content

Commit

Permalink
update model names
Browse files: browse the repository at this point in the history
  • Loading branch information
dsikka committed Jun 7, 2024
1 parent fb1b863 commit aec7c82
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions tests/quantization/test_compressed_tensors.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -11,7 +11,7 @@


def test_compressed_tensors_w8a8_static_setup(vllm_runner):
model_path = "nm-testing/tinyllama-one-shot-static-quant-test-compressed"
model_path = "nm-testing/tinyllama-oneshot-w8a8-static-v2"
llm = vllm_runner(model_path,
quantization="compressed-tensors",
enforce_eager=True)
Expand Down Expand Up @@ -40,9 +40,9 @@ def test_compressed_tensors_w8a8_static_setup(vllm_runner):


def test_compressed_tensors_w8a8_dynanmic_per_token(vllm_runner):
model_path = "nm-testing/tinyllama-one-shot-dynamic-test"
model_path = "nm-testing/tinyllama-oneshot-w8a8-dynamic-token-v2"
llm = vllm_runner(model_path,
quantization="sparseml",
quantization="compressed-tensors",
enforce_eager=True,
dtype=torch.float16)
model = llm.model.llm_engine.model_executor.driver_worker.model_runner.model
Expand Down

0 comments on commit aec7c82

Please sign in to comment.