1 parent 24a3b57 commit 58ca798
tests/quantization/test_compressed_tensors.py
@@ -160,11 +160,4 @@ def test_compressed_tensors_kv_cache(vllm_runner):
     model_path = "nm-testing/TinyLlama-1.1B-compressed-tensors-kv-cache-scheme"
     with vllm_runner(model_path, kv_cache_dtype="fp8") as llm:
         output = llm.generate_greedy("Hello world!", max_tokens=20)
-    assert output
-
-
-def test_compressed_tensors_fused_moe(vllm_runner):
-    model_path = "nm-testing/Mixtral-8x7B-Instruct-v0.1-W4A16-channel-quantized"
-    with vllm_runner(model_path) as llm:
-        output = llm.generate_greedy("Hello world!", max_tokens=20)
-    assert output
+        assert output
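For orientation, the kv-cache test after this hunk applies would read roughly as in the sketch below. This is a reconstruction from the diff only: the original indentation of the re-added assert and anything outside the hunk (imports, decorators, other tests in tests/quantization/test_compressed_tensors.py) are assumptions, not part of this commit view.

# Reconstructed post-commit state of the kv-cache test (sketch, not verbatim source).
# vllm_runner is the pytest fixture used throughout this test file.
def test_compressed_tensors_kv_cache(vllm_runner):
    model_path = "nm-testing/TinyLlama-1.1B-compressed-tensors-kv-cache-scheme"
    # Load the model with an fp8 KV cache and run a short greedy generation.
    with vllm_runner(model_path, kv_cache_dtype="fp8") as llm:
        output = llm.generate_greedy("Hello world!", max_tokens=20)
        # Only checks that generation produced something, not its content.
        assert output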