From 9dec218c664f2e93fca9fd8d9c10845ec52f10c9 Mon Sep 17 00:00:00 2001 From: Michael Goin Date: Tue, 23 Jul 2024 18:45:12 -0400 Subject: [PATCH] [CI] Add smoke test for non-uniform AutoFP8 quantization (#6702) --- tests/quantization/test_fp8.py | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/quantization/test_fp8.py b/tests/quantization/test_fp8.py index 82dc775f8d812..0602fedf0b8e3 100644 --- a/tests/quantization/test_fp8.py +++ b/tests/quantization/test_fp8.py @@ -13,6 +13,7 @@ MODELS = [ "neuralmagic/Meta-Llama-3-8B-Instruct-FP8-KV", "nm-testing/Phi-3-mini-128k-instruct-FP8", + "nm-testing/Qwen2-0.5B-Instruct-FP8-SkipQKV", ]