From 7fcac7861981be15c9ad00d900bd7afe117f3d20 Mon Sep 17 00:00:00 2001
From: youkaichao
Date: Thu, 18 Jul 2024 13:16:16 -0700
Subject: [PATCH] add quantization tests

---
 tests/basic_correctness/test_cpu_offload.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/tests/basic_correctness/test_cpu_offload.py b/tests/basic_correctness/test_cpu_offload.py
index a5df5639cf948..3ab01d52277d7 100644
--- a/tests/basic_correctness/test_cpu_offload.py
+++ b/tests/basic_correctness/test_cpu_offload.py
@@ -4,3 +4,5 @@
 def test_cpu_offload():
     compare_two_settings("meta-llama/Llama-2-7b-hf", [],
                          ["--cpu-offload-gb", "4"])
+    compare_two_settings("nm-testing/llama7b-one-shot-2_4-w4a16-marlin24-t",
+                         [], ["--cpu-offload-gb", "1"])