fix memory check
Signed-off-by: jiqing-feng <[email protected]>
jiqing-feng committed Dec 20, 2024
1 parent f9e7e45 commit 99b5f14
Showing 1 changed file with 2 additions and 3 deletions.
5 changes: 2 additions & 3 deletions tests/quantization/gptq/test_gptq.py
@@ -89,7 +89,7 @@ class GPTQTest(unittest.TestCase):
     EXPECTED_OUTPUTS.add("Hello my name is Katie. I am a 20 year")
 
     # this seems a little small considering that we are doing 4bit quant but we have a small model and we don't quantize the embeddings
-    EXPECTED_RELATIVE_DIFFERENCE = 2.06184043
+    EXPECTED_RELATIVE_DIFFERENCE = 2.0618
 
     bits = 4
     sym = True
@@ -142,7 +142,7 @@ def test_memory_footprint(self):
 
         mem_quantized = self.quantized_model.get_memory_footprint()
 
-        self.assertAlmostEqual(self.mem_fp16 / mem_quantized, self.EXPECTED_RELATIVE_DIFFERENCE)
+        self.assertAlmostEqual(self.mem_fp16 / mem_quantized, self.EXPECTED_RELATIVE_DIFFERENCE, places=4)
 
     def test_device_and_dtype_assignment(self):
         r"""
@@ -271,7 +271,6 @@ def test_serialization_big_model_inference(self):
 
 @require_torch_gpu
 class GPTQTestCUDA(GPTQTest):
-    EXPECTED_RELATIVE_DIFFERENCE = 2.06183008
     device_map = {"": 0}
 
     @classmethod
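
For context: unittest's assertAlmostEqual defaults to places=7, so the previous check required the fp16/quantized memory ratio to match a hard-coded constant to within roughly 1e-7, which is why the CUDA subclass carried its own slightly different constant. Rounding the expectation to 2.0618 and passing places=4 relaxes the tolerance to about 5e-5, so one value can cover all backends. Below is a minimal standalone sketch of the relaxed comparison; the measured ratio is made up for illustration and is not taken from the commit.

import unittest


class MemoryRatioCheck(unittest.TestCase):
    """Illustrates the places=4 tolerance used in the updated memory check."""

    EXPECTED_RELATIVE_DIFFERENCE = 2.0618

    def test_ratio_within_four_places(self):
        # Hypothetical fp16/quantized memory ratio; it differs from the
        # expectation only in the fifth decimal place.
        measured_ratio = 2.061832

        # assertAlmostEqual(a, b, places=4) passes when round(a - b, 4) == 0,
        # i.e. the values agree to within roughly 5e-5. The default
        # (places=7) would reject this same ratio.
        self.assertAlmostEqual(measured_ratio, self.EXPECTED_RELATIVE_DIFFERENCE, places=4)


if __name__ == "__main__":
    unittest.main()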
