diff --git a/neural_compressor/torch/quantization/config.py b/neural_compressor/torch/quantization/config.py
index 29f944b93e3..6eef8c76e8f 100644
--- a/neural_compressor/torch/quantization/config.py
+++ b/neural_compressor/torch/quantization/config.py
@@ -905,7 +905,7 @@ def __init__(
         enable_minmax_tuning: bool = True,
         lr: float = None,
         minmax_lr: float = None,
-        low_gpu_mem_usage: bool = True,
+        low_gpu_mem_usage: bool = False,
         iters: int = 200,
         seqlen: int = 2048,
         nsamples: int = 128,
@@ -938,7 +938,7 @@ def __init__(
             enable_minmax_tuning (bool): Whether to enable min-max tuning (default is True).
             lr (float): The learning rate (default is 0.005).
             minmax_lr (float): The learning rate for min-max tuning (default is None).
-            low_gpu_mem_usage (bool): Whether to use low GPU memory (default is True).
+            low_gpu_mem_usage (bool): Whether to use low GPU memory (default is False).
             iters (int): Number of iterations (default is 200).
             seqlen (int): Length of the sequence.
             nsamples (int): Number of samples (default is 512).