|
@@ -7,7 +7,7 @@ import torch
|
|
from transformers import BitsAndBytesConfig
|
|
from transformers import BitsAndBytesConfig
|
|
|
|
|
|
@dataclass
|
|
@dataclass
|
|
-class quantizatio_config:
|
|
|
|
|
|
+class quantization_config:
|
|
quant_type: str # "int4" or "int8"
|
|
quant_type: str # "int4" or "int8"
|
|
compute_dtype: torch.dtype
|
|
compute_dtype: torch.dtype
|
|
use_double_quant: bool = False
|
|
use_double_quant: bool = False
|