Update handler.py
Browse files
- handler.py +4 -4
handler.py
CHANGED
@@ -14,10 +14,10 @@ class EndpointHandler():
|
|
14 |
"bits": 4,
|
15 |
"group_size": 128,
|
16 |
"damp_percent": 0.01,
|
17 |
-
"desc_act":
|
18 |
-
"static_groups":
|
19 |
-
"sym":
|
20 |
-
"true_sequential":
|
21 |
})
|
22 |
# load the optimized model
|
23 |
model = AutoGPTQForCausalLM.from_quantized(path, device="cuda:0", quantize_config=quantize_config, use_safetensors=True) #file_name="model-quantized.onnx")
|
|
|
14 |
"bits": 4,
|
15 |
"group_size": 128,
|
16 |
"damp_percent": 0.01,
|
17 |
+
"desc_act": False,
|
18 |
+
"static_groups": False,
|
19 |
+
"sym": True,
|
20 |
+
"true_sequential": True
|
21 |
})
|
22 |
# load the optimized model
|
23 |
model = AutoGPTQForCausalLM.from_quantized(path, device="cuda:0", quantize_config=quantize_config, use_safetensors=True) #file_name="model-quantized.onnx")
|