kajdun committed on
Commit
46814d3
·
1 Parent(s): b5a0ba1

Update handler.py

Browse files
Files changed (1) hide show
  1. handler.py +4 -4
handler.py CHANGED
@@ -14,10 +14,10 @@ class EndpointHandler():
14
  "bits": 4,
15
  "group_size": 128,
16
  "damp_percent": 0.01,
17
- "desc_act": false,
18
- "static_groups": false,
19
- "sym": true,
20
- "true_sequential": true
21
  })
22
  # load the optimized model
23
  model = AutoGPTQForCausalLM.from_quantized(path, device="cuda:0", quantize_config=quantize_config, use_safetensors=True) #file_name="model-quantized.onnx")
 
14
  "bits": 4,
15
  "group_size": 128,
16
  "damp_percent": 0.01,
17
+ "desc_act": False,
18
+ "static_groups": False,
19
+ "sym": True,
20
+ "true_sequential": True
21
  })
22
  # load the optimized model
23
  model = AutoGPTQForCausalLM.from_quantized(path, device="cuda:0", quantize_config=quantize_config, use_safetensors=True) #file_name="model-quantized.onnx")