Update services/model_service.py
Browse files
services/model_service.py
CHANGED
@@ -42,7 +42,7 @@ class ModelService:
 settings.MODEL_NAME,
 torch_dtype=torch.float16 if quantization_device == "cuda" else torch.float32,
 device_map="auto" if quantization_device == "cuda" else None,
-
+# load_in_8bit=(quantization_bits == 8),
 trust_remote_code=True
 )
 logger.info(f"Model {settings.MODEL_NAME} loaded successfully on {quantization_device}.")