oleksandrfluxon
committed on
Commit
•
64acb26
1
Parent(s):
6ee6fc5
Update pipeline.py
Browse files- pipeline.py +1 -2
pipeline.py
CHANGED
@@ -25,8 +25,7 @@ class PreTrainedPipeline():
|
|
25 |
# torch_dtype=torch.bfloat16, # Load model weights in bfloat16
|
26 |
torch_dtype=torch.float16,
|
27 |
trust_remote_code=True,
|
28 |
-
device_map="auto",
|
29 |
-
revision="pr/47",
|
30 |
load_in_8bit=True # Load model in the lowest 4-bit precision quantization
|
31 |
)
|
32 |
# model.to('cuda')
|
|
|
25 |
# torch_dtype=torch.bfloat16, # Load model weights in bfloat16
|
26 |
torch_dtype=torch.float16,
|
27 |
trust_remote_code=True,
|
28 |
+
device_map="auto",
|
|
|
29 |
load_in_8bit=True # Load model in the lowest 4-bit precision quantization
|
30 |
)
|
31 |
# model.to('cuda')
|