Spaces:
Runtime error
Runtime error
CamiloVega
committed on
Update app.py
Browse files
app.py
CHANGED
@@ -70,13 +70,13 @@ class ModelManager:
|
|
70 |
self.model = AutoModelForCausalLM.from_pretrained(
|
71 |
model_name,
|
72 |
token=HUGGINGFACE_TOKEN,
|
73 |
-
device_map="auto",
|
74 |
-
torch_dtype=torch.float16,
|
75 |
-
low_cpu_mem_usage=True,
|
76 |
-
use_safetensors=True,
|
77 |
-
max_memory={0: "6GB"},
|
78 |
-
offload_folder="offload",
|
79 |
-
offload_state_dict=True
|
80 |
)
|
81 |
|
82 |
# Create pipeline with minimal settings
|
@@ -86,8 +86,8 @@ class ModelManager:
|
|
86 |
"text-generation",
|
87 |
model=self.model,
|
88 |
tokenizer=self.tokenizer,
|
89 |
-
device_map="auto",
|
90 |
-
torch_dtype=torch.float16,
|
91 |
max_new_tokens=512,
|
92 |
do_sample=True,
|
93 |
temperature=0.7,
|
|
|
70 |
self.model = AutoModelForCausalLM.from_pretrained(
|
71 |
model_name,
|
72 |
token=HUGGINGFACE_TOKEN,
|
73 |
+
device_map="auto",
|
74 |
+
torch_dtype=torch.float16,
|
75 |
+
low_cpu_mem_usage=True,
|
76 |
+
use_safetensors=True,
|
77 |
+
max_memory={0: "6GB"},
|
78 |
+
offload_folder="offload",
|
79 |
+
offload_state_dict=True
|
80 |
)
|
81 |
|
82 |
# Create pipeline with minimal settings
|
|
|
86 |
"text-generation",
|
87 |
model=self.model,
|
88 |
tokenizer=self.tokenizer,
|
89 |
+
device_map="auto",
|
90 |
+
torch_dtype=torch.float16,
|
91 |
max_new_tokens=512,
|
92 |
do_sample=True,
|
93 |
temperature=0.7,
|