Spaces:
Paused
Paused
Update utils.py
Browse files
utils.py
CHANGED
@@ -82,6 +82,20 @@ def load_tokenizer_and_model(base_model, load_8bit=False):
|
|
82 |
return tokenizer,model, device
|
83 |
|
84 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
85 |
def load_model(base_model, load_8bit=False):
|
86 |
if torch.cuda.is_available():
|
87 |
device = "cuda"
|
|
|
82 |
return tokenizer,model, device
|
83 |
|
84 |
|
85 |
+
def load_tokenizer_and_model_Blaize(base_model, load_8bit=True):
    """Load a LLaMA tokenizer and causal-LM model from ``base_model``.

    Args:
        base_model: Model identifier or path passed unchanged to both
            ``LlamaTokenizer.from_pretrained`` and
            ``LlamaForCausalLM.from_pretrained``.
        load_8bit: Whether to load the model weights in 8-bit. Defaults to
            ``True``.

    Returns:
        A ``(tokenizer, model, device)`` tuple. ``device`` is ``"cuda"`` when
        ``torch.cuda.is_available()`` is true and ``"cpu"`` otherwise.
    """
    # ``device`` is only reported back to the caller; actual weight placement
    # is decided by ``device_map="auto"`` below.
    device = "cuda" if torch.cuda.is_available() else "cpu"

    tokenizer = LlamaTokenizer.from_pretrained(
        base_model, add_eos_token=True, use_auth_token=True
    )
    # Honor the caller's ``load_8bit`` flag. It used to be accepted but
    # ignored because ``load_in_8bit=True`` was hard-coded here.
    model = LlamaForCausalLM.from_pretrained(
        base_model, load_in_8bit=load_8bit, device_map="auto"
    )
    # No explicit ``model.eval()``: per the Transformers documentation,
    # ``from_pretrained`` already returns the model in evaluation mode.
    return tokenizer, model, device
|
96 |
+
|
97 |
+
|
98 |
+
|
99 |
def load_model(base_model, load_8bit=False):
|
100 |
if torch.cuda.is_available():
|
101 |
device = "cuda"
|