FlawedLLM committed
Commit 9d7277a
1 Parent(s): dcde33a

Update app.py

Files changed (1): app.py +6 -6
app.py CHANGED
@@ -7,11 +7,11 @@ from peft import PeftModel, PeftConfig
 
 
 tokenizer = AutoTokenizer.from_pretrained("FlawedLLM/BhashiniLLM")
-# quantization_config = BitsAndBytesConfig(
-#     load_in_4bit=True,
-#     bnb_4bit_use_double_quant=True,
-#     bnb_4bit_quant_type="nf4",
-#     bnb_4bit_compute_dtype=torch.float16)
+quantization_config = BitsAndBytesConfig(
+    load_in_4bit=True,
+    bnb_4bit_use_double_quant=True,
+    bnb_4bit_quant_type="nf4",
+    bnb_4bit_compute_dtype=torch.float16)
 # model = AutoModelForCausalLM.from_pretrained("FlawedLLM/BhashiniLLM",
 #                                              device_map="auto",
 #                                              quantization_config=quantization_config,
@@ -35,7 +35,7 @@ tokenizer = AutoTokenizer.from_pretrained("FlawedLLM/BhashiniLLM")
 
 
 config = PeftConfig.from_pretrained("FlawedLLM/BhashiniLLM")
-base_model = AutoModelForCausalLM.from_pretrained("unsloth/llama-3-8b-bnb-4bit", device_map='auto')
+base_model = AutoModelForCausalLM.from_pretrained("unsloth/llama-3-8b-bnb-4bit", device_map='auto', quantization_config=quantization_config)
 model = PeftModel.from_pretrained(base_model, "FlawedLLM/BhashiniLLM")
 
 
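For context, a minimal sketch of what the model-loading path in app.py looks like after this commit, with the imports the snippet needs. The repo IDs and BitsAndBytesConfig parameters come straight from the diff; the surrounding structure is an assumption about the rest of the file, not a copy of it.

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig
from peft import PeftModel, PeftConfig

tokenizer = AutoTokenizer.from_pretrained("FlawedLLM/BhashiniLLM")

# 4-bit NF4 quantization with double quantization; computation runs in fp16.
quantization_config = BitsAndBytesConfig(
    load_in_4bit=True,
    bnb_4bit_use_double_quant=True,
    bnb_4bit_quant_type="nf4",
    bnb_4bit_compute_dtype=torch.float16,
)

# Load the quantized base model, then attach the LoRA adapter on top of it.
config = PeftConfig.from_pretrained("FlawedLLM/BhashiniLLM")
base_model = AutoModelForCausalLM.from_pretrained(
    "unsloth/llama-3-8b-bnb-4bit",
    device_map="auto",
    quantization_config=quantization_config,
)
model = PeftModel.from_pretrained(base_model, "FlawedLLM/BhashiniLLM")

One caveat: unsloth/llama-3-8b-bnb-4bit is already a pre-quantized bitsandbytes checkpoint, so passing an explicit quantization_config here mainly pins the quant type and compute dtype; depending on the transformers version it may be redundant or produce a warning.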