FlawedLLM committed
Commit acee492
1 Parent(s): 46b1d37

Update app.py

Files changed (1): app.py +8 -1
app.py CHANGED
@@ -10,7 +10,14 @@ from bitsandbytes.functional import quantize_blockwise
 
 tokenizer = AutoTokenizer.from_pretrained("FlawedLLM/Bhashini_gemma_merged4bit_clean_final")
 model = AutoModelForCausalLM.from_pretrained("FlawedLLM/Bhashini_gemma_merged4bit_clean_final")
-model= quantize_blockwise(model)
+def quantize_model(model):
+    # Iterate over the model's modules, not the entire model object
+    for name, module in model.named_modules():
+        if isinstance(module, torch.nn.Linear):  # Quantize only Linear layers
+            module = quantize_blockwise(module)
+
+# Quantize the model (modified)
+quantize_model(model)
 # alpaca_prompt = You MUST copy from above!
 @spaces.GPU(duration=300)
 def chunk_it(input_command, item_list):
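As committed, `quantize_model` still has two problems: `bitsandbytes.functional.quantize_blockwise` operates on tensors rather than `nn.Module` objects, and rebinding the loop variable `module` never modifies the model. The sketch below is a minimal illustration of the apparent intent, not the commit's code: it round-trips each Linear layer's weight through blockwise quantization (quantize, then dequantize back in place) and collects the per-layer quantization state. The round-trip step and the `quant_states` dict are assumptions added here.

import torch
from bitsandbytes.functional import quantize_blockwise, dequantize_blockwise

def quantize_model(model):
    """Round-trip every Linear layer's weights through blockwise quantization."""
    quant_states = {}
    for name, module in model.named_modules():
        if isinstance(module, torch.nn.Linear):  # quantize only Linear layers
            orig_dtype = module.weight.dtype
            # quantize_blockwise takes a tensor and returns the quantized
            # payload plus the state (absmax, codebook) needed to reconstruct it
            q_weight, quant_state = quantize_blockwise(module.weight.data.float())
            # write the reconstructed values back onto the parameter so the
            # change actually lands on the model (rebinding `module` would not)
            module.weight.data = dequantize_blockwise(q_weight, quant_state).to(orig_dtype)
            quant_states[name] = quant_state
    return quant_states

quant_states = quantize_model(model)

Note that this round-trip only simulates quantization error and does not reduce memory; for an actual memory saving, the usual route with transformers is to pass quantization_config=BitsAndBytesConfig(load_in_4bit=True) to from_pretrained instead of quantizing after loading.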