zerogpu-2

Running on Zero

rphrp1985 committed on Jun 9, 2024

Commit

596a439

verified ·

1 Parent(s): ee7bd8e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -26,12 +26,12 @@ model_id = "CohereForAI/c4ai-command-r-plus-4bit"
 tokenizer = AutoTokenizer.from_pretrained(model_id, token= token)
-model = AutoModelForCausalLM.from_pretrained(model_id, token= token, torch_dtype=torch.bfloat16,
-                                             # attn_implementation="flash_attention_2",
-                                             # low_cpu_mem_usage=True,
-                                             llm_int8_enable_fp32_cpu_offload=True,
-                                             device_map="auto"
-                                            )

 tokenizer = AutoTokenizer.from_pretrained(model_id, token= token)
+# model = AutoModelForCausalLM.from_pretrained(model_id, token= token, torch_dtype=torch.bfloat16,
+#                                              # attn_implementation="flash_attention_2",
+#                                              # low_cpu_mem_usage=True,
+#                                              llm_int8_enable_fp32_cpu_offload=True,
+#                                              device_map="auto"
+#                                             )