rphrp1985 committed on
Commit
596a439
·
verified ·
1 Parent(s): ee7bd8e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -6
app.py CHANGED
@@ -26,12 +26,12 @@ model_id = "CohereForAI/c4ai-command-r-plus-4bit"
26
 
27
  tokenizer = AutoTokenizer.from_pretrained(model_id, token= token)
28
 
29
- model = AutoModelForCausalLM.from_pretrained(model_id, token= token, torch_dtype=torch.bfloat16,
30
- # attn_implementation="flash_attention_2",
31
- # low_cpu_mem_usage=True,
32
- llm_int8_enable_fp32_cpu_offload=True,
33
- device_map="auto"
34
- )
35
 
36
 
37
 
 
26
 
27
  tokenizer = AutoTokenizer.from_pretrained(model_id, token= token)
28
 
29
+ # model = AutoModelForCausalLM.from_pretrained(model_id, token= token, torch_dtype=torch.bfloat16,
30
+ # # attn_implementation="flash_attention_2",
31
+ # # low_cpu_mem_usage=True,
32
+ # llm_int8_enable_fp32_cpu_offload=True,
33
+ # device_map="auto"
34
+ # )
35
 
36
 
37