masanorihirano committed on
Commit
16ea29f
1 Parent(s): 91f4032

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +13 -0
README.md CHANGED
@@ -46,7 +46,20 @@ import torch
46
  from transformers import AutoTokenizer, AutoModelForCausalLM
47
 
48
  tokenizer = AutoTokenizer.from_pretrained("pfnet/nekomata-14b-pfn-qfin", trust_remote_code=True)
 
 
 
 
 
 
 
 
 
 
 
 
49
  model = AutoModelForCausalLM.from_pretrained("pfnet/nekomata-14b-pfn-qfin", device_map="auto", trust_remote_code=True)
 
50
  text = "日本銀行は"
51
  input_ids = tokenizer(text, return_tensors="pt").input_ids
52
  with torch.no_grad():
 
46
  from transformers import AutoTokenizer, AutoModelForCausalLM
47
 
48
  tokenizer = AutoTokenizer.from_pretrained("pfnet/nekomata-14b-pfn-qfin", trust_remote_code=True)
49
+
50
+
51
+ # Use GPU with bf16 (recommended for supported devices)
52
+ # model = AutoModelForCausalLM.from_pretrained("pfnet/nekomata-14b-pfn-qfin", device_map="auto", trust_remote_code=True, bf16=True)
53
+
54
+ # Use GPU with fp16
55
+ # model = AutoModelForCausalLM.from_pretrained("pfnet/nekomata-14b-pfn-qfin", device_map="auto", trust_remote_code=True, fp16=True)
56
+
57
+ # Use CPU
58
+ # model = AutoModelForCausalLM.from_pretrained("pfnet/nekomata-14b-pfn-qfin", device_map="cpu", trust_remote_code=True)
59
+
60
+ # Automatically select device and precision
61
  model = AutoModelForCausalLM.from_pretrained("pfnet/nekomata-14b-pfn-qfin", device_map="auto", trust_remote_code=True)
62
+
63
  text = "日本銀行は"
64
  input_ids = tokenizer(text, return_tensors="pt").input_ids
65
  with torch.no_grad():