MichaelAI23
/

falcon-rw-1b_8bit_finetuned

Inference Endpoints

Model card Files Files and versions Community

Michael Brunzel committed on Sep 12, 2023

Commit

a1f7ec0

•

1 Parent(s): b4a7bbc

Update model path

Files changed (1) hide show

handler.py +2 -2

handler.py CHANGED Viewed

@@ -8,14 +8,14 @@ class EndpointHandler:
     def __init__(self, path=""):
         # load model and processor from path
         self.model =  AutoModelForCausalLM.from_pretrained(
-            path, device_map="auto", load_in_8bit=True)
         self.model = PeftModel.from_pretrained(
             self.model,
             "MichaelAI23/falcon-rw-1b_8bit_finetuned",
             torch_dtype=torch.float16,
             device_map="auto"
         )
-        self.tokenizer = AutoTokenizer.from_pretrained(path)
         self.template = {
             "prompt_input": "Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request.\n\n### Instruction:\n{instruction}\n\n### Input:\n{input}\n\n### Response:\n",
             "prompt_no_input": "Below is an instruction that describes a task. Write a response that appropriately completes the request.\n\n### Instruction:\n{instruction}\n\n### Response:\n",

     def __init__(self, path=""):
         # load model and processor from path
         self.model =  AutoModelForCausalLM.from_pretrained(
+            "tiiuae/falcon-rw-1b", device_map="auto", load_in_8bit=True)
         self.model = PeftModel.from_pretrained(
             self.model,
             "MichaelAI23/falcon-rw-1b_8bit_finetuned",
             torch_dtype=torch.float16,
             device_map="auto"
         )
+        self.tokenizer = AutoTokenizer.from_pretrained("tiiuae/falcon-rw-1b")
         self.template = {
             "prompt_input": "Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request.\n\n### Instruction:\n{instruction}\n\n### Input:\n{input}\n\n### Response:\n",
             "prompt_no_input": "Below is an instruction that describes a task. Write a response that appropriately completes the request.\n\n### Instruction:\n{instruction}\n\n### Response:\n",