YingL19 committed on
Commit
29eb4e7
·
verified ·
1 Parent(s): a6daa92

Update handler.py

Browse files
Files changed (1) hide show
  1. handler.py +2 -2
handler.py CHANGED
@@ -34,7 +34,7 @@ class EndpointHandler():
34
  DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
35
  model_name = "moka-ai/m3e-base"
36
  self.config = PeftConfig.from_pretrained("YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
37
- self.base_model = AutoModelForCausalLM.from_pretrained("google/gemma-7b")
38
  self.newmodel = PeftModel.from_pretrained(self.base_model, "YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
39
  self.tokenizer = AutoTokenizer.from_pretrained("YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
40
 
@@ -68,7 +68,7 @@ ASSISTANT:'''
68
  template=self.prompt_template,
69
  )
70
 
71
- embeddings = HuggingFaceEmbeddings(model_name=model_name)
72
  embeddings.client = SentenceTransformer(model_name, device=DEVICE)
73
  ragdb = Chroma(persist_directory="/Lincoln_DB", embedding_function=embeddings)
74
 
 
34
  DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
35
  model_name = "moka-ai/m3e-base"
36
  self.config = PeftConfig.from_pretrained("YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
37
+ self.base_model = AutoModelForCausalLM.from_pretrained("google/gemma-7b",device_map=DEVICE)
38
  self.newmodel = PeftModel.from_pretrained(self.base_model, "YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
39
  self.tokenizer = AutoTokenizer.from_pretrained("YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
40
 
 
68
  template=self.prompt_template,
69
  )
70
 
71
+ embeddings = HuggingFaceEmbeddings(model_name=model_name,model_kwargs={'device':DEVICE})
72
  embeddings.client = SentenceTransformer(model_name, device=DEVICE)
73
  ragdb = Chroma(persist_directory="/Lincoln_DB", embedding_function=embeddings)
74