Update handler.py
Browse files
- handler.py +2 -2
handler.py
CHANGED
@@ -34,7 +34,7 @@ class EndpointHandler():
|
|
34 |
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
|
35 |
model_name = "moka-ai/m3e-base"
|
36 |
self.config = PeftConfig.from_pretrained("YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
|
37 |
-
self.base_model = AutoModelForCausalLM.from_pretrained("google/gemma-7b")
|
38 |
self.newmodel = PeftModel.from_pretrained(self.base_model, "YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
|
39 |
self.tokenizer = AutoTokenizer.from_pretrained("YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
|
40 |
|
@@ -68,7 +68,7 @@ ASSISTANT:'''
|
|
68 |
template=self.prompt_template,
|
69 |
)
|
70 |
|
71 |
-
embeddings = HuggingFaceEmbeddings(model_name=model_name)
|
72 |
embeddings.client = SentenceTransformer(model_name, device=DEVICE)
|
73 |
ragdb = Chroma(persist_directory="/Lincoln_DB", embedding_function=embeddings)
|
74 |
|
|
|
34 |
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
|
35 |
model_name = "moka-ai/m3e-base"
|
36 |
self.config = PeftConfig.from_pretrained("YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
|
37 |
+
self.base_model = AutoModelForCausalLM.from_pretrained("google/gemma-7b",device_map=DEVICE)
|
38 |
self.newmodel = PeftModel.from_pretrained(self.base_model, "YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
|
39 |
self.tokenizer = AutoTokenizer.from_pretrained("YingL19/gemma_10epoch_1e5_lincoln1",device_map=DEVICE)
|
40 |
|
|
|
68 |
template=self.prompt_template,
|
69 |
)
|
70 |
|
71 |
+
embeddings = HuggingFaceEmbeddings(model_name=model_name,model_kwargs={'device':DEVICE})
|
72 |
embeddings.client = SentenceTransformer(model_name, device=DEVICE)
|
73 |
ragdb = Chroma(persist_directory="/Lincoln_DB", embedding_function=embeddings)
|
74 |
|