Spaces:
Running
on
T4
Running
on
T4
Update app.py
Browse files
app.py
CHANGED
@@ -5,6 +5,7 @@ import nltk
|
|
5 |
import copy
|
6 |
import time
|
7 |
import vllm
|
|
|
8 |
import spacy
|
9 |
import shutil
|
10 |
import msgpack
|
@@ -169,7 +170,7 @@ def load_models_and_documents():
|
|
169 |
quantization="bitsandbytes",
|
170 |
load_format="bitsandbytes",
|
171 |
gpu_memory_utilization=0.9,
|
172 |
-
dtype=
|
173 |
)
|
174 |
model = models.VLLM(llm)
|
175 |
|
|
|
5 |
import copy
|
6 |
import time
|
7 |
import vllm
|
8 |
+
import torch
|
9 |
import spacy
|
10 |
import shutil
|
11 |
import msgpack
|
|
|
170 |
quantization="bitsandbytes",
|
171 |
load_format="bitsandbytes",
|
172 |
gpu_memory_utilization=0.9,
|
173 |
+
dtype=torch.float16
|
174 |
)
|
175 |
model = models.VLLM(llm)
|
176 |
|