Update app.py: comment out load_format='npcache' in load_models_and_documents()
Browse files
app.py
CHANGED
@@ -156,8 +156,8 @@ def load_models_and_documents():
|
|
156 |
trust_remote_code=True,
|
157 |
enforce_eager=True,
|
158 |
quantization='gptq',
|
159 |
-
gpu_memory_utilization=0.5
|
160 |
-
load_format='npcache'
|
161 |
)
|
162 |
model = models.VLLM(llm)
|
163 |
|
|
|
156 |
trust_remote_code=True,
|
157 |
enforce_eager=True,
|
158 |
quantization='gptq',
|
159 |
+
gpu_memory_utilization=0.5
|
160 |
+
#load_format='npcache'
|
161 |
)
|
162 |
model = models.VLLM(llm)
|
163 |
|