devve1 committed on
Commit
280dfd9
1 Parent(s): ef856ff

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -156,8 +156,8 @@ def load_models_and_documents():
156
  trust_remote_code=True,
157
  enforce_eager=True,
158
  quantization='gptq',
159
- gpu_memory_utilization=0.5,
160
- load_format='npcache'
161
  )
162
  model = models.VLLM(llm)
163
 
 
156
  trust_remote_code=True,
157
  enforce_eager=True,
158
  quantization='gptq',
159
+ gpu_memory_utilization=0.5
160
+ #load_format='npcache'
161
  )
162
  model = models.VLLM(llm)
163