devve1 committed on
Commit
eb42954
1 Parent(s): ced9420

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -185,7 +185,7 @@ def load_models_and_documents():
185
  enforce_eager=True,
186
  quantization="awq",
187
  gpu_memory_utilization=1,
188
- max_model_len=14000,
189
  dtype=torch.float16
190
  )
191
  model = models.VLLM(llm)
 
185
  enforce_eager=True,
186
  quantization="awq",
187
  gpu_memory_utilization=1,
188
+ max_model_len=12288,
189
  dtype=torch.float16
190
  )
191
  model = models.VLLM(llm)