devve1 committed on
Commit
0d58e6f
1 Parent(s): cdc46be

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -170,7 +170,7 @@ def load_models_and_documents():
170
  quantization="bitsandbytes",
171
  load_format="bitsandbytes",
172
  gpu_memory_utilization=0.9,
173
- max_model_len=12288,
174
  dtype=torch.float16
175
  )
176
  model = models.VLLM(llm)
 
170
  quantization="bitsandbytes",
171
  load_format="bitsandbytes",
172
  gpu_memory_utilization=0.9,
173
+ max_model_len=12000,
174
  dtype=torch.float16
175
  )
176
  model = models.VLLM(llm)