devve1 committed on
Commit
c825289
1 Parent(s): 2e65f49

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -244,7 +244,7 @@ def load_models_and_documents():
244
  tensor_parallel_size=1,
245
  enforce_eager=True,
246
  gpu_memory_utilization=1,
247
- max_model_len=10240,
248
  dtype=torch.float16,
249
  max_num_seqs=64,
250
  quantization="gptq"
 
244
  tensor_parallel_size=1,
245
  enforce_eager=True,
246
  gpu_memory_utilization=1,
247
+ max_model_len=8192,
248
  dtype=torch.float16,
249
  max_num_seqs=64,
250
  quantization="gptq"