devve1 committed on
Commit
90d7d9c
1 Parent(s): 0ec14a7

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -387,7 +387,7 @@ def load_models_and_documents():
387
  tensor_parallel_size=1,
388
  enforce_eager=True,
389
  gpu_memory_utilization=1,
390
- max_model_len=11264,
391
  dtype=torch.float16,
392
  max_num_seqs=128,
393
  quantization="gptq"
 
387
  tensor_parallel_size=1,
388
  enforce_eager=True,
389
  gpu_memory_utilization=1,
390
+ max_model_len=10240,
391
  dtype=torch.float16,
392
  max_num_seqs=128,
393
  quantization="gptq"