Update app.py
Browse files
app.py
CHANGED
@@ -244,7 +244,7 @@ def load_models_and_documents():
|
|
244 |
tensor_parallel_size=1,
|
245 |
enforce_eager=True,
|
246 |
gpu_memory_utilization=1,
|
247 |
-
max_model_len=
|
248 |
dtype=torch.float16,
|
249 |
max_num_seqs=64,
|
250 |
quantization="gptq"
|
|
|
244 |
tensor_parallel_size=1,
|
245 |
enforce_eager=True,
|
246 |
gpu_memory_utilization=1,
|
247 |
+
max_model_len=8192,
|
248 |
dtype=torch.float16,
|
249 |
max_num_seqs=64,
|
250 |
quantization="gptq"
|