Update app.py
Browse files
app.py
CHANGED
@@ -185,7 +185,7 @@ def load_models_and_documents():
185   enforce_eager=True,
186   quantization="awq",
187   gpu_memory_utilization=1,
188 - max_model_len=
189   dtype=torch.float16
190   )
191   model = models.VLLM(llm)
185   enforce_eager=True,
186   quantization="awq",
187   gpu_memory_utilization=1,
188 + max_model_len=12288,
189   dtype=torch.float16
190   )
191   model = models.VLLM(llm)