Spaces:
Starting
on
T4
Starting
on
T4
Update app.py
Browse files
app.py
CHANGED
@@ -170,7 +170,7 @@ def load_models_and_documents():
170 |       quantization="bitsandbytes",
171 |       load_format="bitsandbytes",
172 |       gpu_memory_utilization=0.9,
173 | -     max_model_len=
174 |       dtype=torch.float16
175 |   )
176 |   model = models.VLLM(llm)
170 |       quantization="bitsandbytes",
171 |       load_format="bitsandbytes",
172 |       gpu_memory_utilization=0.9,
173 | +     max_model_len=12000,
174 |       dtype=torch.float16
175 |   )
176 |   model = models.VLLM(llm)