devve1 committed on
Commit
815b38b
1 Parent(s): 96f3438

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -5,6 +5,7 @@ import nltk
5
  import copy
6
  import time
7
  import vllm
 
8
  import spacy
9
  import shutil
10
  import msgpack
@@ -169,7 +170,7 @@ def load_models_and_documents():
169
  quantization="bitsandbytes",
170
  load_format="bitsandbytes",
171
  gpu_memory_utilization=0.9,
172
- dtype='float16'
173
  )
174
  model = models.VLLM(llm)
175
 
 
5
  import copy
6
  import time
7
  import vllm
8
+ import torch
9
  import spacy
10
  import shutil
11
  import msgpack
 
170
  quantization="bitsandbytes",
171
  load_format="bitsandbytes",
172
  gpu_memory_utilization=0.9,
173
+ dtype=torch.float16
174
  )
175
  model = models.VLLM(llm)
176