RyuBcn committed on
Commit
e4de614
·
verified ·
1 Parent(s): de59269

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +0 -9
app.py CHANGED
@@ -2,15 +2,6 @@ from huggingface_hub import InferenceClient
2
  client = InferenceClient(
3
  "ecastera/eva-mistral-catmacaroni-7b-spanish"
4
  )
5
- quantization_config = BitsAndBytesConfig(
6
- load_in_4bit=True,
7
- load_in_8bit=False,
8
- llm_int8_threshold=6.0,
9
- llm_int8_has_fp16_weight=False,
10
- bnb_4bit_compute_dtype="float16",
11
- bnb_4bit_use_double_quant=True,
12
- bnb_4bit_quant_type="nf4")
13
-
14
  generate_kwargs = dict(
15
  temperature=0.1,
16
  max_new_tokens=256,
 
2
  client = InferenceClient(
3
  "ecastera/eva-mistral-catmacaroni-7b-spanish"
4
  )
 
 
 
 
 
 
 
 
 
5
  generate_kwargs = dict(
6
  temperature=0.1,
7
  max_new_tokens=256,