Update app.py
Browse files
app.py
CHANGED
@@ -2,15 +2,6 @@ from huggingface_hub import InferenceClient
|
|
2 |
client = InferenceClient(
|
3 |
"ecastera/eva-mistral-catmacaroni-7b-spanish"
|
4 |
)
|
5 |
-
quantization_config = BitsAndBytesConfig(
|
6 |
-
load_in_4bit=True,
|
7 |
-
load_in_8bit=False,
|
8 |
-
llm_int8_threshold=6.0,
|
9 |
-
llm_int8_has_fp16_weight=False,
|
10 |
-
bnb_4bit_compute_dtype="float16",
|
11 |
-
bnb_4bit_use_double_quant=True,
|
12 |
-
bnb_4bit_quant_type="nf4")
|
13 |
-
|
14 |
generate_kwargs = dict(
|
15 |
temperature=0.1,
|
16 |
max_new_tokens=256,
|
|
|
2 |
client = InferenceClient(
|
3 |
"ecastera/eva-mistral-catmacaroni-7b-spanish"
|
4 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5 |
generate_kwargs = dict(
|
6 |
temperature=0.1,
|
7 |
max_new_tokens=256,
|