Spaces:
Running
on
Zero
Running
on
Zero
Update app.py (#3)
Browse files
- Update app.py (aa9bc96a6e6f5e3e3e5433725adc85b9721023d4)
app.py
CHANGED
@@ -8,14 +8,11 @@ import torch
|
|
8 |
from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
|
9 |
|
10 |
DESCRIPTION = """\
|
11 |
-
#
|
12 |
|
13 |
-
|
14 |
-
|
15 |
-
|
16 |
-
For more details, please check [our post](https://huggingface.co/blog/gemma2).
|
17 |
-
|
18 |
-
👉 Looking for a larger and more powerful version? Try the 27B version in [HuggingChat](https://huggingface.co/chat/models/google/gemma-2-27b-it) and the 9B version in [this Space](https://huggingface.co/spaces/huggingface-projects/gemma-2-9b-it).
|
19 |
"""
|
20 |
|
21 |
MAX_MAX_NEW_TOKENS = 2048
|
|
|
8 |
from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
|
9 |
|
10 |
DESCRIPTION = """\
|
11 |
+
# Llama 3.2 3B Instruct
|
12 |
|
13 |
+
Llama 3.2 3B is Meta's latest iteration of open LLMs.
|
14 |
+
This is a demo of [`meta-llama/Llama-3.2-3B-Instruct`](https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct), fine-tuned for instruction following.
|
15 |
+
For more details, please check [our post](https://huggingface.co/blog/llama32).
|
|
|
|
|
|
|
16 |
"""
|
17 |
|
18 |
MAX_MAX_NEW_TOKENS = 2048
|