File size: 683 Bytes
68d064d
 
 
 
 
 
f5ab4cb
2ad72e3
f5ab4cb
 
 
 
9b64ead
32d8669
e1cb58c
 
 
2841b26
e1cb58c
2841b26
f5ab4cb
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
# /// script
# requires-python = ">=3.11,<3.12"
# dependencies = [
#     "synthetic-dataset-generator",
# ]
# ///
# Prerequisites - shell commands to start Ollama and run the model first:
#   ollama serve
#   ollama run qwen2.5:32b-instruct-q5_K_S
import os

from synthetic_dataset_generator import launch

# Configure the generator through environment variables, then start it.
# Every value is a string because it is written into os.environ.
os.environ.update(
    {
        "HF_TOKEN": "hf_...",  # placeholder token; used to push the data to huggingface
        "OLLAMA_BASE_URL": "http://127.0.0.1:11434/",  # ollama base url
        "MODEL": "qwen2.5:32b-instruct-q5_K_S",  # model id
        "TOKENIZER_ID": "Qwen/Qwen2.5-32B-Instruct",  # tokenizer id
        "MAGPIE_PRE_QUERY_TEMPLATE": "qwen2",
        "MAX_NUM_ROWS": "10000",
        "DEFAULT_BATCH_SIZE": "2",
        "MAX_NUM_TOKENS": "1024",
    }
)

# Launch only after all of the variables above have been set.
launch()