File size: 507 Bytes
f5ab4cb
 
 
 
 
e1cb58c
32d8669
 
f5ab4cb
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
# pip install synthetic-dataset-generator
import os

from synthetic_dataset_generator import launch

# Configure the generator through environment variables, then start it.
# All values written to os.environ must be strings.
os.environ["HF_TOKEN"] = "hf_..."  # placeholder: token used to push the data to huggingface
os.environ["HUGGINGFACE_BASE_URL"] = "http://127.0.0.1:3000/"  # dedicated endpoint/TGI
os.environ["MAGPIE_PRE_QUERY_TEMPLATE"] = "llama3"  # magpie template
os.environ["TOKENIZER_ID"] = (
    "meta-llama/Llama-3.1-8B-Instruct"  # tokenizer for model hosted on endpoint
)
# The model is linked to the endpoint, so no MODEL value is supplied.
# Assigning None to os.environ raises TypeError (only str is accepted), so the
# variable is removed instead; pop() with a default is a no-op when it is absent.
# NOTE(review): presumably the library treats an unset MODEL as "use the
# endpoint's model" - confirm against the package's configuration docs.
os.environ.pop("MODEL", None)

launch()