# /// script
# requires-python = ">=3.11,<3.12"
# dependencies = [
#     "synthetic-dataset-generator",
# ]
# ///
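# The block above is PEP 723 inline script metadata; a runner such as `uv run`
# can read it to pin the Python version and install the dependency automatically.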
import os

from synthetic_dataset_generator import launch

os.environ["HF_TOKEN"] = "hf_..."  # token used to push the generated dataset to the Hugging Face Hub
os.environ["HUGGINGFACE_BASE_URL"] = "http://127.0.0.1:3000/"  # base URL of the dedicated endpoint / TGI server
os.environ["MAGPIE_PRE_QUERY_TEMPLATE"] = "llama3"  # Magpie pre-query template for the served model family
os.environ["TOKENIZER_ID"] = (
    "meta-llama/Llama-3.1-8B-Instruct"  # tokenizer matching the model hosted on the endpoint
)
os.environ["MODEL"] = None # model is linked to endpoint | |
launch()