{ "data_path": "andyfangaf/kitsuna-dataset", "model": "google-bert/bert-base-uncased", "lr": 3e-05, "epochs": 3, "max_seq_length": 128, "batch_size": 8, "warmup_ratio": 0.1, "gradient_accumulation": 1, "optimizer": "adamw_torch", "scheduler": "linear", "weight_decay": 0.0, "max_grad_norm": 1.0, "seed": 42, "train_split": "train", "valid_split": null, "logging_steps": -1, "project_name": "autotrain-kitsuna-stpair", "auto_find_batch_size": false, "mixed_precision": "bf16", "save_total_limit": 1, "push_to_hub": true, "eval_strategy": "epoch", "username": "ThatOrJohn", "log": "tensorboard", "early_stopping_patience": 5, "early_stopping_threshold": 0.01, "trainer": "pair", "sentence1_column": "instruction", "sentence2_column": "output", "sentence3_column": "sentence3", "target_column": "target" }