llm-jp
/

NU-8x152M

Safetensors

mixtral

Model card Files and versions Community

Taishi-N324 committed on Dec 2, 2024

Commit

5ebac3e

verified ·

1 Parent(s): 001a0c0

Upload aggregated_result.json

Browse files

Files changed (1) hide show

aggregated_result.json +122 -0

aggregated_result.json ADDED Viewed

	@@ -0,0 +1,122 @@

+{
+  "model": "/gs/bs/tgh-NII-LLM/fp32_to_hf/upcycle-Mixtral-8x152M-torch_rand_002_iter_0477000_main_zero3/lr_2e-4-minlr_2e-5_warmup_2000_seq_4096/iter_0238419",
+  "result": {
+    "XLSUM_ja_1shot": -1.0,
+    "MATH (mgsm_ja)": -1.0,
+    "wmt20_en_ja_bleu": -1.0,
+    "wmt20_ja_en_bleu": -1.0,
+    "MC": -1.0,
+    "NLI": -1.0,
+    "QA": -1.0,
+    "RC": -1.0,
+    "jamp (NLI)": -1.0,
+    "janli (NLI)": -1.0,
+    "jcommonsenseqa": -1.0,
+    "jemhopqa": -1.0,
+    "jnli": -1.0,
+    "jsem": -1.0,
+    "jsick (NLI)": -1.0,
+    "jsquad": -1.0,
+    "jsts_pearson": -1.0,
+    "jsts_spearman": -1.0,
+    "niilc": -1.0,
+    "jmmlu": -1.0,
+    "jmmlu_social_sciences": -1.0,
+    "jmmlu_humanities": -1.0,
+    "jmmlu_stem": -1.0,
+    "jmmlu_other": -1.0,
+    "jhumaneval@1": -1.0,
+    "jhumaneval@10": -1.0,
+    "jhumaneval_answer@10": -1.0,
+    "MT-Bench (ALL)": -1.0,
+    "writing": -1.0,
+    "roleplay": -1.0,
+    "reasoning": -1.0,
+    "math": -1.0,
+    "coding": -1.0,
+    "extraction": -1.0,
+    "stem": -1.0,
+    "humanities": -1.0,
+    "gsm8k": -1.0,
+    "squad2": -1.0,
+    "triviaqa": -1.0,
+    "hellaswag": -1.0,
+    "openbookqa": -1.0,
+    "xwinograd_en": -1.0,
+    "bbh_cot": -1.0,
+    "mmlu": -1.0,
+    "mmlu_social_sciences": -1.0,
+    "mmlu_humanities": -1.0,
+    "mmlu_stem": -1.0,
+    "mmlu_other": -1.0,
+    "humaneval@1": -1.0,
+    "humaneval@10": -1.0,
+    "humaneval_answer@10": -1.0,
+    "jhumaneval-unstripped@1": -1.0,
+    "jhumaneval-unstripped@10": -1.0,
+    "jhumaneval-unstripped_answer@10": -1.0,
+    "humaneval-unstripped@1": -1.0,
+    "humaneval-unstripped@10": -1.0,
+    "humaneval-unstripped_answer@10": -1.0
+  },
+  "overall": "-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0",
+  "tasks": [
+    "XLSUM_ja_1shot",
+    "MATH (mgsm_ja)",
+    "wmt20_en_ja_bleu",
+    "wmt20_ja_en_bleu",
+    "MC",
+    "NLI",
+    "QA",
+    "RC",
+    "jamp (NLI)",
+    "janli (NLI)",
+    "jcommonsenseqa",
+    "jemhopqa",
+    "jnli",
+    "jsem",
+    "jsick (NLI)",
+    "jsquad",
+    "jsts_pearson",
+    "jsts_spearman",
+    "niilc",
+    "jmmlu",
+    "jmmlu_social_sciences",
+    "jmmlu_humanities",
+    "jmmlu_stem",
+    "jmmlu_other",
+    "jhumaneval@1",
+    "jhumaneval@10",
+    "jhumaneval_answer@10",
+    "MT-Bench (ALL)",
+    "writing",
+    "roleplay",
+    "reasoning",
+    "math",
+    "coding",
+    "extraction",
+    "stem",
+    "humanities",
+    "gsm8k",
+    "squad2",
+    "triviaqa",
+    "hellaswag",
+    "openbookqa",
+    "xwinograd_en",
+    "bbh_cot",
+    "mmlu",
+    "mmlu_social_sciences",
+    "mmlu_humanities",
+    "mmlu_stem",
+    "mmlu_other",
+    "humaneval@1",
+    "humaneval@10",
+    "humaneval_answer@10",
+    "jhumaneval-unstripped@1",
+    "jhumaneval-unstripped@10",
+    "jhumaneval-unstripped_answer@10",
+    "humaneval-unstripped@1",
+    "humaneval-unstripped@10",
+    "humaneval-unstripped_answer@10"
+  ]
+}