Spaces:
Running
Running
Zachary Siegel
committed on
Commit
·
ffe8812
1
Parent(s):
1453401
update verified agents
Browse files
- verified_agents.yaml +12 -12
verified_agents.yaml
CHANGED
@@ -5,33 +5,33 @@
|
|
5 |
# verification_date: YYYY-MM-DD
|
6 |
|
7 |
corebench_easy:
|
8 |
-
- agent_name: "AutoGPT (
|
9 |
verification_date: 2024-11-26
|
10 |
-
- agent_name: "AutoGPT (
|
11 |
verification_date: 2024-11-26
|
12 |
-
- agent_name: "CORE-Agent (
|
13 |
verification_date: 2024-11-26
|
14 |
-
- agent_name: "CORE-Agent (
|
15 |
verification_date: 2024-11-26
|
16 |
|
17 |
corebench_medium:
|
18 |
-
- agent_name: "AutoGPT (
|
19 |
verification_date: 2024-11-26
|
20 |
-
- agent_name: "AutoGPT (
|
21 |
verification_date: 2024-11-26
|
22 |
-
- agent_name: "CORE-Agent (
|
23 |
verification_date: 2024-11-26
|
24 |
-
- agent_name: "CORE-Agent (
|
25 |
verification_date: 2024-11-26
|
26 |
|
27 |
corebench_hard:
|
28 |
-
- agent_name: "AutoGPT (
|
29 |
verification_date: 2024-11-26
|
30 |
-
- agent_name: "AutoGPT (
|
31 |
verification_date: 2024-11-26
|
32 |
-
- agent_name: "CORE-Agent (
|
33 |
verification_date: 2024-11-26
|
34 |
-
- agent_name: "CORE-Agent (
|
35 |
verification_date: 2024-11-26
|
36 |
- agent_name: "CORE-Agent (claude-3.5-sonnet)"
|
37 |
verification_date: 2024-11-16
|
|
|
5 |
# verification_date: YYYY-MM-DD
|
6 |
|
7 |
corebench_easy:
|
8 |
+
- agent_name: "AutoGPT (gpt-4o)"
|
9 |
verification_date: 2024-11-26
|
10 |
+
- agent_name: "AutoGPT (gpt-4o-mini)"
|
11 |
verification_date: 2024-11-26
|
12 |
+
- agent_name: "CORE-Agent (gpt-4o)"
|
13 |
verification_date: 2024-11-26
|
14 |
+
- agent_name: "CORE-Agent (gpt-4o-mini)"
|
15 |
verification_date: 2024-11-26
|
16 |
|
17 |
corebench_medium:
|
18 |
+
- agent_name: "AutoGPT (gpt-4o)"
|
19 |
verification_date: 2024-11-26
|
20 |
+
- agent_name: "AutoGPT (gpt-4o-mini)"
|
21 |
verification_date: 2024-11-26
|
22 |
+
- agent_name: "CORE-Agent (gpt-4o)"
|
23 |
verification_date: 2024-11-26
|
24 |
+
- agent_name: "CORE-Agent (gpt-4o-mini)"
|
25 |
verification_date: 2024-11-26
|
26 |
|
27 |
corebench_hard:
|
28 |
+
- agent_name: "AutoGPT (gpt-4o)"
|
29 |
verification_date: 2024-11-26
|
30 |
+
- agent_name: "AutoGPT (gpt-4o-mini)"
|
31 |
verification_date: 2024-11-26
|
32 |
+
- agent_name: "CORE-Agent (gpt-4o)"
|
33 |
verification_date: 2024-11-26
|
34 |
+
- agent_name: "CORE-Agent (gpt-4o-mini)"
|
35 |
verification_date: 2024-11-26
|
36 |
- agent_name: "CORE-Agent (claude-3.5-sonnet)"
|
37 |
verification_date: 2024-11-16
|