nguyenzzz |
1 |
1 |
1216.48 |
1219.12 |
0.73 |
5314.0 |
meseca-15062024-c1_v3 |
8B |
meseca/15062024-c1 |
meseca-15062024-c1_v3 |
10944 |
33263 |
0.56 |
0.56 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
8 |
1024 |
64 |
LlamaForCausalLM |
meseca/15062024-c1 |
2024-07-01 |
1.11 |
0.75 |
1 |
1 |
2 |
8 |
nguyenzzz |
2 |
1 |
1219.12 |
1219.12 |
0.70 |
5185.0 |
meseca-15062024-c1_v1 |
8B |
meseca/15062024-c1 |
v2-l3-70b-euryale-test-beta-1 |
10829 |
33263 |
0.56 |
0.56 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/15062024-c1 |
2024-06-15 |
1.21 |
0.13 |
3 |
1 |
1 |
16 |
nguyenzzz |
3 |
3 |
1214.52 |
1214.52 |
0.71 |
9649.0 |
meseca-20062024-c1_v1 |
8B |
meseca/20062024-c1 |
meseca-20062024-c1_v1 |
19727 |
19727 |
0.56 |
0.56 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/20062024-c1 |
2024-06-27 |
1.04 |
0.42 |
2 |
2 |
3 |
10 |
nguyenzzz |
4 |
1 |
1207.83 |
1219.12 |
0.71 |
5729.0 |
meseca-15062024-c1_v2 |
8B |
meseca/15062024-c1 |
meseca-15062024-c1_v2 |
11490 |
33263 |
0.55 |
0.56 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/15062024-c1 |
2024-07-01 |
0.80 |
0.30 |
4 |
1 |
8 |
12 |
nguyenzzz |
5 |
5 |
1212.29 |
1212.29 |
0.68 |
8808.0 |
meseca-07062024-m1_v2 |
8B |
meseca/07062024-m1 |
meseca-caspian-11_v1 |
18289 |
48889 |
0.56 |
0.56 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/07062024-m1 |
2024-06-15 |
0.96 |
-0.44 |
5 |
5 |
4 |
22 |
nguyenzzz |
6 |
6 |
1197.59 |
1197.59 |
0.70 |
5343.0 |
meseca-02072024-v1_v2 |
8B |
meseca/02072024-v1 |
meseca-02072024-v1_v2 |
11025 |
23773 |
0.52 |
0.52 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/02072024-v1 |
2024-07-02 |
0.44 |
0.12 |
7 |
7 |
15 |
17 |
nguyenzzz |
7 |
7 |
1211.05 |
1211.05 |
0.66 |
1447.0 |
meseca-caspian-0_v1 |
8B |
meseca/caspian-0 |
experiment-2-high-temp-test |
67680 |
77302 |
0.54 |
0.54 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/caspian-0 |
2024-06-03 |
0.92 |
-0.83 |
12 |
12 |
5 |
29 |
nguyenzzz |
8 |
6 |
1195.57 |
1197.59 |
0.71 |
6059.0 |
meseca-02072024-v1_v1 |
8B |
meseca/02072024-v1 |
meseca-02072024-v1_v1 |
12748 |
23773 |
0.52 |
0.52 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
8 |
1024 |
64 |
LlamaForCausalLM |
meseca/02072024-v1 |
2024-07-02 |
0.37 |
0.20 |
8 |
7 |
17 |
15 |
nguyenzzz |
9 |
5 |
1208.81 |
1212.29 |
0.67 |
8664.0 |
meseca-07062024-m1_v3 |
8B |
meseca/07062024-m1 |
07062024-m1-sft |
18336 |
48889 |
0.54 |
0.56 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/07062024-m1 |
2024-06-17 |
0.84 |
-0.74 |
9 |
5 |
6 |
27 |
nguyenzzz |
10 |
7 |
1208.02 |
1211.05 |
0.66 |
770.0 |
meseca-caspian-0_v2 |
8B |
meseca/caspian-0 |
kkk |
9622 |
77302 |
0.54 |
0.54 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/caspian-0 |
2024-06-08 |
0.81 |
-0.82 |
13 |
12 |
7 |
28 |
nguyenzzz |
11 |
11 |
1190.09 |
1191.87 |
0.71 |
5986.0 |
meseca-02072024-v1-2e_v1 |
8B |
meseca/02072024-v1-2e |
meseca-02072024-v1-2e_v1 |
12702 |
25449 |
0.51 |
0.52 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
8 |
1024 |
64 |
LlamaForCausalLM |
meseca/02072024-v1-2e |
2024-07-02 |
0.17 |
0.27 |
11 |
11 |
20 |
13 |
nguyenzzz |
12 |
11 |
1191.87 |
1191.87 |
0.70 |
6011.0 |
meseca-02072024-v1-2e_v2 |
8B |
meseca/02072024-v1-2e |
meseca-02072024-v1-2e_v2 |
12747 |
25449 |
0.52 |
0.52 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/02072024-v1-2e |
2024-07-02 |
0.23 |
-0.04 |
19 |
11 |
19 |
20 |
nguyenzzz |
13 |
13 |
1199.21 |
1200.88 |
0.67 |
190.0 |
meseca-caspian-1_v1 |
8B |
meseca/caspian-1 |
meseca-caspian-1_v1 |
10282 |
43480 |
0.55 |
0.55 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/caspian-1 |
2024-06-02 |
0.50 |
-0.56 |
18 |
18 |
13 |
24 |
nguyenzzz |
14 |
14 |
1164.75 |
1164.75 |
0.77 |
8354.0 |
meseca-20062024-c1-dpo-1e_v2 |
8B |
meseca/20062024-c1-dpo-1e |
meseca-20062024-c1-dpo-1e_v2 |
14942 |
30221 |
0.48 |
0.48 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/20062024-c1-dpo-1 |
2024-06-27 |
-0.74 |
1.63 |
6 |
6 |
29 |
3 |
nguyenzzz |
15 |
13 |
1197.27 |
1200.88 |
0.67 |
202.0 |
meseca-caspian-1_v2 |
8B |
meseca/caspian-1 |
meseca-caspian-11_v1 |
8113 |
43480 |
0.52 |
0.55 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/caspian-1 |
2024-06-02 |
0.43 |
-0.57 |
26 |
18 |
16 |
25 |
nguyenzzz |
16 |
16 |
1198.37 |
1198.37 |
0.67 |
241.0 |
meseca-caspian-1-1_v2 |
8B |
meseca/caspian-1.1 |
meseca-caspian-11_v1 |
10273 |
18531 |
0.52 |
0.52 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/caspian-1.1 |
2024-06-02 |
0.47 |
-0.69 |
24 |
24 |
14 |
26 |
nguyenzzz |
17 |
17 |
1163.58 |
1163.58 |
0.76 |
7186.0 |
meseca-20062024-c1-dpo-2e_v2 |
8B |
meseca/20062024-c1-dpo-2e |
meseca-20062024-c1-dpo-2e_v2 |
13424 |
24698 |
0.48 |
0.48 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/20062024-c1-dpo-2 |
2024-06-27 |
-0.78 |
1.54 |
14 |
14 |
31 |
4 |
nguyenzzz |
18 |
18 |
1186.26 |
1186.26 |
0.70 |
808.0 |
meseca-05062024-v2_v1 |
8B |
meseca/05062024-v2 |
meseca-05062024-v2-2e_v1 |
10921 |
10921 |
0.50 |
0.50 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/05062024-v2 |
2024-06-06 |
0.03 |
0.02 |
20 |
20 |
21 |
18 |
nguyenzzz |
19 |
19 |
1179.93 |
1179.93 |
0.72 |
5955.0 |
meseca-02072024-v1-1e_v1 |
8B |
meseca/02072024-v1-1e |
meseca-02072024-v1-1e_v1 |
12641 |
25214 |
0.49 |
0.49 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
8 |
1024 |
64 |
LlamaForCausalLM |
meseca/02072024-v1-1e |
2024-07-02 |
-0.19 |
0.43 |
10 |
10 |
24 |
9 |
nguyenzzz |
20 |
20 |
1164.61 |
1164.61 |
0.75 |
7442.0 |
meseca-20062024-c1-dpo_v1 |
8B |
meseca/20062024-c1-dpo |
meseca-20062024-c1-dpo_v1 |
15605 |
15605 |
0.47 |
0.47 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/20062024-c1-dpo |
2024-06-27 |
-0.74 |
1.34 |
15 |
15 |
30 |
5 |
nguyenzzz |
21 |
13 |
1199.30 |
1200.88 |
0.65 |
326.0 |
meseca-caspian-1_v4 |
8B |
meseca/caspian-1 |
meseca-caspian-11_v1 |
12521 |
43480 |
0.52 |
0.55 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/caspian-1 |
2024-06-02 |
0.50 |
-1.03 |
28 |
18 |
12 |
30 |
nguyenzzz |
22 |
22 |
1177.70 |
1184.59 |
0.71 |
6794.0 |
meseca-05062024-v1_v2 |
8B |
meseca/05062024-v1 |
meseca-05062024-v1_v1 |
14646 |
40709 |
0.53 |
0.53 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/05062024-v1 |
2024-06-15 |
-0.27 |
0.23 |
25 |
23 |
26 |
14 |
nguyenzzz |
23 |
5 |
1201.10 |
1212.29 |
0.64 |
861.0 |
meseca-07062024-m1_v1 |
8B |
meseca/07062024-m1 |
meseca-caspian-11_v1 |
12264 |
48889 |
0.52 |
0.56 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/07062024-m1 |
2024-06-06 |
0.56 |
-1.32 |
27 |
5 |
9 |
32 |
nguyenzzz |
24 |
22 |
1175.33 |
1184.59 |
0.71 |
5329.0 |
meseca-05062024-v1_v3 |
8B |
meseca/05062024-v1 |
meseca-05062024-v1_v1 |
11340 |
40709 |
0.50 |
0.53 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/05062024-v1 |
2024-06-15 |
-0.36 |
0.32 |
23 |
23 |
28 |
11 |
nguyenzzz |
25 |
25 |
1183.70 |
1183.70 |
0.69 |
1997.0 |
meseca-05062024-v2-2e_v1 |
8B |
meseca/05062024-v2-2e |
meseca-05062024-v2-2e_v1 |
32003 |
32003 |
0.52 |
0.52 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/05062024-v2-2e |
2024-06-06 |
-0.06 |
-0.29 |
30 |
30 |
23 |
21 |
nguyenzzz |
26 |
22 |
1184.59 |
1184.59 |
0.68 |
904.0 |
meseca-05062024-v1_v1 |
8B |
meseca/05062024-v1 |
meseca-05062024-v1_v1 |
14723 |
40709 |
0.52 |
0.53 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/05062024-v1 |
2024-06-06 |
-0.03 |
-0.48 |
31 |
23 |
22 |
23 |
nguyenzzz |
27 |
19 |
1175.89 |
1179.93 |
0.70 |
5930.0 |
meseca-02072024-v1-1e_v2 |
8B |
meseca/02072024-v1-1e |
meseca-02072024-v1-1e_v2 |
12573 |
25214 |
0.49 |
0.49 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/02072024-v1-1e |
2024-07-02 |
-0.34 |
0.00 |
32 |
10 |
27 |
19 |
nguyenzzz |
28 |
16 |
1191.92 |
1198.37 |
0.65 |
254.0 |
meseca-caspian-1-1_v1 |
8B |
meseca/caspian-1.1 |
meseca-caspian-11_v1 |
8258 |
18531 |
0.51 |
0.52 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/caspian-1.1 |
2024-06-02 |
0.24 |
-1.12 |
34 |
24 |
18 |
31 |
nguyenzzz |
29 |
13 |
1200.88 |
1200.88 |
0.62 |
304.0 |
meseca-caspian-1_v3 |
8B |
meseca/caspian-1 |
meseca-caspian-11_v1 |
12564 |
43480 |
0.53 |
0.55 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/caspian-1 |
2024-06-02 |
0.56 |
-1.78 |
29 |
18 |
10 |
34 |
nguyenzzz |
30 |
30 |
1200.21 |
1200.21 |
0.62 |
253.0 |
meseca-sophon-1_v3 |
8B |
meseca/sophon-1 |
meseca-sophon-1_v1 |
11681 |
11681 |
0.53 |
0.53 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/sophon-1 |
2024-06-02 |
0.53 |
-1.81 |
33 |
33 |
11 |
35 |
nguyenzzz |
31 |
31 |
1144.21 |
1144.21 |
0.75 |
16219.0 |
meseca-07062024-m1-dpo-1-1e_v1 |
8B |
meseca/07062024-m1-dpo-1-1e |
07062024-m1-dpo |
33169 |
48284 |
0.45 |
0.45 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/07062024-m1-dpo-1 |
2024-06-17 |
-1.47 |
1.18 |
22 |
21 |
32 |
7 |
nguyenzzz |
32 |
32 |
1178.86 |
1178.86 |
0.64 |
920.0 |
meseca-05062024-v1-qlora_2149_v1 |
8B |
meseca/05062024-v1-qlora-merged |
meseca-05062024-v1-qlora_2149_v1 |
17319 |
17319 |
0.50 |
0.50 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
8 |
1024 |
64 |
LlamaForCausalLM |
meseca/05062024-v1-qlora |
2024-06-06 |
-0.23 |
-1.37 |
35 |
35 |
25 |
33 |
nguyenzzz |
33 |
31 |
1137.64 |
1144.21 |
0.75 |
7133.0 |
meseca-07062024-m1-dpo-1_v1 |
8B |
meseca/07062024-m1-dpo-1 |
07062024-m1-dpo |
15115 |
48284 |
0.43 |
0.45 |
basic |
ChaiML/reward_gpt2_medium_preference_24m_e2 |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/07062024-m1-dpo-1 |
2024-06-17 |
-1.71 |
1.31 |
21 |
21 |
33 |
6 |
nguyenzzz |
34 |
14 |
1104.66 |
1164.75 |
0.78 |
7554.0 |
meseca-20062024-c1-dpo-1e_v1 |
8B |
meseca/20062024-c1-dpo-1e |
meseca-20062024-c1-dpo-1e_v1 |
15279 |
30221 |
0.39 |
0.48 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/20062024-c1-dpo-1 |
2024-06-27 |
-2.88 |
1.89 |
16 |
6 |
34 |
1 |
nguyenzzz |
35 |
17 |
1103.09 |
1163.58 |
0.77 |
5622.0 |
meseca-20062024-c1-dpo-2e_v1 |
8B |
meseca/20062024-c1-dpo-2e |
meseca-20062024-c1-dpo-2e_v1 |
11274 |
24698 |
0.40 |
0.48 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16 |
512 |
64 |
LlamaForCausalLM |
meseca/20062024-c1-dpo-2 |
2024-06-27 |
-2.94 |
1.82 |
17 |
14 |
35 |
2 |