robert_irvine |
1 |
1 |
1238.52 |
1238.66 |
0.72 |
11197.0 |
nitral-ai-hathor-l3-8b-v-01_v43 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v43 |
65010 |
665050 |
0.51 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-06 |
2.05 |
0.10 |
1 |
1 |
2 |
31 |
robert_irvine |
2 |
1 |
1237.71 |
1238.66 |
0.72 |
11740.0 |
nitral-ai-hathor-l3-8b-v-01_v42 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v42 |
69120 |
665050 |
0.52 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-06 |
2.03 |
0.14 |
2 |
1 |
3 |
30 |
robert_irvine |
3 |
1 |
1236.97 |
1238.66 |
0.73 |
5655.0 |
nitral-ai-hathor-l3-8b-v-01_v12 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v12 |
32705 |
665050 |
0.56 |
0.58 |
basic |
ChaiML/gpt2_xl_pairwise_89m_step_347634 |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
2.00 |
0.17 |
3 |
1 |
5 |
29 |
robert_irvine |
4 |
1 |
1237.37 |
1238.66 |
0.72 |
5471.0 |
nitral-ai-hathor-l3-8b-v-01_v11 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v11 |
32108 |
665050 |
0.57 |
0.58 |
basic |
ChaiML/gpt2_xl_pairwise_89m_step_347634 |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
2.02 |
-0.14 |
6 |
1 |
4 |
34 |
robert_irvine |
5 |
1 |
1238.66 |
1238.66 |
0.71 |
5261.0 |
nitral-ai-hathor-l3-8b-v-01_v41 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v41 |
30522 |
665050 |
0.58 |
0.58 |
basic |
ChaiML/gpt2_xl_pairwise_89m_step_347634 |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
2.05 |
-0.35 |
12 |
1 |
1 |
44 |
robert_irvine |
6 |
1 |
1236.00 |
1238.66 |
0.72 |
5365.0 |
nitral-ai-hathor-l3-8b-v-01_v38 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v38 |
31159 |
665050 |
0.58 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
1.98 |
-0.23 |
13 |
1 |
6 |
39 |
robert_irvine |
7 |
1 |
1230.45 |
1238.66 |
0.71 |
5413.0 |
nitral-ai-hathor-l3-8b-v-01_v37 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v37 |
31623 |
665050 |
0.57 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
1.82 |
-0.31 |
16 |
1 |
7 |
42 |
robert_irvine |
8 |
1 |
1211.46 |
1238.66 |
0.72 |
5431.0 |
nitral-ai-hathor-l3-8b-v-01_v36 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v36 |
32012 |
665050 |
0.54 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
1.26 |
-0.06 |
7 |
1 |
8 |
33 |
robert_irvine |
9 |
9 |
1190.48 |
1190.48 |
0.74 |
6517.0 |
nousresearch-meta-llama_4941_v78 |
8B |
NousResearch/Meta-Llama-3-8B-Instruct |
nousresearch-meta-llama_4941_v78 |
13904 |
154899 |
0.53 |
0.53 |
basic |
ChaiML/gpt2_medium_pairwise_60m_step_937500 |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
NousResearch/Meta-Llama- |
2024-07-03 |
0.65 |
0.82 |
4 |
4 |
18 |
18 |
robert_irvine |
10 |
1 |
1192.03 |
1238.66 |
0.73 |
5499.0 |
nitral-ai-hathor-l3-8b-v-01_v35 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v35 |
32756 |
665050 |
0.51 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
0.70 |
0.59 |
5 |
1 |
16 |
21 |
robert_irvine |
11 |
1 |
1208.37 |
1238.66 |
0.71 |
5293.0 |
nitral-ai-hathor-l3-8b-v-01_v32 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v32 |
30543 |
665050 |
0.54 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
1.17 |
-0.36 |
20 |
1 |
9 |
45 |
robert_irvine |
12 |
12 |
1190.88 |
1190.88 |
0.73 |
41489.0 |
undi95-meta-llama-3-70b-_6209_v3 |
71B |
Undi95/Meta-Llama-3-70B-Instruct-hf |
undi95-meta-llama-3-70b-_6209_v3 |
100528 |
100528 |
0.50 |
0.50 |
basic |
rirv938/gpt2_ties_merge_preference_plus_classic_e2_density_99 |
2.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Undi95/Meta-Llama-3-70B- |
2024-04-24 |
0.67 |
0.45 |
8 |
8 |
17 |
24 |
robert_irvine |
13 |
13 |
1199.76 |
1205.12 |
0.72 |
10699.0 |
chaoticneutrals-poppy-p_3816_v13 |
8B |
ChaoticNeutrals/Poppy_Porpoise-0.72-L3-8B |
chaoticneutrals-poppy-p_3816_v13 |
36034 |
193711 |
0.51 |
0.53 |
basic |
rirv938/gpt2_medium_pairwise_60m_step_1875000 |
8.0 |
512.0 |
64.0 |
LlamaForCausalLM |
ChaoticNeutrals/Poppy_Po |
2024-06-10 |
0.92 |
-0.16 |
15 |
15 |
12 |
35 |
robert_irvine |
14 |
13 |
1201.16 |
1205.12 |
0.71 |
10331.0 |
chaoticneutrals-poppy-p_3816_v14 |
8B |
ChaoticNeutrals/Poppy_Porpoise-0.72-L3-8B |
chaoticneutrals-poppy-p_3816_v14 |
34719 |
193711 |
0.51 |
0.53 |
basic |
rirv938/gpt2_medium_pairwise_60m_step_937500 |
8.0 |
512.0 |
64.0 |
LlamaForCausalLM |
ChaoticNeutrals/Poppy_Po |
2024-06-10 |
0.96 |
-0.44 |
25 |
15 |
11 |
48 |
robert_irvine |
15 |
9 |
1181.74 |
1190.48 |
0.73 |
6782.0 |
nousresearch-meta-llama_4941_v73 |
8B |
NousResearch/Meta-Llama-3-8B-Instruct |
nousresearch-meta-llama_4941_v73 |
14108 |
154899 |
0.52 |
0.53 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
NousResearch/Meta-Llama- |
2024-07-03 |
0.40 |
0.58 |
11 |
4 |
22 |
22 |
robert_irvine |
16 |
1 |
1169.01 |
1238.66 |
0.75 |
5209.0 |
nitral-ai-hathor-l3-8b-v-01_v34 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v34 |
29338 |
665050 |
0.48 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
0.03 |
1.18 |
9 |
1 |
32 |
10 |
robert_irvine |
17 |
9 |
1175.12 |
1190.48 |
0.74 |
6697.0 |
nousresearch-meta-llama_4941_v77 |
8B |
NousResearch/Meta-Llama-3-8B-Instruct |
nousresearch-meta-llama_4941_v77 |
13930 |
154899 |
0.51 |
0.53 |
basic |
ChaiML/gpt2_medium_pairwise_60m_step_937500 |
8.0 |
512.0 |
64.0 |
LlamaForCausalLM |
NousResearch/Meta-Llama- |
2024-07-03 |
0.21 |
0.83 |
10 |
4 |
26 |
17 |
robert_irvine |
18 |
13 |
1192.45 |
1205.12 |
0.72 |
11327.0 |
chaoticneutrals-poppy-p_3816_v11 |
8B |
ChaoticNeutrals/Poppy_Porpoise-0.72-L3-8B |
chaoticneutrals-poppy-p_3816_v11 |
37770 |
193711 |
0.50 |
0.53 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
8.0 |
512.0 |
64.0 |
LlamaForCausalLM |
ChaoticNeutrals/Poppy_Po |
2024-06-10 |
0.71 |
-0.18 |
17 |
15 |
15 |
36 |
robert_irvine |
19 |
13 |
1205.12 |
1205.12 |
0.70 |
657.0 |
chaoticneutrals-poppy-po_3816_v6 |
8B |
ChaoticNeutrals/Poppy_Porpoise-0.72-L3-8B |
chaoticneutrals-poppy-po_3816_v6 |
7161 |
193711 |
0.53 |
0.53 |
basic |
rirv938/gpt2_medium_pairwise_60m_step_937500 |
8.0 |
512.0 |
64.0 |
LlamaForCausalLM |
ChaoticNeutrals/Poppy_Po |
2024-06-09 |
1.08 |
-1.22 |
35 |
15 |
10 |
60 |
robert_irvine |
20 |
9 |
1159.34 |
1190.48 |
0.75 |
6789.0 |
nousresearch-meta-llama_4941_v76 |
8B |
NousResearch/Meta-Llama-3-8B-Instruct |
nousresearch-meta-llama_4941_v76 |
14023 |
154899 |
0.48 |
0.53 |
basic |
ChaiML/gpt2_medium_pairwise_60m_step_937500 |
4.0 |
512.0 |
64.0 |
LlamaForCausalLM |
NousResearch/Meta-Llama- |
2024-07-03 |
-0.25 |
1.23 |
14 |
4 |
39 |
8 |
robert_irvine |
21 |
1 |
1141.40 |
1238.66 |
0.77 |
5312.0 |
nitral-ai-hathor-l3-8b-v-01_v17 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v17 |
30261 |
665050 |
0.44 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
4.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
-0.77 |
2.08 |
18 |
1 |
50 |
1 |
robert_irvine |
22 |
22 |
1172.29 |
1184.90 |
0.73 |
6203.0 |
jellywibble-lora-120k-pr_2827_v8 |
8B |
Jellywibble/lora_120k_pref_data_ep2 |
jellywibble-lora-120k-pr_2827_v8 |
36438 |
71838 |
0.48 |
0.50 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Jellywibble/lora_120k_pr |
2024-07-05 |
0.13 |
0.41 |
19 |
19 |
28 |
25 |
robert_irvine |
23 |
13 |
1188.72 |
1205.12 |
0.71 |
10218.0 |
chaoticneutrals-poppy-p_3816_v15 |
8B |
ChaoticNeutrals/Poppy_Porpoise-0.72-L3-8B |
chaoticneutrals-poppy-p_3816_v15 |
34206 |
193711 |
0.49 |
0.53 |
basic |
rirv938/gpt2_medium_pairwise_60m_step_187500 |
8.0 |
512.0 |
64.0 |
LlamaForCausalLM |
ChaoticNeutrals/Poppy_Po |
2024-06-10 |
0.60 |
-0.48 |
34 |
15 |
20 |
49 |
robert_irvine |
24 |
22 |
1184.90 |
1184.90 |
0.72 |
6111.0 |
jellywibble-lora-120k-pr_2827_v9 |
8B |
Jellywibble/lora_120k_pref_data_ep2 |
jellywibble-lora-120k-pr_2827_v9 |
35400 |
71838 |
0.50 |
0.50 |
basic |
Jellywibble/CHAI_alignment_reward_model |
1.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Jellywibble/lora_120k_pr |
2024-07-05 |
0.49 |
-0.27 |
27 |
19 |
21 |
40 |
robert_irvine |
25 |
9 |
1163.16 |
1190.48 |
0.73 |
6621.0 |
nousresearch-meta-llama_4941_v72 |
8B |
NousResearch/Meta-Llama-3-8B-Instruct |
nousresearch-meta-llama_4941_v72 |
13938 |
154899 |
0.49 |
0.53 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
8.0 |
512.0 |
64.0 |
LlamaForCausalLM |
NousResearch/Meta-Llama- |
2024-07-03 |
-0.14 |
0.60 |
24 |
4 |
38 |
20 |
robert_irvine |
26 |
1 |
1138.23 |
1238.66 |
0.76 |
5502.0 |
nitral-ai-hathor-l3-8b-v-01_v14 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v14 |
32013 |
665050 |
0.44 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
-0.86 |
1.86 |
22 |
1 |
54 |
2 |
robert_irvine |
27 |
9 |
1153.42 |
1190.48 |
0.74 |
6723.0 |
nousresearch-meta-llama_4941_v71 |
8B |
NousResearch/Meta-Llama-3-8B-Instruct |
nousresearch-meta-llama_4941_v71 |
14378 |
154899 |
0.47 |
0.53 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
LlamaForCausalLM |
NousResearch/Meta-Llama- |
2024-07-03 |
-0.42 |
1.00 |
21 |
4 |
40 |
15 |
robert_irvine |
28 |
13 |
1190.23 |
1205.12 |
0.70 |
949.0 |
chaoticneutrals-poppy-po_3816_v4 |
8B |
ChaoticNeutrals/Poppy_Porpoise-0.72-L3-8B |
chaoticneutrals-poppy-po_3816_v4 |
10191 |
193711 |
0.51 |
0.53 |
basic |
rirv938/gpt2_medium_pairwise_60m_step_187500 |
8.0 |
512.0 |
64.0 |
LlamaForCausalLM |
ChaoticNeutrals/Poppy_Po |
2024-06-09 |
0.65 |
-1.03 |
41 |
15 |
19 |
55 |
robert_irvine |
29 |
1 |
1138.84 |
1238.66 |
0.76 |
5522.0 |
nitral-ai-hathor-l3-8b-v-01_v13 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v13 |
31505 |
665050 |
0.44 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
-0.85 |
1.66 |
23 |
1 |
53 |
3 |
robert_irvine |
30 |
30 |
1173.63 |
1179.36 |
0.72 |
20155.0 |
neversleep-noromaid-v0-_8068_v89 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v89 |
15243 |
523610 |
0.53 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-01 |
0.16 |
-0.22 |
29 |
29 |
27 |
38 |
robert_irvine |
31 |
13 |
1196.73 |
1205.12 |
0.69 |
1920.0 |
chaoticneutrals-poppy-po_3816_v5 |
8B |
ChaoticNeutrals/Poppy_Porpoise-0.72-L3-8B |
chaoticneutrals-poppy-po_3816_v5 |
22664 |
193711 |
0.52 |
0.53 |
basic |
rirv938/gpt2_medium_pairwise_60m_step_468750 |
8.0 |
512.0 |
64.0 |
LlamaForCausalLM |
ChaoticNeutrals/Poppy_Po |
2024-06-09 |
0.84 |
-1.58 |
44 |
15 |
13 |
65 |
robert_irvine |
32 |
13 |
1194.18 |
1205.12 |
0.69 |
992.0 |
chaoticneutrals-poppy-po_3816_v3 |
8B |
ChaoticNeutrals/Poppy_Porpoise-0.72-L3-8B |
chaoticneutrals-poppy-po_3816_v3 |
10966 |
193711 |
0.51 |
0.53 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
8.0 |
512.0 |
64.0 |
LlamaForCausalLM |
ChaoticNeutrals/Poppy_Po |
2024-06-09 |
0.76 |
-1.56 |
45 |
15 |
14 |
64 |
robert_irvine |
33 |
9 |
1140.80 |
1190.48 |
0.75 |
6672.0 |
nousresearch-meta-llama_4941_v75 |
8B |
NousResearch/Meta-Llama-3-8B-Instruct |
nousresearch-meta-llama_4941_v75 |
13942 |
154899 |
0.46 |
0.53 |
basic |
ChaiML/gpt2_medium_pairwise_60m_step_937500 |
2.0 |
512.0 |
64.0 |
LlamaForCausalLM |
NousResearch/Meta-Llama- |
2024-07-03 |
-0.79 |
1.18 |
26 |
4 |
51 |
9 |
robert_irvine |
34 |
30 |
1179.36 |
1179.36 |
0.70 |
714.0 |
neversleep-noromaid-v0-_8068_v68 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v68 |
5319 |
523610 |
0.50 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
1024.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-09 |
0.33 |
-0.94 |
43 |
29 |
23 |
54 |
robert_irvine |
35 |
30 |
1171.03 |
1179.36 |
0.71 |
2106.0 |
neversleep-noromaid-v0-_8068_v65 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v65 |
28305 |
523610 |
0.49 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
1024.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-07 |
0.09 |
-0.50 |
47 |
29 |
29 |
50 |
robert_irvine |
36 |
30 |
1168.79 |
1179.36 |
0.71 |
6041.0 |
neversleep-noromaid-v0_8068_v113 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0_8068_v113 |
13150 |
523610 |
0.49 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-02 |
0.02 |
-0.38 |
48 |
29 |
33 |
46 |
robert_irvine |
37 |
1 |
1139.39 |
1238.66 |
0.75 |
5408.0 |
nitral-ai-hathor-l3-8b-v-01_v16 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v16 |
31110 |
665050 |
0.44 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
4.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
-0.83 |
1.18 |
28 |
1 |
52 |
11 |
robert_irvine |
38 |
1 |
1150.16 |
1238.66 |
0.73 |
5347.0 |
nitral-ai-hathor-l3-8b-v-01_v15 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v15 |
31480 |
665050 |
0.45 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
1.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
-0.52 |
0.57 |
30 |
1 |
44 |
23 |
robert_irvine |
39 |
30 |
1164.85 |
1179.36 |
0.71 |
6313.0 |
neversleep-noromaid-v0_8068_v112 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0_8068_v112 |
13395 |
523610 |
0.48 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-02 |
-0.09 |
-0.32 |
46 |
29 |
35 |
43 |
robert_irvine |
40 |
30 |
1178.03 |
1179.36 |
0.70 |
2891.0 |
neversleep-noromaid-v0-_8068_v64 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v64 |
37551 |
523610 |
0.51 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
1024.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-07 |
0.29 |
-1.09 |
50 |
29 |
24 |
57 |
robert_irvine |
41 |
1 |
1132.03 |
1238.66 |
0.75 |
5498.0 |
nitral-ai-hathor-l3-8b-v-01_v26 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v26 |
31495 |
665050 |
0.43 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
-1.04 |
1.33 |
31 |
1 |
61 |
7 |
robert_irvine |
42 |
1 |
1137.47 |
1238.66 |
0.74 |
5304.0 |
nitral-ai-hathor-l3-8b-v-01_v39 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v39 |
30780 |
665050 |
0.43 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
-0.89 |
1.01 |
32 |
1 |
55 |
14 |
robert_irvine |
43 |
43 |
1163.84 |
1164.70 |
0.71 |
653.0 |
mistralai-mixtral-8x7b-_3473_v44 |
47B |
mistralai/Mixtral-8x7B-Instruct-v0.1 |
mistralai-mixtral-8x7b-_3473_v44 |
9816 |
19643 |
0.49 |
0.49 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
mistralai/Mixtral-8x7B-I |
2024-06-06 |
-0.12 |
-0.51 |
56 |
56 |
37 |
51 |
robert_irvine |
44 |
9 |
1132.69 |
1190.48 |
0.75 |
6731.0 |
nousresearch-meta-llama_4941_v70 |
8B |
NousResearch/Meta-Llama-3-8B-Instruct |
nousresearch-meta-llama_4941_v70 |
14218 |
154899 |
0.44 |
0.53 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
2.0 |
512.0 |
64.0 |
LlamaForCausalLM |
NousResearch/Meta-Llama- |
2024-07-03 |
-1.02 |
1.15 |
37 |
4 |
60 |
12 |
robert_irvine |
45 |
1 |
1133.98 |
1238.66 |
0.74 |
5132.0 |
nitral-ai-hathor-l3-8b-v-01_v33 |
8B |
Nitral-AI/Hathor-L3-8B-v.01 |
nitral-ai-hathor-l3-8b-v-01_v33 |
29510 |
665050 |
0.43 |
0.58 |
basic |
Jellywibble/CHAI_alignment_reward_model |
16.0 |
512.0 |
64.0 |
LlamaForCausalLM |
Nitral-AI/Hathor-L3-8B-v |
2024-07-05 |
-0.99 |
1.04 |
36 |
1 |
59 |
13 |
robert_irvine |
46 |
43 |
1164.70 |
1164.70 |
0.71 |
913.0 |
mistralai-mixtral-8x7b-_3473_v45 |
47B |
mistralai/Mixtral-8x7B-Instruct-v0.1 |
mistralai-mixtral-8x7b-_3473_v45 |
9827 |
19643 |
0.49 |
0.49 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
mistralai/Mixtral-8x7B-I |
2024-06-06 |
-0.09 |
-0.71 |
57 |
56 |
36 |
53 |
robert_irvine |
47 |
30 |
1170.80 |
1179.36 |
0.70 |
20290.0 |
neversleep-noromaid-v0-_8068_v80 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v80 |
61476 |
523610 |
0.54 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-10 |
0.08 |
-1.05 |
54 |
29 |
30 |
56 |
robert_irvine |
48 |
30 |
1145.42 |
1179.36 |
0.73 |
6359.0 |
neversleep-noromaid-v0-_8068_v97 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v97 |
13351 |
523610 |
0.49 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-01 |
-0.65 |
0.25 |
39 |
29 |
46 |
28 |
robert_irvine |
49 |
30 |
1169.28 |
1179.36 |
0.70 |
17519.0 |
neversleep-noromaid-v0-_8068_v83 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v83 |
52990 |
523610 |
0.53 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-10 |
0.04 |
-1.11 |
58 |
29 |
31 |
58 |
robert_irvine |
50 |
30 |
1142.02 |
1179.36 |
0.73 |
6436.0 |
neversleep-noromaid-v0-_8068_v94 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v94 |
13814 |
523610 |
0.48 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-01 |
-0.75 |
0.36 |
42 |
29 |
49 |
26 |
robert_irvine |
51 |
30 |
1152.13 |
1179.36 |
0.72 |
5990.0 |
neversleep-noromaid-v0_8068_v108 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0_8068_v108 |
12745 |
523610 |
0.47 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-01 |
-0.46 |
-0.18 |
49 |
29 |
42 |
37 |
robert_irvine |
52 |
30 |
1151.84 |
1179.36 |
0.71 |
512.0 |
neversleep-noromaid-v0-_8068_v69 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v69 |
3662 |
523610 |
0.46 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
1024.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-09 |
-0.47 |
-0.40 |
59 |
29 |
43 |
47 |
robert_irvine |
53 |
30 |
1136.75 |
1179.36 |
0.73 |
6481.0 |
neversleep-noromaid-v0-_8068_v96 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v96 |
13350 |
523610 |
0.47 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-01 |
-0.91 |
0.28 |
53 |
29 |
57 |
27 |
robert_irvine |
54 |
9 |
1113.56 |
1190.48 |
0.75 |
6723.0 |
nousresearch-meta-llama_4941_v69 |
8B |
NousResearch/Meta-Llama-3-8B-Instruct |
nousresearch-meta-llama_4941_v69 |
14313 |
154899 |
0.42 |
0.53 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
1.0 |
512.0 |
64.0 |
LlamaForCausalLM |
NousResearch/Meta-Llama- |
2024-07-03 |
-1.58 |
1.52 |
33 |
4 |
65 |
4 |
robert_irvine |
55 |
9 |
1112.63 |
1190.48 |
0.75 |
6573.0 |
nousresearch-meta-llama_4941_v68 |
8B |
NousResearch/Meta-Llama-3-8B-Instruct |
nousresearch-meta-llama_4941_v68 |
14327 |
154899 |
0.42 |
0.53 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
1.0 |
512.0 |
64.0 |
LlamaForCausalLM |
NousResearch/Meta-Llama- |
2024-07-03 |
-1.61 |
1.46 |
38 |
4 |
67 |
5 |
robert_irvine |
56 |
30 |
1168.72 |
1179.36 |
0.69 |
2799.0 |
neversleep-noromaid-v0-_8068_v63 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v63 |
37930 |
523610 |
0.49 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-07 |
0.02 |
-1.63 |
63 |
29 |
34 |
66 |
robert_irvine |
57 |
30 |
1142.45 |
1179.36 |
0.72 |
5291.0 |
neversleep-noromaid-v0-_8068_v93 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v93 |
11099 |
523610 |
0.46 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-01 |
-0.74 |
-0.28 |
55 |
29 |
47 |
41 |
robert_irvine |
58 |
9 |
1110.98 |
1190.48 |
0.75 |
6467.0 |
nousresearch-meta-llama_4941_v74 |
8B |
NousResearch/Meta-Llama-3-8B-Instruct |
nousresearch-meta-llama_4941_v74 |
13818 |
154899 |
0.41 |
0.53 |
basic |
ChaiML/gpt2_medium_pairwise_60m_step_937500 |
1.0 |
512.0 |
64.0 |
LlamaForCausalLM |
NousResearch/Meta-Llama- |
2024-07-03 |
-1.66 |
1.39 |
40 |
4 |
68 |
6 |
robert_irvine |
59 |
30 |
1146.21 |
1179.36 |
0.71 |
1036.0 |
neversleep-noromaid-v0-_8068_v74 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v74 |
9320 |
523610 |
0.45 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
1024.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-09 |
-0.63 |
-0.70 |
62 |
29 |
45 |
52 |
robert_irvine |
60 |
30 |
1177.55 |
1179.36 |
0.67 |
586.0 |
neversleep-noromaid-v0-_8068_v73 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v73 |
6608 |
523610 |
0.49 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
1024.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-09 |
0.28 |
-2.41 |
60 |
29 |
25 |
68 |
robert_irvine |
61 |
30 |
1120.45 |
1179.36 |
0.73 |
5420.0 |
neversleep-noromaid-v0_8068_v105 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0_8068_v105 |
11174 |
523610 |
0.42 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-01 |
-1.38 |
0.61 |
52 |
29 |
64 |
19 |
robert_irvine |
62 |
30 |
1112.79 |
1179.36 |
0.74 |
5268.0 |
neversleep-noromaid-v0_8068_v106 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0_8068_v106 |
10825 |
523610 |
0.41 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-01 |
-1.60 |
0.92 |
51 |
29 |
66 |
16 |
robert_irvine |
63 |
30 |
1127.34 |
1179.36 |
0.72 |
6539.0 |
neversleep-noromaid-v0-_8068_v95 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v95 |
14032 |
523610 |
0.46 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-01 |
-1.18 |
-0.03 |
61 |
29 |
63 |
32 |
robert_irvine |
64 |
30 |
1152.85 |
1179.36 |
0.68 |
1386.0 |
neversleep-noromaid-v0-_8068_v66 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v66 |
17212 |
523610 |
0.46 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
1024.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-09 |
-0.44 |
-1.74 |
64 |
29 |
41 |
67 |
robert_irvine |
65 |
30 |
1142.17 |
1179.36 |
0.69 |
5671.0 |
neversleep-noromaid-v0-_8068_v85 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v85 |
16478 |
523610 |
0.45 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-10 |
-0.75 |
-1.34 |
65 |
29 |
48 |
61 |
robert_irvine |
66 |
30 |
1137.14 |
1179.36 |
0.70 |
14929.0 |
neversleep-noromaid-v0-_8068_v82 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v82 |
45676 |
523610 |
0.47 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-10 |
-0.90 |
-1.20 |
66 |
29 |
56 |
59 |
robert_irvine |
67 |
30 |
1135.05 |
1179.36 |
0.69 |
5272.0 |
neversleep-noromaid-v0_8068_v107 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0_8068_v107 |
10819 |
523610 |
0.44 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-07-01 |
-0.96 |
-1.37 |
67 |
29 |
58 |
62 |
robert_irvine |
68 |
30 |
1127.82 |
1179.36 |
0.69 |
15882.0 |
neversleep-noromaid-v0-_8068_v81 |
47B |
NeverSleep/Noromaid-v0.1-mixtral-8x7b-Instruct-v3 |
neversleep-noromaid-v0-_8068_v81 |
48086 |
523610 |
0.46 |
0.54 |
basic |
rirv938/reward_gpt2_medium_preference_24m_e2 |
4.0 |
512.0 |
64.0 |
MixtralForCausalLM |
NeverSleep/Noromaid-v0.1 |
2024-06-10 |
-1.17 |
-1.43 |
68 |
29 |
62 |
63 |