rirv938 | 1 | 1.0 | 1.0 | 1353.66 | 1353.66 | 0.54 | 0.99 | rirv938-grpo-to-compare_72853_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp312_lr6_merged | rirv938-grpo-to-compare_72853_v1 | 10217 | 61115860 | 0.58 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-25 | single | 1.45 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 2.0 | 1.0 | 1353.56 | 1353.66 | 0.0 | 0.99 | rirv938-96p-4ff-rirv938_38486_v1 | 24B | rirv938/96p_4ff_rirv938_20k_100p_0ff_ri_19485_v1_cp2250_v3 | rirv938-96p-4ff-rirv938_38486_v1 | 7582 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-04-03 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 3.0 | 1.0 | 1353.38 | 1353.66 | 0.55 | 0.99 | rirv938-94p-6ff-rirv938_67490_v3 | 24B | rirv938/94p_6ff_rirv938_20k_100p_0ff_ri_19485_v1_cp2250_merged | rirv938-94p-6ff-rirv938_67490_v3 | 7897 | 61115860 | 0.59 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-03 | single | 0.63 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 4.0 | 1.0 | 1352.15 | 1353.66 | 0.52 | 0.99 | rirv938-97p-3ff-rirv938_56000_v1 | 24B | rirv938/97p_3ff_rirv938_20k_100p_0ff_ri_19485_v1_cp2250_v3 | rirv938-97p-3ff-rirv938_56000_v1 | 9723 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/97p_3ff_rirv938_ | 2025-04-03 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 5.0 | 1.0 | 1349.98 | 1353.66 | 0.53 | 0.99 | rirv938-grpo-to-compare_72853_v2 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp312_lr6_merged | rirv938-grpo-to-compare_72853_v2 | 10233 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-25 | single | 1.46 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 6.0 | 1.0 | 1349.11 | 1353.66 | 0.53 | 0.99 | rirv938-96p-4ff-rirv938_38486_v2 | 24B | rirv938/96p_4ff_rirv938_20k_100p_0ff_ri_19485_v1_cp2250_v3 | rirv938-96p-4ff-rirv938_38486_v2 | 9270 | 61115860 | 0.58 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-04-03 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 7.0 | 1.0 | 1348.91 | 1353.66 | 0.5 | 0.99 | rirv938-anthropic-grpo-_96183_v1 | 13B | rirv938/anthropic_grpo_40k_cp1184_0ff_merged | rirv938-anthropic-grpo-_96183_v1 | 8865 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-30 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 8.0 | 1.0 | 1348.54 | 1353.66 | 0.49 | 0.99 | function_jenir_2025-03-30 | | | dpo_data_collection | 8712 | 61115860 | 0.59 | 0.65 | function | | | | | | | 2025-03-29 | single | | |
rirv938 | 1 | 9.0 | 1.0 | 1348.25 | 1353.66 | 0.55 | 0.99 | rirv938-94p-6ff-rirv938_67490_v1 | 24B | rirv938/94p_6ff_rirv938_20k_100p_0ff_ri_19485_v1_cp2250_merged | rirv938-94p-6ff-rirv938_67490_v1 | 7122 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-03 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 10.0 | 1.0 | 1347.52 | 1353.66 | 0.51 | 0.99 | rirv938-98p-2ff-rirv938_45880_v2 | 24B | rirv938/98p_2ff_rirv938_20k_100p_0ff_ri_19485_v1_cp1496_v3 | rirv938-98p-2ff-rirv938_45880_v2 | 8864 | 61115860 | 0.58 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-02 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 11.0 | 1.0 | 1345.5 | 1353.66 | 0.6 | 0.99 | rirv938-tune-mistral-gr_58521_v1 | 24B | rirv938/tune_mistral_grpo_cp1184_92ff_new_merged | rirv938-tune-mistral-gr_58521_v1 | 6092 | 61115860 | 0.59 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-05-01 | single | 1.7 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 12.0 | 1.0 | 1345.38 | 1353.66 | 0.52 | 0.99 | chaiml-anthropic-grpo-4_77013_v1 | 13B | ChaiML/anthropic_grpo_40k_cp888_0ff | chaiml-anthropic-grpo-4_77013_v1 | 11349 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/anthropic_grpo_40 | 2025-05-01 | single | 1.61 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 13.0 | 1.0 | 1345.37 | 1353.66 | 0.54 | 0.99 | rirv938-94p-6ff-rirv938_15047_v1 | 24B | rirv938/94p_6ff_rirv938_20k_100p_0ff_ri_19485_v1_cp1125_merged | rirv938-94p-6ff-rirv938_15047_v1 | 8861 | 61115860 | 0.61 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-03 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 14.0 | 1.0 | 1345.13 | 1353.66 | 0.52 | 0.99 | chaiml-ahab-v2-rirv938-_54360_v2 | 24B | ChaiML/ahab_v2_rirv938_20250423 | chaiml-ahab-v2-rirv938-_54360_v2 | 10959 | 61115860 | 0.58 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/ahab_v2_rirv938_2 | 2025-04-22 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 15.0 | 1.0 | 1345.1 | 1353.66 | 0.52 | 0.99 | chaiml-ahab-v2-rirv938-_54360_v1 | 24B | ChaiML/ahab_v2_rirv938_20250423 | chaiml-ahab-v2-rirv938-_54360_v1 | 10166 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/ahab_v2_rirv938_2 | 2025-04-22 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 16.0 | 1.0 | 1344.25 | 1353.66 | 0.6 | 0.99 | chaiml-mistral-24b-grpo_58640_v1 | 24B | ChaiML/mistral_24b_grpo_cp1184_92ff | chaiml-mistral-24b-grpo_58640_v1 | 8374 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/mistral_24b_grpo_ | 2025-05-01 | single | 1.7 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 17.0 | 1.0 | 1344.0 | 1353.66 | 0.0 | 0.99 | rirv938-98p-2ff-rirv938_45880_v1 | 24B | rirv938/98p_2ff_rirv938_20k_100p_0ff_ri_19485_v1_cp1496_v3 | rirv938-98p-2ff-rirv938_45880_v1 | 6811 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-02 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 18.0 | 1.0 | 1343.9 | 1353.66 | 0.5 | 0.99 | rirv938-anthropic-grpo-_10659_v1 | 13B | rirv938/anthropic_grpo_40k_cp592_0ff_merged | rirv938-anthropic-grpo-_10659_v1 | 7433 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-30 | single | 1.64 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 19.0 | 1.0 | 1343.5 | 1353.66 | 0.53 | 0.99 | function_tafeb_2025-04-22 | | | dpo_data_collection | 7931 | 61115860 | 0.58 | 0.65 | function | | | | | | | 2025-04-21 | single | | |
rirv938 | 1 | 20.0 | 1.0 | 1342.83 | 1353.66 | 0.51 | 0.99 | rirv938-97p-3ff-rirv938-_7194_v1 | 24B | rirv938/97p_3ff_rirv938_20k_100p_0ff_ri_19485_v1_cp1125_v3 | rirv938-97p-3ff-rirv938-_7194_v1 | 9168 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/97p_3ff_rirv938_ | 2025-04-03 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 21.0 | 1.0 | 1342.77 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_29039_v1 | 13B | rirv938/anthropic_grpo_40k_cp1248_96ff_new_rm_merged | rirv938-anthropic-grpo-_29039_v1 | 6562 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 22.0 | 1.0 | 1342.51 | 1353.66 | 0.55 | 0.99 | chaiml-ahab-v1-20250423_v1 | 24B | ChaiML/ahab_v1_20250423 | chaiml-ahab-v1-20250423_v1 | 9717 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/ahab_v1_20250423 | 2025-04-22 | single | 1.75 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 23.0 | 1.0 | 1342.23 | 1353.66 | 0.53 | 0.99 | rirv938-96p-4ff-rirv938_33201_v1 | 24B | rirv938/96p_4ff_rirv938_20k_100p_0ff_ri_19485_v1_cp1500_v3 | rirv938-96p-4ff-rirv938_33201_v1 | 7643 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-04-03 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 24.0 | 1.0 | 1341.54 | 1353.66 | 0.56 | 0.99 | function_heron_2025-04-09 | | | dpo_data_collection | 5323 | 61115860 | 0.59 | 0.65 | function | | | | | | | 2025-04-09 | single | | |
rirv938 | 1 | 25.0 | 1.0 | 1341.2 | 1353.66 | 0.47 | 0.99 | rirv938-100p-0ff-rirv93_81442_v1 | 24B | rirv938/100p_0ff_rirv938_20k_100p_0ff_ri_19485_v1_cp561_v3 | rirv938-100p-0ff-rirv93_81442_v1 | 7680 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-02 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 26.0 | 1.0 | 1340.97 | 1353.66 | 0.52 | 0.99 | rirv938-96p-4ff-rirv938_74554_v1 | 24B | rirv938/96p_4ff_rirv938_20k_100p_0ff_ri_19485_v1_cp1125_v3 | rirv938-96p-4ff-rirv938_74554_v1 | 8796 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-04-03 | single | 0.81 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 27.0 | 1.0 | 1340.76 | 1353.66 | 0.53 | 0.99 | rirv938-anthropic-grpo-4_3554_v1 | 13B | rirv938/anthropic_grpo_40k_cp888_0ff_merged | rirv938-anthropic-grpo-4_3554_v1 | 9025 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-30 | single | 1.62 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 28.0 | 1.0 | 1340.57 | 1353.66 | 0.52 | 0.99 | chaiml-anthropic-grpo-4_77013_v2 | 13B | ChaiML/anthropic_grpo_40k_cp888_0ff | chaiml-anthropic-grpo-4_77013_v2 | 6960 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/anthropic_grpo_40 | 2025-05-01 | single | 1.62 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 29.0 | 1.0 | 1340.35 | 1353.66 | 0.55 | 0.99 | rirv938-mistral-24b-grp_72186_v1 | 24B | rirv938/mistral_24b_grpo_40k_cp1184_95ff_merged | rirv938-mistral-24b-grp_72186_v1 | 6279 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-04-29 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 30.0 | 1.0 | 1339.33 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_34483_v2 | 13B | rirv938/anthropic_grpo_40k_cp2184_96ff_new_rm_merged | rirv938-anthropic-grpo-_34483_v2 | 6504 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 31.0 | 1.0 | 1338.97 | 1353.66 | 0.5 | 0.99 | rirv938-98p-2ff-rirv938_26835_v1 | 24B | rirv938/98p_2ff_rirv938_20k_100p_0ff_ri_19485_v1_cp748_v3 | rirv938-98p-2ff-rirv938_26835_v1 | 6122 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-02 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 32.0 | 1.0 | 1338.95 | 1353.66 | 0.58 | 0.99 | rirv938-rinen-grpo-40k-_48409_v1 | 13B | rirv938/rinen_grpo_40k_cp1184_95ff_merged | rirv938-rinen-grpo-40k-_48409_v1 | 5660 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_40k_c | 2025-04-29 | single | 1.37 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 33.0 | 1.0 | 1338.8 | 1353.66 | 0.55 | 0.99 | rirv938-exp-grpo-cp624-_98027_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b1_r1_merged | rirv938-exp-grpo-cp624-_98027_v1 | 8041 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-25 | single | | |
rirv938 | 1 | 34.0 | 1.0 | 1338.6 | 1353.66 | 0.56 | 0.99 | rirv938-exp-grpo-cp312-_12850_v1 | 24B | rirv938/exp_grpo_cp312_96ff_b1_r1_merged | rirv938-exp-grpo-cp312-_12850_v1 | 7038 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-25 | single | | |
rirv938 | 1 | 35.0 | 1.0 | 1338.51 | 1353.66 | 0.49 | 0.99 | rirv938-98p-2ff-rirv938_71631_v1 | 24B | rirv938/98p_2ff_rirv938_20k_100p_0ff_ri_19485_v1_cp1122_v3 | rirv938-98p-2ff-rirv938_71631_v1 | 7254 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-02 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 36.0 | 1.0 | 1338.3 | 1353.66 | 0.49 | 0.99 | rirv938-98p-2ff-rirv938-_1456_v1 | 24B | rirv938/98p_2ff_rirv938_98p_2ff_rirv938_42155_v1_cp624_v3 | rirv938-98p-2ff-rirv938-_1456_v1 | 8861 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-03-29 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 37.0 | 1.0 | 1338.27 | 1353.66 | 0.56 | 0.99 | rirv938-mistral-24b-grp_89290_v1 | 24B | rirv938/mistral_24b_grpo_40k_cp592_92ff_merged | rirv938-mistral-24b-grp_89290_v1 | 6117 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-04-29 | single | 1.75 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 38.0 | 1.0 | 1338.15 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_34483_v1 | 13B | rirv938/anthropic_grpo_40k_cp2184_96ff_new_rm_merged | rirv938-anthropic-grpo-_34483_v1 | 6761 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 39.0 | 1.0 | 1337.84 | 1353.66 | 0.56 | 0.99 | rirv938-94p-6ff-rirv938-_8152_v3 | 24B | rirv938/94p_6ff_rirv938_20k_100p_0ff_ri_19485_v1_cp1500_merged | rirv938-94p-6ff-rirv938-_8152_v3 | 9925 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-22 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 40.0 | 1.0 | 1337.77 | 1353.66 | 0.57 | 0.99 | rirv938-mistral-24b-grp_17707_v1 | 24B | rirv938/mistral_24b_grpo_40k_cp888_92ff_merged | rirv938-mistral-24b-grp_17707_v1 | 6272 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-04-29 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 41.0 | 1.0 | 1337.74 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-cp15_67201_v1 | 13B | rirv938/rinen_grpo_cp156_97ff_ava_bo1_b4_round3_merged | rirv938-rinen-grpo-cp15_67201_v1 | 6549 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp156 | 2025-05-22 | single | | |
rirv938 | 1 | 42.0 | 1.0 | 1337.7 | 1353.66 | 0.6 | 0.99 | rirv938-tune-mistral-grp_3576_v1 | 24B | rirv938/tune_mistral_grpo_cp592_92ff_new_merged | rirv938-tune-mistral-grp_3576_v1 | 6143 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-05-01 | single | 1.74 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 43.0 | 1.0 | 1337.69 | 1353.66 | 0.56 | 0.99 | function_ruhok_2025-04-09 | | | dpo_data_collection | 6821 | 61115860 | 0.59 | 0.65 | function | | | | | | | 2025-04-09 | single | | |
rirv938 | 1 | 44.0 | 1.0 | 1337.53 | 1353.66 | 0.52 | 0.99 | rirv938-96p-4ff-rirv938_48622_v1 | 24B | rirv938/96p_4ff_rirv938_20k_100p_0ff_ri_19485_v1_cp750_v3 | rirv938-96p-4ff-rirv938_48622_v1 | 7641 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-04-03 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 45.0 | 1.0 | 1337.5 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-40k-_80959_v1 | 13B | rirv938/rinen_grpo_40k_cp592_95ff_run2_merged | rirv938-rinen-grpo-40k-_80959_v1 | 8187 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_40k_c | 2025-04-30 | single | 1.38 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 46.0 | 1.0 | 1337.48 | 1353.66 | 0.47 | 0.99 | rirv938-98p-2ff-nischay_31669_v1 | 24B | rirv938/98p_2ff_nischaydnk_exp14_exp9dp_94555_v3_cp624_merged | rirv938-98p-2ff-nischay_31669_v1 | 8680 | 61115860 | 0.58 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_nischayd | 2025-04-10 | single | 0.65 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 47.0 | 1.0 | 1337.29 | 1353.66 | 0.55 | 0.99 | chaiml-rinen-grpo-40k-c_51339_v1 | 13B | ChaiML/rinen_grpo_40k_cp296_95ff | chaiml-rinen-grpo-40k-c_51339_v1 | 8271 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/rinen_grpo_40k_cp | 2025-05-01 | single | 1.39 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 48.0 | 1.0 | 1337.11 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-40k-_71220_v1 | 13B | rirv938/rinen_grpo_40k_cp888_95ff_run2_merged | rirv938-rinen-grpo-40k-_71220_v1 | 8869 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_40k_c | 2025-04-30 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 49.0 | 1.0 | 1337.1 | 1353.66 | 0.54 | 0.99 | rirv938-grpo-to-compare_87284_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp156_lr6_merged | rirv938-grpo-to-compare_87284_v1 | 10625 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-25 | single | 1.44 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 50.0 | 1.0 | 1337.08 | 1353.66 | 0.56 | 0.99 | function_nelob_2025-04-09 | | | dpo_data_collection | 6922 | 61115860 | 0.58 | 0.65 | function | | | | | | | 2025-04-09 | single | | |
rirv938 | 1 | 51.0 | 1.0 | 1336.95 | 1353.66 | 0.55 | 0.99 | function_tumif_2025-04-09 | | | dpo_data_collection | 5562 | 61115860 | 0.59 | 0.65 | function | | | | | | | 2025-04-09 | single | | |
rirv938 | 1 | 52.0 | 1.0 | 1336.94 | 1353.66 | 0.55 | 0.99 | rirv938-94p-6ff-rirv938_67490_v2 | 24B | rirv938/94p_6ff_rirv938_20k_100p_0ff_ri_19485_v1_cp2250_merged | rirv938-94p-6ff-rirv938_67490_v2 | 6224 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-03 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 53.0 | 1.0 | 1336.91 | 1353.66 | 0.55 | 0.99 | chaiml-ahab-v1-20250423_v4 | 24B | ChaiML/ahab_v1_20250423 | chaiml-ahab-v1-20250423_v4 | 8919 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/ahab_v1_20250423 | 2025-04-22 | single | 1.75 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 54.0 | 1.0 | 1336.67 | 1353.66 | 0.51 | 0.99 | function_libuf_2025-04-10 | | | dpo_data_collection | 7999 | 61115860 | 0.58 | 0.65 | function | | | | | | | 2025-04-10 | single | | |
rirv938 | 1 | 55.0 | 1.0 | 1336.47 | 1353.66 | 0.55 | 0.99 | rirv938-94p-6ff-rirv938-_8152_v1 | 24B | rirv938/94p_6ff_rirv938_20k_100p_0ff_ri_19485_v1_cp1500_merged | rirv938-94p-6ff-rirv938-_8152_v1 | 8418 | 61115860 | 0.6 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-03 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 56.0 | 1.0 | 1336.35 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_90777_v1 | 13B | rirv938/anthropic_grpo_40k_cp1184_95ff_merged | rirv938-anthropic-grpo-_90777_v1 | 6352 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.1 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 57.0 | 1.0 | 1336.32 | 1353.66 | 0.52 | 0.99 | rirv938-97p-3ff-rirv938_16641_v1 | 24B | rirv938/97p_3ff_rirv938_20k_100p_0ff_ri_19485_v1_cp1500_v3 | rirv938-97p-3ff-rirv938_16641_v1 | 9243 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/97p_3ff_rirv938_ | 2025-04-03 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 58.0 | 1.0 | 1335.76 | 1353.66 | 0.5 | 0.99 | rirv938-original-96p-4f_59555_v1 | 24B | rirv938/original_96p_4ff_rirv938_98p_2ff_rirv938_42155_v1_cp624_v3 | rirv938-original-96p-4f_59555_v1 | 7077 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/original_96p_4ff | 2025-03-31 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 59.0 | 1.0 | 1335.6 | 1353.66 | 0.5 | 0.99 | rirv938-98p-2ff-rirv938_30412_v1 | 24B | rirv938/98p_2ff_rirv938_20k_100p_0ff_ri_19485_v1_cp561_v3 | rirv938-98p-2ff-rirv938_30412_v1 | 7339 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-02 | single | 0.76 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 60.0 | 1.0 | 1335.48 | 1353.66 | 0.51 | 0.99 | rirv938-original-96p-4f_90259_v1 | 24B | rirv938/original_96p_4ff_rirv938_98p_2ff_rirv938_42155_v1_cp936_v3 | rirv938-original-96p-4f_90259_v1 | 7452 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/original_96p_4ff | 2025-03-31 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 61.0 | 1.0 | 1335.43 | 1353.66 | 0.57 | 0.99 | rirv938-rinen-grpo-40k-_73414_v1 | 13B | rirv938/rinen_grpo_40k_cp888_95ff_merged | rirv938-rinen-grpo-40k-_73414_v1 | 5885 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_40k_c | 2025-04-29 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 62.0 | 1.0 | 1334.97 | 1353.66 | 0.51 | 0.99 | rirv938-97p-3ff-rirv938_77477_v1 | 24B | rirv938/97p_3ff_rirv938_20k_100p_0ff_ri_19485_v1_cp750_v3 | rirv938-97p-3ff-rirv938_77477_v1 | 9403 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/97p_3ff_rirv938_ | 2025-04-03 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 63.0 | 1.0 | 1334.96 | 1353.66 | 0.58 | 0.99 | rirv938-anthropic-grpo-_77193_v1 | 13B | rirv938/anthropic_grpo_40k_cp624_96ff_new_rm_merged | rirv938-anthropic-grpo-_77193_v1 | 6486 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 64.0 | 1.0 | 1334.28 | 1353.66 | 0.55 | 0.99 | chaiml-ahab-v1-20250423_v3 | 24B | ChaiML/ahab_v1_20250423 | chaiml-ahab-v1-20250423_v3 | 7887 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/ahab_v1_20250423 | 2025-04-22 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 65.0 | 1.0 | 1334.27 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-4_3092_v1 | 13B | rirv938/anthropic_grpo_40k_cp888_95ff_merged | rirv938-anthropic-grpo-4_3092_v1 | 6855 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.37 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 66.0 | 1.0 | 1334.22 | 1353.66 | 0.51 | 0.99 | function_sebun_2025-04-03 | | | dpo_data_collection | 13285 | 61115860 | 0.57 | 0.65 | function | | | | | | | 2025-04-02 | single | | |
rirv938 | 1 | 67.0 | 1.0 | 1333.96 | 1353.66 | 0.49 | 0.99 | rirv938-original-98p-2f_90009_v1 | 24B | rirv938/original_98p_2ff_rirv938_98p_2ff_rirv938_42155_v1_cp624_v3 | rirv938-original-98p-2f_90009_v1 | 7695 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/original_98p_2ff | 2025-03-29 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 68.0 | 1.0 | 1333.88 | 1353.66 | 0.5 | 0.99 | rirv938-96p-4ff-rirv938_38604_v1 | 24B | rirv938/96p_4ff_rirv938_98p_2ff_rirv938_42155_v1_cp936_v3 | rirv938-96p-4ff-rirv938_38604_v1 | 6528 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-03-31 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 69.0 | 1.0 | 1333.7 | 1353.66 | 0.51 | 0.99 | rirv938-anthropic-grpo-_12477_v1 | 13B | rirv938/anthropic_grpo_40k_cp296_0ff_merged | rirv938-anthropic-grpo-_12477_v1 | 6443 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-30 | single | 1.59 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 70.0 | 1.0 | 1333.53 | 1353.66 | 0.48 | 0.99 | rirv938-original-98p-2f_88189_v1 | 24B | rirv938/original_98p_2ff_rirv938_98p_2ff_rirv938_42155_v1_cp312_v3 | rirv938-original-98p-2f_88189_v1 | 8537 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/original_98p_2ff | 2025-03-29 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 71.0 | 1.0 | 1333.38 | 1353.66 | 0.56 | 0.99 | rirv938-mistral-12b-dpo_75616_v2 | 13B | rirv938/mistral_12b_dpo_40k_2374_96_output_tokens_v2 | rirv938-mistral-12b-dpo_75616_v2 | 6084 | 61115860 | 0.65 | 0.65 | basic | | 8.0 | 768.0 | 96.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.02 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 72.0 | 1.0 | 1332.98 | 1353.66 | 0.48 | 0.99 | rirv938-100p-0ff-rirv93_34479_v1 | 24B | rirv938/100p_0ff_rirv938_20k_100p_0ff_ri_19485_v1_cp374_v3 | rirv938-100p-0ff-rirv93_34479_v1 | 5942 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-02 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 73.0 | 1.0 | 1332.92 | 1353.66 | 0.52 | 0.99 | function_rihit_2025-04-21 | | | dpo_data_collection | 7942 | 61115860 | 0.55 | 0.65 | function | | | | | | | 2025-04-21 | single | | |
rirv938 | 1 | 74.0 | 1.0 | 1332.65 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp624-_90544_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b4_r2_merged | rirv938-exp-grpo-cp624-_90544_v1 | 5639 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-23 | single | | |
rirv938 | 1 | 75.0 | 1.0 | 1332.63 | 1353.66 | 0.56 | 0.99 | rirv938-mistral-12b-dpo_33813_v2 | 13B | rirv938/mistral_12b_dpo_40k_3561_96_output_tokens_v2 | rirv938-mistral-12b-dpo_33813_v2 | 6116 | 61115860 | 0.61 | 0.65 | basic | | 8.0 | 768.0 | 96.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.03 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 76.0 | 1.0 | 1332.61 | 1353.66 | 0.52 | 0.99 | chaiml-ahab-v2-rirv938-_54360_v3 | 24B | ChaiML/ahab_v2_rirv938_20250423 | chaiml-ahab-v2-rirv938-_54360_v3 | 8351 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/ahab_v2_rirv938_2 | 2025-04-22 | single | 1.75 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 77.0 | 1.0 | 1332.29 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp624-_76327_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b2_r1_merged | rirv938-exp-grpo-cp624-_76327_v1 | 8575 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-25 | single | | |
rirv938 | 1 | 78.0 | 1.0 | 1332.2 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp312-9_2759_v2 | 24B | rirv938/exp_grpo_cp312_96ff_b6_r2_less_ff_merged | rirv938-exp-grpo-cp312-9_2759_v2 | 7149 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-26 | single | | |
rirv938 | 1 | 79.0 | 1.0 | 1331.81 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_51376_v1 | 13B | rirv938/anthropic_grpo_40k_cp592_95ff_merged | rirv938-anthropic-grpo-_51376_v1 | 5508 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.36 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 80.0 | 1.0 | 1331.6 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-cp31_50291_v1 | 13B | rirv938/rinen_grpo_cp312_97ff_ava_bo1_b4_round3_merged | rirv938-rinen-grpo-cp31_50291_v1 | 6349 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp312 | 2025-05-22 | single | | |
rirv938 | 1 | 81.5 | 1.0 | 1331.33 | 1353.66 | 0.47 | 0.99 | rirv938-100p-0ff-rirv93_76723_v1 | 24B | rirv938/100p_0ff_rirv938_20k_100p_0ff_ri_19485_v1_cp748_v3 | rirv938-100p-0ff-rirv93_76723_v1 | 5938 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-02 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 81.5 | 1.0 | 1331.33 | 1353.66 | 0.55 | 0.99 | rirv938-rinen-grpo-40k-_88641_v1 | 13B | rirv938/rinen_grpo_40k_cp1184_95ff_run2_merged | rirv938-rinen-grpo-40k-_88641_v1 | 8773 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_40k_c | 2025-04-30 | single | 1.36 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 83.0 | 1.0 | 1331.09 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-4_2521_v1 | 13B | rirv938/anthropic_grpo_40k_cp312_96ff_new_rm_merged | rirv938-anthropic-grpo-4_2521_v1 | 6623 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 84.0 | 1.0 | 1330.98 | 1353.66 | 0.55 | 0.99 | rirv938-94p-6ff-rirv938-_8152_v2 | 24B | rirv938/94p_6ff_rirv938_20k_100p_0ff_ri_19485_v1_cp1500_merged | rirv938-94p-6ff-rirv938-_8152_v2 | 10430 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-22 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 85.0 | 1.0 | 1330.77 | 1353.66 | 0.57 | 0.99 | rirv938-mistral-24b-grp_82678_v2 | 24B | rirv938/mistral_24b_grpo_40k_cp1184_92ff_merged | rirv938-mistral-24b-grp_82678_v2 | 6301 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-04-29 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 86.0 | 1.0 | 1329.98 | 1353.66 | 0.5 | 0.99 | rirv938-98p-2ff-rirv938-_7443_v1 | 24B | rirv938/98p_2ff_rirv938_20k_100p_0ff_ri_19485_v1_cp374_v3 | rirv938-98p-2ff-rirv938-_7443_v1 | 6039 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-02 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 87.0 | 1.0 | 1329.79 | 1353.66 | 0.6 | 0.99 | rirv938-tune-mistral-gr_79261_v1 | 24B | rirv938/tune_mistral_grpo_cp888_92ff_new_merged | rirv938-tune-mistral-gr_79261_v1 | 6134 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-05-01 | single | 1.74 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 88.0 | 1.0 | 1329.65 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp156_2041_v1 | 24B | rirv938/slerp_grpo_cp156_96ff_b4_r2_merged | rirv938-slerp-grpo-cp156_2041_v1 | 6223 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp156 | 2025-05-22 | single | | |
rirv938 | 1 | 89.0 | 1.0 | 1329.53 | 1353.66 | 0.48 | 0.99 | rirv938-98p-2ff-rirv938_80130_v1 | 24B | rirv938/98p_2ff_rirv938_98p_2ff_rirv938_42155_v1_cp312_v3 | rirv938-98p-2ff-rirv938_80130_v1 | 7606 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-03-29 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 90.0 | 1.0 | 1329.49 | 1353.66 | 0.53 | 0.99 | rirv938-grok-payloads-g_30885_v1 | 24B | rirv938/grok_payloads_grpo_cp312_98ff_b35_r1_merged | rirv938-grok-payloads-g_30885_v1 | 7440 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grok_payloads_gr | 2025-07-07 | single | 1.41 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 91.0 | 1.0 | 1329.24 | 1353.66 | 0.53 | 0.99 | rirv938-anthropic-grpo-_73855_v1 | 13B | rirv938/anthropic_grpo_40k_cp1184_99ff_merged | rirv938-anthropic-grpo-_73855_v1 | 5582 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.6 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 92.0 | 1.0 | 1329.19 | 1353.66 | 0.57 | 0.99 | chaiml-rinen-grpo-40k-c_60950_v1 | 13B | ChaiML/rinen_grpo_40k_cp1184_95ff | chaiml-rinen-grpo-40k-c_60950_v1 | 8424 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/rinen_grpo_40k_cp | 2025-05-01 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 93.0 | 1.0 | 1328.98 | 1353.66 | 0.55 | 0.99 | rirv938-exp-grpo-cp312-_49942_v1 | 24B | rirv938/exp_grpo_cp312_96ff_b4_r2_merged | rirv938-exp-grpo-cp312-_49942_v1 | 5702 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-23 | single | | |
rirv938 | 1 | 94.0 | 1.0 | 1328.9 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_38026_v1 | 13B | rirv938/anthropic_grpo_40k_cp156_96ff_new_rm_merged | rirv938-anthropic-grpo-_38026_v1 | 7253 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 95.0 | 1.0 | 1328.76 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_77071_v1 | 13B | rirv938/anthropic_grpo_40k_cp3588_96ff_new_rm_b3_merged | rirv938-anthropic-grpo-_77071_v1 | 8455 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-21 | single | | |
rirv938 | 1 | 96.0 | 1.0 | 1328.44 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp156-_88924_v1 | 24B | rirv938/exp_grpo_cp156_96ff_b4_r2_merged | rirv938-exp-grpo-cp156-_88924_v1 | 5709 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp156_9 | 2025-05-23 | single | | |
rirv938 | 1 | 97.0 | 1.0 | 1328.43 | 1353.66 | 0.59 | 0.99 | chaiml-mistral-24b-grpo_99461_v1 | 24B | ChaiML/mistral_24b_grpo_cp592_92ff | chaiml-mistral-24b-grpo_99461_v1 | 8096 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/mistral_24b_grpo_ | 2025-05-01 | single | 1.72 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 98.0 | 1.0 | 1328.24 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_55424_v1 | 13B | rirv938/anthropic_grpo_40k_cp296_95ff_merged | rirv938-anthropic-grpo-_55424_v1 | 7781 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-28 | single | 1.34 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 99.0 | 1.0 | 1328.16 | 1353.66 | 0.54 | 0.99 | rirv938-94p-6ff-rirv938_39054_v1 | 24B | rirv938/94p_6ff_rirv938_20k_100p_0ff_ri_19485_v1_cp750_merged | rirv938-94p-6ff-rirv938_39054_v1 | 7358 | 61115860 | 0.59 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-03 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 100.0 | 1.0 | 1327.6 | 1353.66 | 0.56 | 0.99 | rirv938-mistral-24b-grp_82678_v1 | 24B | rirv938/mistral_24b_grpo_40k_cp1184_92ff_merged | rirv938-mistral-24b-grp_82678_v1 | 6100 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-04-29 | single | 1.72 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 101.0 | 1.0 | 1327.56 | 1353.66 | 0.56 | 0.99 | chaiml-anthropic-grpo-4_66492_v1 | 13B | ChaiML/anthropic_grpo_40k_cp1184_95ff | chaiml-anthropic-grpo-4_66492_v1 | 7487 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/anthropic_grpo_40 | 2025-05-01 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 102.0 | 1.0 | 1327.45 | 1353.66 | 0.5 | 0.99 | rirv938-original-96p-4f_39870_v1 | 24B | rirv938/original_96p_4ff_rirv938_98p_2ff_rirv938_42155_v1_cp312_v3 | rirv938-original-96p-4f_39870_v1 | 9217 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/original_96p_4ff | 2025-03-31 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 103.0 | 1.0 | 1327.43 | 1353.66 | 0.56 | 0.99 | rirv938-mistral-24b-grp_42042_v1 | 24B | rirv938/mistral_24b_grpo_40k_cp888_95ff_merged | rirv938-mistral-24b-grp_42042_v1 | 6112 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-04-29 | single | 1.75 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 104.0 | 1.0 | 1326.73 | 1353.66 | 0.5 | 0.99 | rirv938-96p-4ff-rirv938_36250_v1 | 24B | rirv938/96p_4ff_rirv938_98p_2ff_rirv938_42155_v1_cp624_v3 | rirv938-96p-4ff-rirv938_36250_v1 | 6235 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-03-31 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 105.0 | 1.0 | 1326.7 | 1353.66 | 0.54 | 0.99 | chaiml-ahab-v1-20250423_v2 | 24B | ChaiML/ahab_v1_20250423 | chaiml-ahab-v1-20250423_v2 | 7319 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/ahab_v1_20250423 | 2025-04-22 | single | 1.75 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 106.0 | 1.0 | 1326.54 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_90777_v3 | 13B | rirv938/anthropic_grpo_40k_cp1184_95ff_merged | rirv938-anthropic-grpo-_90777_v3 | 8302 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.65 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 107.0 | 1.0 | 1326.3 | 1353.66 | 0.5 | 0.99 | rirv938-100p-0ff-rirv93_80560_v1 | 24B | rirv938/100p_0ff_rirv938_20k_100p_0ff_ri_19485_v1_cp187_v3 | rirv938-100p-0ff-rirv93_80560_v1 | 6603 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-02 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 108.0 | 1.0 | 1326.23 | 1353.66 | 0.51 | 0.99 | rirv938-97p-3ff-rirv938_76571_v1 | 24B | rirv938/97p_3ff_rirv938_20k_100p_0ff_ri_19485_v1_cp375_v3 | rirv938-97p-3ff-rirv938_76571_v1 | 8890 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/97p_3ff_rirv938_ | 2025-04-03 | single | 0.81 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 109.0 | 1.0 | 1326.03 | 1353.66 | 0.56 | 0.99 | chaiml-anthropic-grpo-4_66492_v3 | 13B | ChaiML/anthropic_grpo_40k_cp1184_95ff | chaiml-anthropic-grpo-4_66492_v3 | 6925 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/anthropic_grpo_40 | 2025-05-01 | single | 1.6 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 110.0 | 1.0 | 1325.52 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-cp62_98390_v1 | 13B | rirv938/rinen_grpo_cp624_97ff_ava_bo1_b4_round3_merged | rirv938-rinen-grpo-cp62_98390_v1 | 7138 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp624 | 2025-05-22 | single | | |
rirv938 | 1 | 111.0 | 1.0 | 1325.46 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp624-_69622_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b3_r1_merged | rirv938-exp-grpo-cp624-_69622_v1 | 8752 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-25 | single | | |
rirv938 | 1 | 112.0 | 1.0 | 1325.39 | 1353.66 | 0.0 | 0.99 | rirv938-94p-6ff-rirv938_15029_v3 | 24B | rirv938/94p_6ff_rirv938_1000_sim_100p_0_17599_v1_cp1060_merged | rirv938-94p-6ff-rirv938_15029_v3 | 7125 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-21 | single | 1.47 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 113.0 | 1.0 | 1325.24 | 1353.66 | 0.55 | 0.99 | rirv938-exp-grpo-cp312-_36697_v2 | 24B | rirv938/exp_grpo_cp312_96ff_b4_r1_merged | rirv938-exp-grpo-cp312-_36697_v2 | 5870 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-22 | single | | |
rirv938 | 1 | 114.0 | 1.0 | 1325.21 | 1353.66 | 0.5 | 0.99 | rirv938-100p-0ff-rirv93_75853_v1 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp936_v3 | rirv938-100p-0ff-rirv93_75853_v1 | 5913 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-02 | single | 0.76 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 115.0 | 1.0 | 1325.17 | 1353.66 | 0.53 | 0.99 | rirv938-20k-100p-0ff-ri_19485_v1 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp468_v3 | rirv938-20k-100p-0ff-ri_19485_v1 | 5653 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-02 | single | 0.81 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 116.0 | 1.0 | 1324.82 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-4_3132_v1 | 13B | rirv938/anthropic_grpo_40k_cp888_99ff_merged | rirv938-anthropic-grpo-4_3132_v1 | 5672 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.62 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 117.0 | 1.0 | 1324.76 | 1353.66 | 0.55 | 0.99 | chaiml-anthropic-grpo-4_59715_v1 | 13B | ChaiML/anthropic_grpo_40k_cp888_95ff_20ww2_merged | chaiml-anthropic-grpo-4_59715_v1 | 5913 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/anthropic_grpo_40 | 2025-05-15 | single | 1.64 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 118.0 | 1.0 | 1324.74 | 1353.66 | 0.54 | 0.99 | rirv938-grpo-to-compare_71154_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp312_lr9_merged | rirv938-grpo-to-compare_71154_v1 | 10204 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-26 | single | 1.46 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 119.0 | 1.0 | 1324.54 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp31_45240_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b4_r1_lr2_merged | rirv938-slerp-grpo-cp31_45240_v1 | 5411 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-23 | single | | |
rirv938 | 1 | 120.0 | 1.0 | 1324.3 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp312-_28460_v1 | 24B | rirv938/exp_grpo_cp312_96ff_b2_r1_merged | rirv938-exp-grpo-cp312-_28460_v1 | 8683 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-25 | single | | |
rirv938 | 1 | 121.0 | 1.0 | 1324.24 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp62_12095_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b4_r2_merged | rirv938-slerp-grpo-cp62_12095_v1 | 6122 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-22 | single | | |
rirv938 | 1 | 122.0 | 1.0 | 1323.94 | 1353.66 | 0.48 | 0.99 | rirv938-98p-2ff-nischay_33448_v1 | 24B | rirv938/98p_2ff_nischaydnk_exp14_exp9dp_94555_v3_cp312_merged | rirv938-98p-2ff-nischay_33448_v1 | 8982 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_nischayd | 2025-04-10 | single | 0.65 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 123.0 | 1.0 | 1323.75 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp62_73258_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b5_r2_merged | rirv938-slerp-grpo-cp62_73258_v1 | 6112 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-22 | single | | |
rirv938 | 1 | 124.0 | 1.0 | 1323.55 | 1353.66 | 0.54 | 0.99 | function_nubul_2025-04-03 | | | dpo_data_collection | 8661 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-04-03 | single | | |
rirv938 | 1 | 125.5 | 1.0 | 1323.46 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp624-9_7961_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b6_r2_less_ff_merged | rirv938-exp-grpo-cp624-9_7961_v1 | 6887 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-26 | single | | |
rirv938 | 1 | 125.5 | 1.0 | 1323.46 | 1353.66 | 0.53 | 0.99 | rirv938-20k-100p-0ff-ri_19485_v2 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp468_v3 | rirv938-20k-100p-0ff-ri_19485_v2 | 8195 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-03 | single | 0.64 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 127.0 | 1.0 | 1323.37 | 1353.66 | 0.54 | 0.99 | rirv938-94p-6ff-nischay_67907_v1 | 24B | rirv938/94p_6ff_nischaydnk_exp14_exp9dp_94555_v3_cp624_merged | rirv938-94p-6ff-nischay_67907_v1 | 8034 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_nischayd | 2025-04-10 | single | 0.65 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 128.0 | 1.0 | 1323.36 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp156-_47530_v1 | 24B | rirv938/exp_grpo_cp156_96ff_b4_r1_less_ff_merged | rirv938-exp-grpo-cp156-_47530_v1 | 6426 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp156_9 | 2025-05-23 | single | | |
rirv938 | 1 | 129.5 | 1.0 | 1323.26 | 1353.66 | 0.51 | 0.99 | rirv938-98p-2ff-rirv938_62071_v1 | 24B | rirv938/98p_2ff_rirv938_20k_100p_0ff_ri_19485_v1_cp187_v3 | rirv938-98p-2ff-rirv938_62071_v1 | 7176 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-02 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 129.5 | 1.0 | 1323.26 | 1353.66 | 0.51 | 0.99 | rirv938-96p-4ff-rirv938_62112_v1 | 24B | rirv938/96p_4ff_rirv938_20k_100p_0ff_ri_19485_v1_cp375_v3 | rirv938-96p-4ff-rirv938_62112_v1 | 10083 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-04-03 | single | 0.76 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 131.0 | 1.0 | 1323.23 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-4_3092_v3 | 13B | rirv938/anthropic_grpo_40k_cp888_95ff_merged | rirv938-anthropic-grpo-4_3092_v3 | 9621 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.59 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 132.0 | 1.0 | 1323.15 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp624-_21546_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b4_r1_less_ff_merged | rirv938-exp-grpo-cp624-_21546_v1 | 5548 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-23 | single | | |
rirv938 | 1 | 133.0 | 1.0 | 1323.1 | 1353.66 | 0.55 | 0.99 | rirv938-rinen-grpo-40k-_56847_v1 | 13B | rirv938/rinen_grpo_40k_cp296_95ff_run2_merged | rirv938-rinen-grpo-40k-_56847_v1 | 8219 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_40k_c | 2025-04-30 | single | 1.3 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 134.0 | 1.0 | 1323.06 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp624-_85996_v2 | 24B | rirv938/exp_grpo_cp624_96ff_b6_r2_merged | rirv938-exp-grpo-cp624-_85996_v2 | 5888 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-24 | single | | |
rirv938 | 1 | 135.0 | 1.0 | 1323.03 | 1353.66 | 0.53 | 0.99 | chaiml-exp-grpo-cp312-9_39529_v1 | 24B | ChaiML/exp_grpo_cp312_96ff_b4_r1_less_ff_merged | chaiml-exp-grpo-cp312-9_39529_v1 | 5956 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp_grpo_cp312_96 | 2025-05-30 | single | | |
rirv938 | 1 | 136.0 | 1.0 | 1323.01 | 1353.66 | 0.5 | 0.99 | rirv938-96p-4ff-rirv938_99913_v1 | 24B | rirv938/96p_4ff_rirv938_98p_2ff_rirv938_42155_v1_cp312_v3 | rirv938-96p-4ff-rirv938_99913_v1 | 6153 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-03-31 | single | 0.75 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 137.0 | 1.0 | 1322.93 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp624-_85996_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b6_r2_merged | rirv938-exp-grpo-cp624-_85996_v1 | 6000 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-24 | single | | |
rirv938 | 1 | 138.0 | 1.0 | 1322.91 | 1353.66 | 0.55 | 0.99 | rirv938-20k-98p-2ff-rir_53751_v1 | 24B | rirv938/20k_98p_2ff_rirv938_mistral_24b_bon_82623_v1_cp1872_merged | rirv938-20k-98p-2ff-rir_53751_v1 | 9685 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_98p_2ff_rirv | 2025-04-09 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 139.0 | 1.0 | 1322.82 | 1353.66 | 0.52 | 0.99 | rirv938-20k-100p-0ff-ri_28508_v1 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp780_v3 | rirv938-20k-100p-0ff-ri_28508_v1 | 5629 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-02 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 140.0 | 1.0 | 1322.55 | 1353.66 | 0.54 | 0.99 | rirv938-mistral-24b-grp_30204_v1 | 24B | rirv938/mistral_24b_grpo_40k_cp592_95ff_merged | rirv938-mistral-24b-grp_30204_v1 | 6181 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-04-29 | single | 1.69 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 141.0 | 1.0 | 1322.5 | 1353.66 | 0.56 | 0.99 | rirv938-98p-2ff-rirv938_66404_v1 | 24B | rirv938/98p_2ff_rirv938_mistral_24b_bon_31129_v6_cp3125_v4 | rirv938-98p-2ff-rirv938_66404_v1 | 6226 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-01 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 142.0 | 1.0 | 1322.23 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_90777_v2 | 13B | rirv938/anthropic_grpo_40k_cp1184_95ff_merged | rirv938-anthropic-grpo-_90777_v2 | 7496 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.64 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 143.0 | 1.0 | 1322.09 | 1353.66 | 0.55 | 0.99 | blend_tibil_2025-04-03 | n/a | | rob_ab_test | 6219 | 61115860 | 0.52 | 0.65 | blend | | | | | | | 2025-04-03 | blended | | |
rirv938 | 1 | 144.0 | 1.0 | 1322.05 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp624-9_3383_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b6_r1_merged | rirv938-exp-grpo-cp624-9_3383_v1 | 7757 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-24 | single | | |
rirv938 | 1 | 145.0 | 1.0 | 1321.82 | 1353.66 | 0.56 | 0.99 | rirv938-tune-mistral-gr_99159_v1 | 24B | rirv938/tune_mistral_grpo_cp592_92ff_run_merged | rirv938-tune-mistral-gr_99159_v1 | 5294 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-04-29 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 146.0 | 1.0 | 1321.47 | 1353.66 | 0.53 | 0.99 | chaiml-exp14-exp9dpoft-_83899_v1 | 24B | ChaiML/exp14_exp9dpoft_dpo_reward_rl | chaiml-exp14-exp9dpoft-_83899_v1 | 7050 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp14_exp9dpoft_d | 2025-06-11 | single | | |
rirv938 | 1 | 147.0 | 1.0 | 1321.45 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_21289_v1 | 13B | rirv938/anthropic_grpo_40k_cp592_99ff_merged | rirv938-anthropic-grpo-_21289_v1 | 5511 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.57 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 148.5 | 1.0 | 1321.41 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp624-_39726_v2 | 24B | rirv938/exp_grpo_cp624_96ff_b4_r1_merged | rirv938-exp-grpo-cp624-_39726_v2 | 5722 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-22 | single | | |
rirv938 | 1 | 148.5 | 1.0 | 1321.41 | 1353.66 | 0.56 | 0.99 | rirv938-10k-97p-3ff-rir_96415_v1 | 24B | rirv938/10k_97p_3ff_rirv938_mistral_24b_bon_82623_v1_cp1872_merged | rirv938-10k-97p-3ff-rir_96415_v1 | 7096 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/10k_97p_3ff_rirv | 2025-04-08 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 150.0 | 1.0 | 1321.39 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_51376_v3 | 13B | rirv938/anthropic_grpo_40k_cp592_95ff_merged | rirv938-anthropic-grpo-_51376_v3 | 8251 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.61 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 151.0 | 1.0 | 1321.18 | 1353.66 | 0.53 | 0.99 | chaiml-exp-grpo-cp312-9_39529_v2 | 24B | ChaiML/exp_grpo_cp312_96ff_b4_r1_less_ff_merged | chaiml-exp-grpo-cp312-9_39529_v2 | 5354 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp_grpo_cp312_96 | 2025-05-31 | single | | |
rirv938 | 1 | 152.0 | 1.0 | 1321.16 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp312-_84193_v4 | 24B | rirv938/exp_grpo_cp312_96ff_b4_r1_less_ff_merged | rirv938-exp-grpo-cp312-_84193_v4 | 7570 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-26 | single | | |
rirv938 | 1 | 153.0 | 1.0 | 1321.15 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_88981_v4 | 13B | rirv938/anthropic_beta_2_40k_1872_bo8_95w_v2 | rirv938-anthropic-beta-_88981_v4 | 13358 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-31 | single | 1.73 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 154.0 | 1.0 | 1320.92 | 1353.66 | 0.53 | 0.99 | rirv938-20k-100p-0ff-ri_63465_v1 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp624_v3 | rirv938-20k-100p-0ff-ri_63465_v1 | 5616 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-02 | single | 0.74 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 155.0 | 1.0 | 1320.84 | 1353.66 | 0.56 | 0.99 | function_kugob_2025-04-14 | | | dpo_data_collection | 5885 | 61115860 | 0.55 | 0.65 | function | | | | | | | 2025-04-14 | single | | |
rirv938 | 1 | 156.5 | 1.0 | 1320.79 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp15_36513_v1 | 24B | rirv938/slerp_grpo_cp156_96ff_b4_r1_lr2_merged | rirv938-slerp-grpo-cp15_36513_v1 | 5552 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp156 | 2025-05-23 | single | | |
rirv938 | 1 | 156.5 | 1.0 | 1320.79 | 1353.66 | 0.56 | 0.99 | chaiml-anthropic-grpo-4_66492_v2 | 13B | ChaiML/anthropic_grpo_40k_cp1184_95ff | chaiml-anthropic-grpo-4_66492_v2 | 7943 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/anthropic_grpo_40 | 2025-05-01 | single | 1.65 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 158.0 | 1.0 | 1320.75 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp624-_51934_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b5_r1_merged | rirv938-exp-grpo-cp624-_51934_v1 | 5594 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-23 | single | | |
rirv938 | 1 | 159.0 | 1.0 | 1320.74 | 1353.66 | 0.58 | 0.99 | rirv938-anthropic-grpo-_18073_v1 | 13B | rirv938/anthropic_grpo_40k_cp3744_96ff_new_rm_b3_merged | rirv938-anthropic-grpo-_18073_v1 | 8462 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-21 | single | | |
rirv938 | 1 | 160.0 | 1.0 | 1320.68 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp31_64090_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b4_r2_merged | rirv938-slerp-grpo-cp31_64090_v1 | 6129 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-22 | single | | |
rirv938 | 1 | 161.0 | 1.0 | 1320.65 | 1353.66 | 0.55 | 0.99 | function_sorub_2025-04-03 | | | dpo_data_collection | 7378 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-04-03 | single | | |
rirv938 | 1 | 162.0 | 1.0 | 1320.54 | 1353.66 | 0.53 | 0.99 | rirv938-grok-payloads-g_27665_v1 | 24B | rirv938/grok_payloads_grpo_cp624_98ff_b35_r1_merged | rirv938-grok-payloads-g_27665_v1 | 7405 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grok_payloads_gr | 2025-07-07 | single | 1.33 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 163.0 | 1.0 | 1320.53 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp312-_53371_v1 | 24B | rirv938/exp_grpo_cp312_96ff_b3_r1_merged | rirv938-exp-grpo-cp312-_53371_v1 | 9195 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-25 | single | | |
rirv938 | 1 | 164.0 | 1.0 | 1320.3 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_91303_v1 | 13B | rirv938/anthropic_grpo_40k_cp296_99ff_merged | rirv938-anthropic-grpo-_91303_v1 | 5435 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.59 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 165.0 | 1.0 | 1320.19 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_68205_v1 | 13B | rirv938/anthropic_grpo_40k_cp780_96ff_new_rm_b3_merged | rirv938-anthropic-grpo-_68205_v1 | 5945 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 166.0 | 1.0 | 1319.93 | 1353.66 | 0.58 | 0.99 | rirv938-tune-mistral-gr_98214_v1 | 24B | rirv938/tune_mistral_grpo_cp296_92ff_new_merged | rirv938-tune-mistral-gr_98214_v1 | 6158 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-05-01 | single | 1.76 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 167.0 | 1.0 | 1319.71 | 1353.66 | 0.56 | 0.99 | rirv938-10k-97p-3ff-rir_45876_v1 | 24B | rirv938/10k_97p_3ff_rirv938_mistral_24b_bon_82623_v1_cp2808_merged | rirv938-10k-97p-3ff-rir_45876_v1 | 10171 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/10k_97p_3ff_rirv | 2025-04-08 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 168.0 | 1.0 | 1319.38 | 1353.66 | 0.56 | 0.99 | rirv938-94p-6ff-rirv938_15029_v2 | 24B | rirv938/94p_6ff_rirv938_1000_sim_100p_0_17599_v1_cp1060_merged | rirv938-94p-6ff-rirv938_15029_v2 | 7928 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-21 | single | 1.48 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 169.0 | 1.0 | 1319.35 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_55424_v3 | 13B | rirv938/anthropic_grpo_40k_cp296_95ff_merged | rirv938-anthropic-grpo-_55424_v3 | 5548 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.35 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 170.0 | 1.0 | 1319.33 | 1353.66 | 0.53 | 0.99 | rirv938-98p-2ff-chaiml-_73632_v1 | 24B | rirv938/98p_2ff_chaiml_exp14_exp9dpoft_65674_v14_cp968_merged | rirv938-98p-2ff-chaiml-_73632_v1 | 9315 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_chaiml_e | 2025-06-09 | single | | |
rirv938 | 1 | 171.0 | 1.0 | 1319.29 | 1353.66 | 0.5 | 0.99 | rirv938-98p-2ff-rirv938_42155_v1 | 24B | rirv938/98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp936_v3 | rirv938-98p-2ff-rirv938_42155_v1 | 7722 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-03-28 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 172.0 | 1.0 | 1319.18 | 1353.66 | 0.53 | 0.99 | rirv938-grok-payloads-g_30885_v2 | 24B | rirv938/grok_payloads_grpo_cp312_98ff_b35_r1_merged | rirv938-grok-payloads-g_30885_v2 | 6615 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grok_payloads_gr | 2025-07-09 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 173.0 | 1.0 | 1319.08 | 1353.66 | 0.54 | 0.99 | rirv938-20k-98p-2ff-rir_61729_v1 | 24B | rirv938/20k_98p_2ff_rirv938_mistral_24b_bon_82623_v1_cp936_merged | rirv938-20k-98p-2ff-rir_61729_v1 | 9113 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_98p_2ff_rirv | 2025-04-09 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 174.0 | 1.0 | 1318.98 | 1353.66 | 0.51 | 0.99 | chaiml-gy-grpo-cp624-98f_2782_v3 | 24B | ChaiML/gy_grpo_cp624_98ff_b35_r1_merged | chaiml-gy-grpo-cp624-98f_2782_v3 | 7010 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/gy_grpo_cp624_98f | 2025-07-09 | single | 1.33 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 175.0 | 1.0 | 1318.92 | 1353.66 | 0.53 | 0.99 | chaiml-exp-grpo-cp312-9_36146_v3 | 24B | ChaiML/exp_grpo_cp312_96ff_b6_r2_less_ff_merged | chaiml-exp-grpo-cp312-9_36146_v3 | 21460 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp_grpo_cp312_96 | 2025-06-05 | single | | |
rirv938 | 1 | 176.0 | 1.0 | 1318.91 | 1353.66 | 0.54 | 0.99 | function_nofun_2025-04-03 | | | dpo_data_collection | 7389 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-04-03 | single | | |
rirv938 | 1 | 177.0 | 1.0 | 1318.73 | 1353.66 | 0.58 | 0.99 | rirv938-mistral-24b-grp_36770_v2 | 24B | rirv938/mistral_24b_grpo_40k_cp296_92ff_merged | rirv938-mistral-24b-grp_36770_v2 | 6195 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-04-29 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 178.0 | 1.0 | 1318.48 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_82258_v1 | 13B | rirv938/anthropic_grpo_40k_cp2496_96ff_new_rm_b3_merged | rirv938-anthropic-grpo-_82258_v1 | 5616 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 179.5 | 1.0 | 1318.3 | 1353.66 | 0.57 | 0.99 | rirv938-grpo-to-compare-_9822_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp312_with_ff_merged | rirv938-grpo-to-compare-_9822_v1 | 7403 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-28 | single | 1.44 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 179.5 | 1.0 | 1318.3 | 1353.66 | 0.52 | 0.99 | rirv938-20k-100p-0ff-ri_54291_v1 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp1248_v3 | rirv938-20k-100p-0ff-ri_54291_v1 | 5532 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-02 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 181.0 | 1.0 | 1318.26 | 1353.66 | 0.52 | 0.99 | rirv938-94p-6ff-nischay_89530_v1 | 24B | rirv938/94p_6ff_nischaydnk_exp14_exp9dp_94555_v3_cp312_merged | rirv938-94p-6ff-nischay_89530_v1 | 8164 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_nischayd | 2025-04-10 | single | 0.66 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 182.0 | 1.0 | 1318.19 | 1353.66 | 0.55 | 0.99 | rirv938-exp-grpo-cp156-_48954_v2 | 24B | rirv938/exp_grpo_cp156_96ff_b4_r1_merged | rirv938-exp-grpo-cp156-_48954_v2 | 5549 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp156_9 | 2025-05-22 | single | | |
rirv938 | 1 | 183.0 | 1.0 | 1318.16 | 1353.66 | 0.54 | 0.99 | rirv938-llama-8b-512-tok_1159_v2 | 8B | rirv938/llama_8b_512_tokens_context_3m_step_11718 | rirv938-llama-8b-512-tok_1159_v2 | 6387 | 61115860 | 0.56 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/llama_8b_512_tok | 2025-02-27 | single | | |
rirv938 | 1 | 184.0 | 1.0 | 1318.1 | 1353.66 | 0.55 | 0.99 | rirv938-rinen-grpo-cp62_71235_v2 | 13B | rirv938/rinen_grpo_cp624_97ff_ava_bo1_b4_round2_merged | rirv938-rinen-grpo-cp62_71235_v2 | 7952 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp624 | 2025-05-21 | single | | |
rirv938 | 1 | 185.0 | 1.0 | 1318.05 | 1353.66 | 0.52 | 0.99 | rirv938-20k-100p-0ff-ri_79574_v1 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp936_v3 | rirv938-20k-100p-0ff-ri_79574_v1 | 5616 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-02 | single | 0.81 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 186.0 | 1.0 | 1317.95 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp624-_39726_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b4_r1_merged | rirv938-exp-grpo-cp624-_39726_v1 | 5663 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-22 | single | | |
rirv938 | 1 | 187.5 | 1.0 | 1317.72 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp31_44772_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b5_r2_merged | rirv938-slerp-grpo-cp31_44772_v1 | 6060 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-22 | single | | |
rirv938 | 1 | 187.5 | 1.0 | 1317.72 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp15_69038_v1 | 24B | rirv938/slerp_grpo_cp156_96ff_b5_r2_merged | rirv938-slerp-grpo-cp15_69038_v1 | 6340 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp156 | 2025-05-22 | single | | |
rirv938 | 1 | 189.0 | 1.0 | 1317.65 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-40k-cp_892_v1 | 13B | rirv938/rinen_grpo_40k_cp296_95ff_merged | rirv938-rinen-grpo-40k-cp_892_v1 | 9313 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_40k_c | 2025-04-29 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 190.0 | 1.0 | 1317.55 | 1353.66 | 0.53 | 0.99 | rirv938-20k-100p-0ff-ri_70659_v5 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp468_merged | rirv938-20k-100p-0ff-ri_70659_v5 | 6003 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-16 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 191.0 | 1.0 | 1317.4 | 1353.66 | 0.53 | 0.99 | chaiml-exp-grpo-cp312-9_36146_v1 | 24B | ChaiML/exp_grpo_cp312_96ff_b6_r2_less_ff_merged | chaiml-exp-grpo-cp312-9_36146_v1 | 5132 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp_grpo_cp312_96 | 2025-05-30 | single | | |
rirv938 | 1 | 192.0 | 1.0 | 1317.37 | 1353.66 | 0.54 | 0.99 | blend_lebin_2025-04-03 | n/a | | rob_ab_test | 8433 | 61115860 | 0.52 | 0.65 | blend | | | | | | | 2025-04-03 | blended | | |
rirv938 | 1 | 193.0 | 1.0 | 1317.3 | 1353.66 | 0.55 | 0.99 | rirv938-96p-4ff-rirv938_92749_v3 | 24B | rirv938/96p_4ff_rirv938_1000_sim_100p_0_17599_v1_cp1060_merged | rirv938-96p-4ff-rirv938_92749_v3 | 7110 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-04-21 | single | 1.49 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 194.0 | 1.0 | 1317.09 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp312-9_2759_v1 | 24B | rirv938/exp_grpo_cp312_96ff_b6_r2_less_ff_merged | rirv938-exp-grpo-cp312-9_2759_v1 | 7188 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-26 | single | | |
rirv938 | 1 | 195.0 | 1.0 | 1317.06 | 1353.66 | 0.52 | 0.99 | chaiml-94p-6ff-nischayd_52369_v1 | 24B | ChaiML/94p_6ff_nischaydnk_exp14_exp9dp_94555_v3_cp624_merged | chaiml-94p-6ff-nischayd_52369_v1 | 7059 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/94p_6ff_nischaydn | 2025-05-15 | single | 1.42 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 196.0 | 1.0 | 1316.91 | 1353.66 | 0.58 | 0.99 | rirv938-anthropic-beta-_88981_v3 | 13B | rirv938/anthropic_beta_2_40k_1872_bo8_95w_v2 | rirv938-anthropic-beta-_88981_v3 | 17327 | 61115860 | 0.57 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 1.8 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 197.0 | 1.0 | 1316.86 | 1353.66 | 0.56 | 0.99 | rirv938-20250411-reward_99450_v2 | 8B | rirv938/20250411_reward_safety_1_5_removed | rirv938-20250411-reward_99450_v2 | 9432 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250411_reward_ | 2025-04-12 | single | | |
rirv938 | 1 | 198.0 | 1.0 | 1316.83 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp312-_52783_v1 | 24B | rirv938/exp_grpo_cp312_96ff_b6_r1_merged | rirv938-exp-grpo-cp312-_52783_v1 | 7346 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-24 | single | | |
rirv938 | 1 | 199.0 | 1.0 | 1316.79 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp156-_47530_v3 | 24B | rirv938/exp_grpo_cp156_96ff_b4_r1_less_ff_merged | rirv938-exp-grpo-cp156-_47530_v3 | 5490 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp156_9 | 2025-05-23 | single | | |
rirv938 | 1 | 200.0 | 1.0 | 1316.78 | 1353.66 | 0.54 | 0.99 | rirv938-40k-98p-2ff-rirv_1029_v1 | 24B | rirv938/40k_98p_2ff_rirv938_mistral_24b_bon_82623_v1_cp1872_merged | rirv938-40k-98p-2ff-rirv_1029_v1 | 7840 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/40k_98p_2ff_rirv | 2025-04-09 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 201.0 | 1.0 | 1316.77 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-4_6340_v1 | 13B | rirv938/anthropic_grpo_40k_cp468_96ff_new_rm_b3_merged | rirv938-anthropic-grpo-4_6340_v1 | 9362 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 202.0 | 1.0 | 1316.76 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp62_52900_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b4_r1_lr2_merged | rirv938-slerp-grpo-cp62_52900_v1 | 5524 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-23 | single | | |
rirv938 | 1 | 203.0 | 1.0 | 1316.65 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-cp31_26298_v2 | 13B | rirv938/rinen_grpo_cp312_97ff_ava_bo1_b4_round2_merged | rirv938-rinen-grpo-cp31_26298_v2 | 6511 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp312 | 2025-05-21 | single | | |
rirv938 | 1 | 204.0 | 1.0 | 1316.64 | 1353.66 | 0.57 | 0.99 | rirv938-mistral-12b-dpo_47715_v1 | 13B | rirv938/mistral_12b_dpo_40k_2374_96_output_tokens_more_ff_v2 | rirv938-mistral-12b-dpo_47715_v1 | 5771 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 96.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.01 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 205.0 | 1.0 | 1316.6 | 1353.66 | 0.65 | 0.99 | function_pafok_2025-04-11 | | | dpo_data_collection | 8891 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-04-11 | single | | |
rirv938 | 1 | 206.0 | 1.0 | 1316.56 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp31_74623_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b4_r1_lr3_merged | rirv938-slerp-grpo-cp31_74623_v1 | 5538 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-23 | single | | |
rirv938 | 1 | 207.0 | 1.0 | 1316.5 | 1353.66 | 0.57 | 0.99 | rirv938-5k-98p-2ff-rirv_58310_v1 | 24B | rirv938/5k_98p_2ff_rirv938_mistral_24b_bon_31129_v6_cp624_v4 | rirv938-5k-98p-2ff-rirv_58310_v1 | 7268 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/5k_98p_2ff_rirv9 | 2025-04-01 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 208.0 | 1.0 | 1316.46 | 1353.66 | 0.53 | 0.99 | rirv938-devstral-cp624-_46237_v1 | 24B | rirv938/devstral_cp624_98ff_b35_r1_high_quality_merged | rirv938-devstral-cp624-_46237_v1 | 10841 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/devstral_cp624_9 | 2025-07-08 | single | 1.29 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 209.5 | 1.0 | 1316.41 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_44019_v3 | 13B | rirv938/anthropic_grpo_40k_cp148_95ff_merged | rirv938-anthropic-grpo-_44019_v3 | 9248 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.61 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 209.5 | 1.0 | 1316.41 | 1353.66 | 0.0 | 0.99 | chaiml-gy-exp96-dpo-exp8_1696_v2 | 24B | ChaiML/gy-exp96-dpo-exp86ep8s2-grok-payloads-0705-dpo-diff-gt0.05-ep1 | chaiml-gy-exp96-dpo-exp8_1696_v2 | 8356 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/gy-exp96-dpo-exp8 | 2025-07-07 | single | 1.32 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 211.0 | 1.0 | 1316.39 | 1353.66 | 0.55 | 0.99 | chaiml-slerpv5-reward-dpo-rl_v1 | 24B | ChaiML/slerpv5_reward_dpo_rl | chaiml-slerpv5-reward-dpo-rl_v1 | 10765 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerpv5_reward_dp | 2025-06-11 | single | | |
rirv938 | 1 | 212.0 | 1.0 | 1316.25 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_75151_v3 | 13B | rirv938/anthropic_beta_2_40k_2496_bo8_95w_v2 | rirv938-anthropic-beta-_75151_v3 | 13570 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-31 | single | 1.68 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 213.0 | 1.0 | 1316.01 | 1353.66 | 0.56 | 0.99 | chaiml-panflute-v1-rirv_23337_v2 | 24B | ChaiML/panflute_v1_rirv938_20250423 | chaiml-panflute-v1-rirv_23337_v2 | 8246 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/panflute_v1_rirv9 | 2025-04-22 | single | 1.45 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 214.0 | 1.0 | 1315.99 | 1353.66 | 0.53 | 0.99 | rirv938-20k-100p-0ff-ri_70659_v1 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp468_merged | rirv938-20k-100p-0ff-ri_70659_v1 | 5405 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-16 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 215.0 | 1.0 | 1315.95 | 1353.66 | 0.53 | 0.99 | chaiml-grok-payloads-gr_12038_v3 | 24B | ChaiML/grok_payloads_grpo_cp312_98ff_b35_r1_merged | chaiml-grok-payloads-gr_12038_v3 | 7356 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/grok_payloads_grp | 2025-07-09 | single | 1.32 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 216.0 | 1.0 | 1315.72 | 1353.66 | 0.5 | 0.99 | rirv938-gy-grpo-r2-cp62_33770_v1 | 24B | rirv938/gy_grpo_r2_cp624_98ff_b5_merged | rirv938-gy-grpo-r2-cp62_33770_v1 | 6434 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/gy_grpo_r2_cp624 | 2025-07-08 | single | 1.35 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 217.0 | 1.0 | 1315.7 | 1353.66 | 0.55 | 0.99 | rirv938-20250411-reward_76110_v1 | 8B | rirv938/20250411_reward_safety_1_removed | rirv938-20250411-reward_76110_v1 | 7294 | 61115860 | 0.55 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250411_reward_ | 2025-04-11 | single | | |
rirv938 | 1 | 218.0 | 1.0 | 1315.68 | 1353.66 | 0.58 | 0.99 | rirv938-anthropic-grpo-_55424_v4 | 13B | rirv938/anthropic_grpo_40k_cp296_95ff_merged | rirv938-anthropic-grpo-_55424_v4 | 5440 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.58 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 219.0 | 1.0 | 1315.55 | 1353.66 | 0.52 | 0.99 | function_kasil_2025-03-06 | | | retune_with_base | 11265 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-03-06 | single | | |
rirv938 | 1 | 220.0 | 1.0 | 1315.5 | 1353.66 | 0.53 | 0.99 | chaiml-grok-payloads-gr_12038_v2 | 24B | ChaiML/grok_payloads_grpo_cp312_98ff_b35_r1_merged | chaiml-grok-payloads-gr_12038_v2 | 6311 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/grok_payloads_grp | 2025-07-09 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 221.0 | 1.0 | 1315.43 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-40k-_59006_v1 | 13B | rirv938/rinen_grpo_40k_cp592_95ff_merged | rirv938-rinen-grpo-40k-_59006_v1 | 5942 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_40k_c | 2025-04-29 | single | 1.35 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 222.0 | 1.0 | 1315.4 | 1353.66 | 0.53 | 0.99 | rirv938-20k-100p-0ff-ri_72360_v1 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp1092_v3 | rirv938-20k-100p-0ff-ri_72360_v1 | 5715 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-02 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 223.0 | 1.0 | 1315.25 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp156-_48954_v1 | 24B | rirv938/exp_grpo_cp156_96ff_b4_r1_merged | rirv938-exp-grpo-cp156-_48954_v1 | 5606 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp156_9 | 2025-05-22 | single | | |
rirv938 | 1 | 224.0 | 1.0 | 1315.24 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp62_75772_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b4_r1_lr_merged | rirv938-slerp-grpo-cp62_75772_v1 | 6977 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-23 | single | | |
rirv938 | 1 | 225.0 | 1.0 | 1315.23 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_55424_v5 | 13B | rirv938/anthropic_grpo_40k_cp296_95ff_merged | rirv938-anthropic-grpo-_55424_v5 | 8261 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.61 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 226.5 | 1.0 | 1315.22 | 1353.66 | 0.54 | 0.99 | rirv938-reward-model-ret_4859_v1 | 8B | rirv938/reward_model_retuned_2_old_multihead | rirv938-reward-model-ret_4859_v1 | 8783 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/reward_model_ret | 2025-03-29 | single | | |
rirv938 | 1 | 226.5 | 1.0 | 1315.22 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp312-9_2759_v3 | 24B | rirv938/exp_grpo_cp312_96ff_b6_r2_less_ff_merged | rirv938-exp-grpo-cp312-9_2759_v3 | 5468 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-30 | single | | |
rirv938 | 1 | 228.0 | 1.0 | 1315.06 | 1353.66 | 0.54 | 0.99 | rirv938-98p-2ff-chaiml-_25299_v1 | 24B | rirv938/98p_2ff_chaiml_slerpv5_mistral_24540_v17_cp1000_merged | rirv938-98p-2ff-chaiml-_25299_v1 | 11565 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_chaiml_s | 2025-06-10 | single | | |
rirv938 | 1 | 229.0 | 1.0 | 1314.98 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp62_20925_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b6_r2_merged | rirv938-slerp-grpo-cp62_20925_v1 | 7590 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-24 | single | | |
rirv938 | 1 | 230.0 | 1.0 | 1314.92 | 1353.66 | 0.53 | 0.99 | rirv938-llama-8b-256-to_50255_v3 | 8B | rirv938/llama_8b_256_tokens_context_3m_step_11718 | rirv938-llama-8b-256-to_50255_v3 | 6902 | 61115860 | 0.55 | 0.65 | basic | | 1.0 | 1024.0 | 1.0 | LlamaForSequenceClassification | rirv938/llama_8b_256_tok | 2025-02-27 | single | | |
rirv938 | 1 | 231.0 | 1.0 | 1314.91 | 1353.66 | 0.49 | 0.99 | rirv938-100p-0ff-rirv93_43678_v2 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_oai_77698_v2_cp748_merged | rirv938-100p-0ff-rirv93_43678_v2 | 6438 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-18 | single | 0.64 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 232.0 | 1.0 | 1314.9 | 1353.66 | 0.54 | 0.99 | rirv938-reward-model-re_76185_v6 | 8B | rirv938/reward_model_retuned_1_old_multihead | rirv938-reward-model-re_76185_v6 | 12719 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/reward_model_ret | 2025-04-23 | single | | |
rirv938 | 1 | 233.0 | 1.0 | 1314.89 | 1353.66 | 0.53 | 0.99 | chaiml-exp-grpo-cp312-9_36146_v2 | 24B | ChaiML/exp_grpo_cp312_96ff_b6_r2_less_ff_merged | chaiml-exp-grpo-cp312-9_36146_v2 | 5351 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp_grpo_cp312_96 | 2025-05-31 | single | | |
rirv938 | 1 | 234.0 | 1.0 | 1314.85 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-4_3092_v2 | 13B | rirv938/anthropic_grpo_40k_cp888_95ff_merged | rirv938-anthropic-grpo-4_3092_v2 | 6230 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 235.0 | 1.0 | 1314.75 | 1353.66 | 0.52 | 0.99 | rirv938-grok-payloads-g_30885_v3 | 24B | rirv938/grok_payloads_grpo_cp312_98ff_b35_r1_merged | rirv938-grok-payloads-g_30885_v3 | 6354 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grok_payloads_gr | 2025-07-09 | single | 1.36 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 236.0 | 1.0 | 1314.69 | 1353.66 | 0.55 | 0.99 | rirv938-reward-model-re_76185_v2 | 8B | rirv938/reward_model_retuned_1_old_multihead | rirv938-reward-model-re_76185_v2 | 10504 | 61115860 | 0.55 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/reward_model_ret | 2025-03-28 | single | | |
rirv938 | 1 | 237.0 | 1.0 | 1314.66 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp624-9_3383_v2 | 24B | rirv938/exp_grpo_cp624_96ff_b6_r1_merged | rirv938-exp-grpo-cp624-9_3383_v2 | 5497 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-30 | single | | |
rirv938 | 1 | 238.0 | 1.0 | 1314.65 | 1353.66 | 0.54 | 0.99 | rirv938-80k-98p-2ff-rir_93843_v2 | 24B | rirv938/80k_98p_2ff_rirv938_mistral_24b_bon_82623_v1_cp1872_merged | rirv938-80k-98p-2ff-rir_93843_v2 | 6177 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/80k_98p_2ff_rirv | 2025-04-08 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 239.0 | 1.0 | 1314.62 | 1353.66 | 0.55 | 0.99 | rirv938-reward-model-re_76185_v4 | 8B | rirv938/reward_model_retuned_1_old_multihead | rirv938-reward-model-re_76185_v4 | 9211 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/reward_model_ret | 2025-04-02 | single | | |
rirv938 | 1 | 240.0 | 1.0 | 1314.58 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp624-_21546_v2 | 24B | rirv938/exp_grpo_cp624_96ff_b4_r1_less_ff_merged | rirv938-exp-grpo-cp624-_21546_v2 | 7113 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-26 | single | | |
rirv938 | 1 | 241.0 | 1.0 | 1314.53 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_36670_v1 | 13B | rirv938/anthropic_beta_2_40k_2496_bo8_100w_v2 | rirv938-anthropic-beta-_36670_v1 | 12378 | 61115860 | 0.56 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 1.77 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 242.5 | 1.0 | 1314.52 | 1353.66 | 0.49 | 0.99 | rirv938-gy-grpo-r2-cp31_81326_v1 | 24B | rirv938/gy_grpo_r2_cp312_98ff_b5_merged | rirv938-gy-grpo-r2-cp31_81326_v1 | 6392 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/gy_grpo_r2_cp312 | 2025-07-08 | single | 1.3 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 242.5 | 1.0 | 1314.52 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp156-_47530_v2 | 24B | rirv938/exp_grpo_cp156_96ff_b4_r1_less_ff_merged | rirv938-exp-grpo-cp156-_47530_v2 | 6317 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp156_9 | 2025-05-23 | single | | |
rirv938 | 1 | 244.0 | 1.0 | 1314.47 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_44019_v1 | 13B | rirv938/anthropic_grpo_40k_cp148_95ff_merged | rirv938-anthropic-grpo-_44019_v1 | 5834 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 245.0 | 1.0 | 1314.24 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_77402_v1 | 13B | rirv938/anthropic_grpo_40k_cp546_95ff_baseline_merged | rirv938-anthropic-grpo-_77402_v1 | 5919 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.57 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 246.0 | 1.0 | 1314.22 | 1353.66 | 0.52 | 0.99 | function_boren_2025-06-08 | | | dpo_data_collection | 12020 | 61115860 | 0.56 | 0.65 | function | | | | | | | 2025-06-08 | single | | |
rirv938 | 1 | 247.0 | 1.0 | 1314.15 | 1353.66 | 0.58 | 0.99 | rirv938-anthropic-grpo-4_1864_v1 | 13B | rirv938/anthropic_grpo_40k_cp3744_96ff_new_rm_b5_merged | rirv938-anthropic-grpo-4_1864_v1 | 8066 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-21 | single | | |
rirv938 | 1 | 248.5 | 1.0 | 1314.09 | 1353.66 | 0.55 | 0.99 | rirv938-rinen-grpo-cp15_10147_v2 | 13B | rirv938/rinen_grpo_cp156_97ff_ava_bo1_b4_round2_merged | rirv938-rinen-grpo-cp15_10147_v2 | 6378 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp156 | 2025-05-21 | single | | |
rirv938 | 1 | 248.5 | 1.0 | 1314.09 | 1353.66 | 0.58 | 0.99 | rirv938-mistral-12b-dpo_17812_v1 | 13B | rirv938/mistral_12b_dpo_40k_1187_96_output_tokens_more_ff_v2 | rirv938-mistral-12b-dpo_17812_v1 | 5545 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 96.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.02 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 250.0 | 1.0 | 1314.02 | 1353.66 | 0.58 | 0.99 | rirv938-98p-2ff-rirv938_77810_v1 | 24B | rirv938/98p_2ff_rirv938_mistral_24b_bon_31129_v6_cp2500_v4 | rirv938-98p-2ff-rirv938_77810_v1 | 8269 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-01 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 251.0 | 1.0 | 1314.01 | 1353.66 | 0.61 | 0.99 | rirv938-mistral-12b-dpo_76739_v1 | 13B | rirv938/mistral_12b_dpo_40k_2374_96_output_tokens_much_ff_v2 | rirv938-mistral-12b-dpo_76739_v1 | 5698 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 96.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.05 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 252.0 | 1.0 | 1313.91 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp312-_70375_v1 | 24B | rirv938/exp_grpo_cp312_96ff_b5_r1_merged | rirv938-exp-grpo-cp312-_70375_v1 | 7438 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-23 | single | | |
rirv938 | 1 | 253.0 | 1.0 | 1313.86 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp624-_29644_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b7_r1_merged | rirv938-exp-grpo-cp624-_29644_v1 | 7212 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-24 | single | | |
rirv938 | 1 | 254.0 | 1.0 | 1313.81 | 1353.66 | 0.54 | 0.99 | rirv938-20250331-reward_66174_v1 | 8B | rirv938/20250331_reward_ablation_bo1_bon_mixed | rirv938-20250331-reward_66174_v1 | 10763 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250331_reward_ | 2025-03-31 | single | | |
rirv938 | 1 | 255.0 | 1.0 | 1313.6 | 1353.66 | 0.54 | 0.99 | rirv938-20250331-reward_96848_v2 | 8B | rirv938/20250331_reward_ablation_bon | rirv938-20250331-reward_96848_v2 | 11691 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250331_reward_ | 2025-03-31 | single | | |
rirv938 | 1 | 256.0 | 1.0 | 1313.54 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp15_79826_v1 | 24B | rirv938/slerp_grpo_cp156_96ff_b4_r1_lr3_merged | rirv938-slerp-grpo-cp15_79826_v1 | 7143 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp156 | 2025-05-23 | single | | |
rirv938 | 1 | 257.0 | 1.0 | 1313.26 | 1353.66 | 0.55 | 0.99 | rirv938-10k-97p-3ff-rir_82190_v1 | 24B | rirv938/10k_97p_3ff_rirv938_mistral_24b_bon_82623_v1_cp468_merged | rirv938-10k-97p-3ff-rir_82190_v1 | 7037 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/10k_97p_3ff_rirv | 2025-04-08 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 258.0 | 1.0 | 1313.21 | 1353.66 | 0.5 | 0.99 | rirv938-gy-grpo-cp624-9_14536_v1 | 24B | rirv938/gy_grpo_cp624_98ff_b35_r1_merged | rirv938-gy-grpo-cp624-9_14536_v1 | 6912 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/gy_grpo_cp624_98 | 2025-07-02 | single | 1.63 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 259.0 | 1.0 | 1313.2 | 1353.66 | 0.56 | 0.99 | rirv938-10k-97p-3ff-rir_62566_v1 | 24B | rirv938/10k_97p_3ff_rirv938_mistral_24b_bon_82623_v1_cp936_merged | rirv938-10k-97p-3ff-rir_62566_v1 | 9577 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/10k_97p_3ff_rirv | 2025-04-08 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 260.0 | 1.0 | 1313.15 | 1353.66 | 0.56 | 0.99 | rirv938-mistral-12b-dpo_40235_v1 | 13B | rirv938/mistral_12b_dpo_40k_1187_96_output_tokens_v2 | rirv938-mistral-12b-dpo_40235_v1 | 5489 | 61115860 | 0.58 | 0.65 | basic | | 8.0 | 768.0 | 96.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.03 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 261.0 | 1.0 | 1313.14 | 1353.66 | 0.55 | 0.99 | rirv938-96p-4ff-rirv938_92749_v2 | 24B | rirv938/96p_4ff_rirv938_1000_sim_100p_0_17599_v1_cp1060_merged | rirv938-96p-4ff-rirv938_92749_v2 | 7280 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-04-21 | single | 1.46 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 262.0 | 1.0 | 1313.12 | 1353.66 | 0.55 | 0.99 | rirv938-mistral-12b-dpo-_9564_v3 | 13B | rirv938/mistral_12b_dpo_40k_2374_64_output_tokens_v2 | rirv938-mistral-12b-dpo-_9564_v3 | 6198 | 61115860 | 0.62 | 0.65 | basic | | 8.0 | 768.0 | 96.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.06 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 263.0 | 1.0 | 1312.95 | 1353.66 | 0.54 | 0.99 | rirv938-devstral-cp312-_74673_v1 | 24B | rirv938/devstral_cp312_98ff_b35_r1_high_quality_merged | rirv938-devstral-cp312-_74673_v1 | 10926 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/devstral_cp312_9 | 2025-07-08 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 264.0 | 1.0 | 1312.89 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp312-_84193_v2 | 24B | rirv938/exp_grpo_cp312_96ff_b4_r1_less_ff_merged | rirv938-exp-grpo-cp312-_84193_v2 | 8940 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-26 | single | | |
rirv938 | 1 | 265.0 | 1.0 | 1312.88 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp624_1506_v2 | 24B | rirv938/slerp_grpo_cp624_96ff_b4_r1_merged | rirv938-slerp-grpo-cp624_1506_v2 | 5827 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-22 | single | | |
rirv938 | 1 | 266.0 | 1.0 | 1312.87 | 1353.66 | 0.55 | 0.99 | rirv938-20250402-reward_22740_v2 | 8B | rirv938/20250402_reward_ava_cosine_2 | rirv938-20250402-reward_22740_v2 | 12330 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250402_reward_ | 2025-04-02 | single | | |
rirv938 | 1 | 267.0 | 1.0 | 1312.72 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp156-_47530_v4 | 24B | rirv938/exp_grpo_cp156_96ff_b4_r1_less_ff_merged | rirv938-exp-grpo-cp156-_47530_v4 | 7420 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp156_9 | 2025-05-26 | single | | |
rirv938 | 1 | 268.0 | 1.0 | 1312.63 | 1353.66 | 0.52 | 0.99 | rirv938-100p-0ff-rirv93_11122_v1 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp468_v3 | rirv938-100p-0ff-rirv93_11122_v1 | 6067 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-02 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 269.0 | 1.0 | 1312.5 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_88981_v2 | 13B | rirv938/anthropic_beta_2_40k_1872_bo8_95w_v2 | rirv938-anthropic-beta-_88981_v2 | 13568 | 61115860 | 0.55 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 2.95 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 270.0 | 1.0 | 1312.46 | 1353.66 | 0.53 | 0.99 | rirv938-20250402-reward-a_184_v1 | 8B | rirv938/20250402_reward_ava_basic | rirv938-20250402-reward-a_184_v1 | 9428 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250402_reward_ | 2025-04-02 | single | | |
rirv938 | 1 | 271.0 | 1.0 | 1312.36 | 1353.66 | 0.53 | 0.99 | function_gonom_2025-06-08 | | | dpo_data_collection | 7231 | 61115860 | 0.55 | 0.65 | function | | | | | | | 2025-06-08 | single | | |
rirv938 | 1 | 272.0 | 1.0 | 1312.24 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp312-_84193_v3 | 24B | rirv938/exp_grpo_cp312_96ff_b4_r1_less_ff_merged | rirv938-exp-grpo-cp312-_84193_v3 | 8966 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-26 | single | | |
rirv938 | 1 | 273.0 | 1.0 | 1312.17 | 1353.66 | 0.55 | 0.99 | rirv938-reward-model-re_76185_v3 | 8B | rirv938/reward_model_retuned_1_old_multihead | rirv938-reward-model-re_76185_v3 | 10855 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/reward_model_ret | 2025-03-31 | single | | |
rirv938 | 1 | 274.0 | 1.0 | 1312.14 | 1353.66 | 0.55 | 0.99 | chaiml-0sw-95p-5ff-rine_63828_v4 | 13B | ChaiML/0sw_95p_5ff_rinen0721_dpo_0130_cp3000_v8_merged | chaiml-0sw-95p-5ff-rine_63828_v4 | 8158 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/0sw_95p_5ff_rinen | 2025-05-15 | single | 1.35 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 275.0 | 1.0 | 1312.13 | 1353.66 | 0.51 | 0.99 | rirv938-98p-2ff-rirv938_42155_v2 | 24B | rirv938/98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp936_v3 | rirv938-98p-2ff-rirv938_42155_v2 | 8972 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-03-28 | single | 0.81 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 276.0 | 1.0 | 1312.02 | 1353.66 | 0.53 | 0.99 | rirv938-llama-8b-1024-t_67568_v1 | 8B | rirv938/llama_8b_1024_tokens_context_3m_step_11718 | rirv938-llama-8b-1024-t_67568_v1 | 6612 | 61115860 | 0.55 | 0.65 | basic | | 1.0 | 1024.0 | 1.0 | LlamaForSequenceClassification | rirv938/llama_8b_1024_to | 2025-02-27 | single | | |
rirv938 | 1 | 277.0 | 1.0 | 1312.0 | 1353.66 | 0.58 | 0.99 | rirv938-anthropic-grpo-_51376_v2 | 13B | rirv938/anthropic_grpo_40k_cp592_95ff_merged | rirv938-anthropic-grpo-_51376_v2 | 5649 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.59 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 278.0 | 1.0 | 1311.97 | 1353.66 | 0.57 | 0.99 | rirv938-tune-mistral-gr_30207_v1 | 24B | rirv938/tune_mistral_grpo_cp592_92ff_v3_run_merged | rirv938-tune-mistral-gr_30207_v1 | 8607 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-04-30 | single | 1.72 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 279.0 | 1.0 | 1311.58 | 1353.66 | 0.52 | 0.99 | rirv938-100p-0ff-rirv93_53941_v1 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp624_v3 | rirv938-100p-0ff-rirv93_53941_v1 | 5795 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-02 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 280.0 | 1.0 | 1311.53 | 1353.66 | 0.57 | 0.99 | rirv938-98p-2ff-rirv938-_3333_v1 | 24B | rirv938/98p_2ff_rirv938_mistral_24b_bon_31129_v6_cp1875_v4 | rirv938-98p-2ff-rirv938-_3333_v1 | 6211 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-01 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 281.0 | 1.0 | 1311.52 | 1353.66 | 0.54 | 0.99 | rirv938-20250331-reward-_2681_v1 | 8B | rirv938/20250331_reward_ablation_bo1 | rirv938-20250331-reward-_2681_v1 | 10906 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250331_reward_ | 2025-03-31 | single | | |
rirv938 | 1 | 282.0 | 1.0 | 1311.49 | 1353.66 | 0.55 | 0.99 | rirv938-rinen-grpo-cp62_71235_v1 | 13B | rirv938/rinen_grpo_cp624_97ff_ava_bo1_b4_round2_merged | rirv938-rinen-grpo-cp62_71235_v1 | 8713 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp624 | 2025-05-21 | single | | |
rirv938 | 1 | 283.0 | 1.0 | 1311.38 | 1353.66 | 0.54 | 0.99 | chaiml-devstral-cp624-9_95911_v1 | 24B | ChaiML/devstral_cp624_98ff_b35_r1_high_quality_merged | chaiml-devstral-cp624-9_95911_v1 | 7902 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/devstral_cp624_98 | 2025-07-09 | single | 1.36 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 284.0 | 1.0 | 1311.37 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp62_11749_v3 | 24B | rirv938/slerp_grpo_cp624_96ff_b5_r1_merged | rirv938-slerp-grpo-cp62_11749_v3 | 7272 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-23 | single | | |
rirv938 | 1 | 285.0 | 1.0 | 1311.33 | 1353.66 | 0.5 | 0.99 | rirv938-98p-2ff-rirv938_32328_v1 | 24B | rirv938/98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp312_v3 | rirv938-98p-2ff-rirv938_32328_v1 | 7731 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-03-28 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 286.0 | 1.0 | 1311.23 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_44019_v2 | 13B | rirv938/anthropic_grpo_40k_cp148_95ff_merged | rirv938-anthropic-grpo-_44019_v2 | 8598 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-29 | single | 1.61 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 287.0 | 1.0 | 1311.13 | 1353.66 | 0.57 | 0.99 | rirv938-98p-2ff-rirv938_23194_v1 | 24B | rirv938/98p_2ff_rirv938_mistral_24b_bon_31129_v6_cp1250_v4 | rirv938-98p-2ff-rirv938_23194_v1 | 8152 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-01 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 288.0 | 1.0 | 1311.1 | 1353.66 | 0.56 | 0.99 | rirv938-20250411-reward_33516_v1 | 8B | rirv938/20250411_reward_safety_1_2_removed | rirv938-20250411-reward_33516_v1 | 14202 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250411_reward_ | 2025-04-12 | single | | |
rirv938 | 1 | 289.0 | 1.0 | 1311.06 | 1353.66 | 0.58 | 0.99 | rirv938-96p-4ff-chaiml-_36445_v1 | 24B | rirv938/96p_4ff_chaiml_slerpv5_mistral_24540_v17_cp1000_merged | rirv938-96p-4ff-chaiml-_36445_v1 | 10289 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_chaiml_s | 2025-06-10 | single | | |
rirv938 | 1 | 290.0 | 1.0 | 1311.05 | 1353.66 | 0.56 | 0.99 | function_kehol_2025-04-14 | | | dpo_data_collection | 1501619 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-04-14 | single | | |
rirv938 | 1 | 291.0 | 1.0 | 1311.01 | 1353.66 | 0.5 | 0.99 | rirv938-98p-2ff-rirv938_58882_v1 | 24B | rirv938/98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp624_v3 | rirv938-98p-2ff-rirv938_58882_v1 | 7691 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-03-28 | single | 0.82 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 292.0 | 1.0 | 1310.99 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_20077_v1 | 13B | rirv938/anthropic_grpo_40k_cp468_96ff_new_rm_b5_merged | rirv938-anthropic-grpo-_20077_v1 | 9439 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 293.0 | 1.0 | 1310.98 | 1353.66 | 0.58 | 0.99 | rirv938-slerp-grpo-cp15_53863_v1 | 24B | rirv938/slerp_grpo_cp156_96ff_b5_r1_merged | rirv938-slerp-grpo-cp15_53863_v1 | 6402 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp156 | 2025-05-22 | single | | |
rirv938 | 1 | 294.0 | 1.0 | 1310.97 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-cp31_26362_v1 | 13B | rirv938/rinen_grpo_cp312_97ff_old_prompts_merged | rirv938-rinen-grpo-cp31_26362_v1 | 5783 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp312 | 2025-05-21 | single | | |
rirv938 | 1 | 295.0 | 1.0 | 1310.81 | 1353.66 | 0.0 | 0.99 | rirv938-llama-8b-1024-t_67568_v3 | 8B | rirv938/llama_8b_1024_tokens_context_3m_step_11718 | rirv938-llama-8b-1024-t_67568_v3 | 7495 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/llama_8b_1024_to | 2025-02-27 | single | | |
rirv938 | 1 | 296.0 | 1.0 | 1310.8 | 1353.66 | 0.52 | 0.99 | chaiml-grok-payloads-gr_12038_v1 | 24B | ChaiML/grok_payloads_grpo_cp312_98ff_b35_r1_merged | chaiml-grok-payloads-gr_12038_v1 | 7726 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/grok_payloads_grp | 2025-07-09 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 297.0 | 1.0 | 1310.75 | 1353.66 | 0.52 | 0.99 | rirv938-100p-0ff-rirv93_62906_v1 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp780_v3 | rirv938-100p-0ff-rirv93_62906_v1 | 6407 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-02 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 298.0 | 1.0 | 1310.74 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp312-_84193_v5 | 24B | rirv938/exp_grpo_cp312_96ff_b4_r1_less_ff_merged | rirv938-exp-grpo-cp312-_84193_v5 | 8242 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-26 | single | | |
rirv938 | 1 | 299.0 | 1.0 | 1310.73 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp312-_84193_v6 | 24B | rirv938/exp_grpo_cp312_96ff_b4_r1_less_ff_merged | rirv938-exp-grpo-cp312-_84193_v6 | 5504 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-30 | single | | |
rirv938 | 1 | 300.0 | 1.0 | 1310.61 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp31_77415_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b6_r1_merged | rirv938-slerp-grpo-cp31_77415_v1 | 7200 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-24 | single | | |
rirv938 | 1 | 301.0 | 1.0 | 1310.52 | 1353.66 | 0.53 | 0.99 | rirv938-exp-grpo-cp312-_36697_v1 | 24B | rirv938/exp_grpo_cp312_96ff_b4_r1_merged | rirv938-exp-grpo-cp312-_36697_v1 | 5682 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-22 | single | | |
rirv938 | 1 | 302.0 | 1.0 | 1310.37 | 1353.66 | 0.57 | 0.99 | rirv938-20250411-reward_50080_v1 | 8B | rirv938/20250411_reward_safety_2_removed | rirv938-20250411-reward_50080_v1 | 15249 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250411_reward_ | 2025-04-11 | single | | |
rirv938 | 1 | 303.0 | 1.0 | 1310.3 | 1353.66 | 0.56 | 0.99 | chaiml-panflute-v1-rirv_23337_v3 | 24B | ChaiML/panflute_v1_rirv938_20250423 | chaiml-panflute-v1-rirv_23337_v3 | 6505 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/panflute_v1_rirv9 | 2025-04-22 | single | 1.44 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 304.0 | 1.0 | 1310.25 | 1353.66 | 0.54 | 0.99 | rirv938-mistral-24b-rou_91022_v2 | 24B | rirv938/mistral_24b_round_2_dpo_40k_85w_pref_20w_swear_2500_v2 | rirv938-mistral-24b-rou_91022_v2 | 12143 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-06 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 305.0 | 1.0 | 1310.16 | 1353.66 | 0.54 | 0.99 | chaiml-exp14-exp9dpoft-_65674_v7 | 24B | ChaiML/exp14-exp9DPOFt-chaidatav1dpo6k-24B | chaiml-exp14-exp9dpoft-_65674_v7 | 5857 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp14-exp9DPOFt-c | 2025-05-22 | single | | |
rirv938 | 1 | 306.0 | 1.0 | 1310.13 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp31_22331_v2 | 24B | rirv938/slerp_grpo_cp312_96ff_b5_r1_merged | rirv938-slerp-grpo-cp31_22331_v2 | 7428 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-23 | single | | |
rirv938 | 1 | 307.5 | 1.0 | 1309.82 | 1353.66 | 0.54 | 0.99 | rirv938-mistral-12b-dpo_28324_v3 | 13B | rirv938/mistral_12b_dpo_40k_3561_64_output_tokens_v2 | rirv938-mistral-12b-dpo_28324_v3 | 6088 | 61115860 | 0.57 | 0.65 | basic | | 8.0 | 768.0 | 96.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.03 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 307.5 | 1.0 | 1309.82 | 1353.66 | 0.51 | 0.99 | rirv938-gy-grpo-cp624-9_14536_v3 | 24B | rirv938/gy_grpo_cp624_98ff_b35_r1_merged | rirv938-gy-grpo-cp624-9_14536_v3 | 7332 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/gy_grpo_cp624_98 | 2025-07-09 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 309.0 | 1.0 | 1309.75 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp31_51162_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b6_r2_merged | rirv938-slerp-grpo-cp31_51162_v1 | 7936 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-24 | single | | |
rirv938 | 1 | 310.0 | 1.0 | 1309.58 | 1353.66 | 0.54 | 0.99 | chaiml-exp-grpo-cp312-9_39529_v3 | 24B | ChaiML/exp_grpo_cp312_96ff_b4_r1_less_ff_merged | chaiml-exp-grpo-cp312-9_39529_v3 | 21482 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp_grpo_cp312_96 | 2025-06-05 | single | | |
rirv938 | 1 | 311.0 | 1.0 | 1309.55 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_88254_v2 | 13B | rirv938/anthropic_beta_2_40k_2496_bo8_100w_b4_v2 | rirv938-anthropic-beta-_88254_v2 | 13017 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-31 | single | 1.64 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 312.0 | 1.0 | 1309.54 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp624-_29644_v2 | 24B | rirv938/exp_grpo_cp624_96ff_b7_r1_merged | rirv938-exp-grpo-cp624-_29644_v2 | 7220 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-24 | single | | |
rirv938 | 1 | 313.0 | 1.0 | 1309.49 | 1353.66 | 0.5 | 0.99 | chaiml-gy-grpo-cp624-98f_2782_v2 | 24B | ChaiML/gy_grpo_cp624_98ff_b35_r1_merged | chaiml-gy-grpo-cp624-98f_2782_v2 | 7183 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/gy_grpo_cp624_98f | 2025-07-09 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 314.0 | 1.0 | 1309.47 | 1353.66 | 0.58 | 0.99 | rirv938-slerp-grpo-cp31_98528_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b4_r1_merged | rirv938-slerp-grpo-cp31_98528_v1 | 6290 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-22 | single | | |
rirv938 | 1 | 315.0 | 1.0 | 1309.28 | 1353.66 | 0.54 | 0.99 | function_ditot_2025-02-27 | | | retune_with_base | 5725 | 61115860 | 0.55 | 0.65 | function | | | | | | | 2025-02-27 | single | | |
rirv938 | 1 | 316.0 | 1.0 | 1309.26 | 1353.66 | 0.58 | 0.99 | rirv938-anthropic-beta-_88981_v1 | 13B | rirv938/anthropic_beta_2_40k_1872_bo8_95w_v2 | rirv938-anthropic-beta-_88981_v1 | 16042 | 61115860 | 0.55 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 2.87 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 317.0 | 1.0 | 1309.24 | 1353.66 | 0.56 | 0.99 | rirv938-grpo-to-compare_44163_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp156_lr9_merged | rirv938-grpo-to-compare_44163_v1 | 10350 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-26 | single | 1.42 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 318.0 | 1.0 | 1309.16 | 1353.66 | 0.54 | 0.99 | rirv938-20250331-reward_78765_v2 | 8B | rirv938/20250331_reward_ablation_bon_256 | rirv938-20250331-reward_78765_v2 | 9092 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250331_reward_ | 2025-03-31 | single | | |
rirv938 | 1 | 319.0 | 1.0 | 1309.1 | 1353.66 | 0.54 | 0.99 | rirv938-98p-2ff-chaiml-_19088_v1 | 24B | rirv938/98p_2ff_chaiml_slerpv5_mistral_24540_v17_cp500_merged | rirv938-98p-2ff-chaiml-_19088_v1 | 11908 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_chaiml_s | 2025-06-10 | single | | |
rirv938 | 1 | 320.0 | 1.0 | 1309.08 | 1353.66 | 0.58 | 0.99 | rirv938-anthropic-grpo-_55424_v2 | 13B | rirv938/anthropic_grpo_40k_cp296_95ff_merged | rirv938-anthropic-grpo-_55424_v2 | 7744 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-04-28 | single | 1.61 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 321.0 | 1.0 | 1309.02 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_75151_v2 | 13B | rirv938/anthropic_beta_2_40k_2496_bo8_95w_v2 | rirv938-anthropic-beta-_75151_v2 | 17365 | 61115860 | 0.55 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 1.82 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 322.0 | 1.0 | 1309.0 | 1353.66 | 0.59 | 0.99 | rirv938-mistral-24b-grp_36770_v1 | 24B | rirv938/mistral_24b_grpo_40k_cp296_92ff_merged | rirv938-mistral-24b-grp_36770_v1 | 10014 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-04-28 | single | 1.46 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 323.0 | 1.0 | 1308.9 | 1353.66 | 0.58 | 0.99 | rirv938-slerp-grpo-cp624_1506_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b4_r1_merged | rirv938-slerp-grpo-cp624_1506_v1 | 6273 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-22 | single | | |
rirv938 | 1 | 324.0 | 1.0 | 1308.87 | 1353.66 | 0.52 | 0.99 | rirv938-98p-2ff-chaiml-_32109_v1 | 24B | rirv938/98p_2ff_chaiml_exp14_exp9dpoft_65674_v14_cp484_merged | rirv938-98p-2ff-chaiml-_32109_v1 | 8569 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_chaiml_e | 2025-06-09 | single | | |
rirv938 | 1 | 325.0 | 1.0 | 1308.84 | 1353.66 | 0.53 | 0.99 | rirv938-llama-8b-256-to_50255_v6 | 8B | rirv938/llama_8b_256_tokens_context_3m_step_11718 | rirv938-llama-8b-256-to_50255_v6 | 14721 | 61115860 | 0.55 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/llama_8b_256_tok | 2025-02-28 | single | | |
rirv938 | 1 | 326.0 | 1.0 | 1308.82 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-cp62_73478_v2 | 13B | rirv938/rinen_grpo_cp624_97ff_ava_bo1_b4_80k_merged | rirv938-rinen-grpo-cp62_73478_v2 | 5740 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp624 | 2025-05-21 | single | | |
rirv938 | 1 | 327.0 | 1.0 | 1308.78 | 1353.66 | 0.57 | 0.99 | rirv938-tune-mistral-gr_11107_v1 | 24B | rirv938/tune_mistral_grpo_cp1184_92ff_v3_run3_merged | rirv938-tune-mistral-gr_11107_v1 | 8783 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-04-30 | single | 1.74 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 328.0 | 1.0 | 1308.54 | 1353.66 | 0.54 | 0.99 | chaiml-exp-grpo-cp624-96_5228_v2 | 24B | ChaiML/exp_grpo_cp624_96ff_b6_r1_merged | chaiml-exp-grpo-cp624-96_5228_v2 | 5427 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp_grpo_cp624_96 | 2025-05-31 | single | | |
rirv938 | 1 | 329.0 | 1.0 | 1308.53 | 1353.66 | 0.55 | 0.99 | rirv938-96p-4ff-rirv938_92749_v1 | 24B | rirv938/96p_4ff_rirv938_1000_sim_100p_0_17599_v1_cp1060_merged | rirv938-96p-4ff-rirv938_92749_v1 | 6343 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-04-21 | single | 1.41 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 330.0 | 1.0 | 1308.48 | 1353.66 | 0.54 | 0.99 | rirv938-exp-grpo-cp624-_38275_v1 | 24B | rirv938/exp_grpo_cp624_96ff_b8_r1_merged | rirv938-exp-grpo-cp624-_38275_v1 | 6394 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-24 | single | | |
rirv938 | 1 | 331.0 | 1.0 | 1308.46 | 1353.66 | 0.55 | 0.99 | rirv938-40k-98p-2ff-rir_73607_v1 | 24B | rirv938/40k_98p_2ff_rirv938_mistral_24b_bon_82623_v1_cp936_merged | rirv938-40k-98p-2ff-rir_73607_v1 | 7668 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/40k_98p_2ff_rirv | 2025-04-09 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 332.0 | 1.0 | 1308.4 | 1353.66 | 0.55 | 0.99 | rirv938-rinen-grpo-cp31_12130_v1 | 13B | rirv938/rinen_grpo_cp312_97ff_ava_bo1_b4_merged | rirv938-rinen-grpo-cp31_12130_v1 | 6420 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp312 | 2025-05-21 | single | | |
rirv938 | 1 | 333.0 | 1.0 | 1308.39 | 1353.66 | 0.5 | 0.99 | rirv938-gy-grpo-cp624-9_14536_v2 | 24B | rirv938/gy_grpo_cp624_98ff_b35_r1_merged | rirv938-gy-grpo-cp624-9_14536_v2 | 7349 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/gy_grpo_cp624_98 | 2025-07-09 | single | 1.32 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 334.0 | 1.0 | 1308.31 | 1353.66 | 0.54 | 0.99 | rirv938-rinen-grpo-cp156_9482_v1 | 13B | rirv938/rinen_grpo_cp156_97ff_mixed_rm_b4_merged | rirv938-rinen-grpo-cp156_9482_v1 | 8635 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp156 | 2025-05-21 | single | | |
rirv938 | 1 | 335.5 | 1.0 | 1308.3 | 1353.66 | 0.55 | 0.99 | rirv938-20250411-reward_70981_v1 | 8B | rirv938/20250411_reward_safety_no_removed | rirv938-20250411-reward_70981_v1 | 7128 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250411_reward_ | 2025-04-11 | single | | |
rirv938 | 1 | 335.5 | 1.0 | 1308.3 | 1353.66 | 0.54 | 0.99 | blend_tutok_2025-05-01 | n/a | | rob_ab_test | 9073 | 61115860 | 0.52 | 0.65 | blend | | | | | | | 2025-05-01 | blended | | |
rirv938 | 1 | 337.0 | 1.0 | 1308.16 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_55424_v6 | 13B | rirv938/anthropic_grpo_40k_cp296_95ff_merged | rirv938-anthropic-grpo-_55424_v6 | 7120 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.6 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 338.0 | 1.0 | 1308.15 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp31_70857_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b4_r1_lr_merged | rirv938-slerp-grpo-cp31_70857_v1 | 6705 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-23 | single | | |
rirv938 | 1 | 339.0 | 1.0 | 1308.12 | 1353.66 | 0.53 | 0.99 | rirv938-mistral-24b-bas_54279_v1 | 24B | rirv938/mistral_24b_base_2_dpo_40k_95w_pref_2500_v2 | rirv938-mistral-24b-bas_54279_v1 | 8419 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_base | 2025-03-05 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 340.0 | 1.0 | 1308.09 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp62_11749_v2 | 24B | rirv938/slerp_grpo_cp624_96ff_b5_r1_merged | rirv938-slerp-grpo-cp62_11749_v2 | 5816 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-22 | single | | |
rirv938 | 1 | 341.0 | 1.0 | 1308.04 | 1353.66 | 0.57 | 0.99 | rirv938-5k-98p-2ff-rirv_87701_v1 | 24B | rirv938/5k_98p_2ff_rirv938_mistral_24b_bon_31129_v6_cp312_v4 | rirv938-5k-98p-2ff-rirv_87701_v1 | 6551 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/5k_98p_2ff_rirv9 | 2025-04-01 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 342.0 | 1.0 | 1307.89 | 1353.66 | 0.55 | 0.99 | rirv938-rinen-grpo-cp156_9412_v1 | 13B | rirv938/rinen_grpo_cp156_97ff_ava_bo1_b4_merged | rirv938-rinen-grpo-cp156_9412_v1 | 8558 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp156 | 2025-05-21 | single | | |
rirv938 | 1 | 343.5 | 1.0 | 1307.81 | 1353.66 | 0.54 | 0.99 | function_jedim_2025-06-12 | | | dpo_data_collection | 7939 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-06-11 | single | | |
rirv938 | 1 | 343.5 | 1.0 | 1307.81 | 1353.66 | 0.52 | 0.99 | rirv938-20k-100p-0ff-ri_70659_v4 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp468_merged | rirv938-20k-100p-0ff-ri_70659_v4 | 5986 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-16 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 345.0 | 1.0 | 1307.8 | 1353.66 | 0.54 | 0.99 | rirv938-20250331-reward_37564_v1 | 8B | rirv938/20250331_reward_ablation_random | rirv938-20250331-reward_37564_v1 | 10918 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250331_reward_ | 2025-03-31 | single | | |
rirv938 | 1 | 346.0 | 1.0 | 1307.74 | 1353.66 | 0.55 | 0.99 | rirv938-exp-grpo-cp624-_38275_v2 | 24B | rirv938/exp_grpo_cp624_96ff_b8_r1_merged | rirv938-exp-grpo-cp624-_38275_v2 | 6452 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp624_9 | 2025-05-24 | single | | |
rirv938 | 1 | 347.0 | 1.0 | 1307.73 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_75042_v1 | 13B | rirv938/anthropic_grpo_40k_cp156_96ff_new_rm_b3_merged | rirv938-anthropic-grpo-_75042_v1 | 9386 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 348.0 | 1.0 | 1307.5 | 1353.66 | 0.59 | 0.99 | rirv938-20250411-reward_71097_v1 | 8B | rirv938/20250411_reward_safety_4_removed | rirv938-20250411-reward_71097_v1 | 13049 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250411_reward_ | 2025-04-11 | single | | |
rirv938 | 1 | 349.0 | 1.0 | 1307.49 | 1353.66 | 0.63 | 0.99 | rirv938-96p-4ff-chaiml-_10106_v1 | 24B | rirv938/96p_4ff_chaiml_slerpv5_mistral3_24540_v2_cp1936_merged | rirv938-96p-4ff-chaiml-_10106_v1 | 20052 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_chaiml_s | 2025-06-07 | single | | |
rirv938 | 1 | 350.0 | 1.0 | 1307.47 | 1353.66 | 0.58 | 0.99 | function_panem_2025-04-02 | | | dpo_data_collection | 9553 | 61115860 | 0.55 | 0.65 | function | | | | | | | 2025-04-02 | single | | |
rirv938 | 1 | 351.0 | 1.0 | 1307.46 | 1353.66 | 0.49 | 0.99 | rirv938-simp-grpo-cp312_25497_v1 | 24B | rirv938/simp_grpo_cp312_96ff_b3_r1_12m_US_merged | rirv938-simp-grpo-cp312_25497_v1 | 8492 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp312_ | 2025-06-30 | single | 1.38 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 352.0 | 1.0 | 1307.41 | 1353.66 | 0.55 | 0.99 | rirv938-exp-grpo-cp312-_36697_v3 | 24B | rirv938/exp_grpo_cp312_96ff_b4_r1_merged | rirv938-exp-grpo-cp312-_36697_v3 | 7659 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/exp_grpo_cp312_9 | 2025-05-26 | single | | |
rirv938 | 1 | 353.0 | 1.0 | 1307.24 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_65405_v1 | 13B | rirv938/anthropic_grpo_40k_cp780_96ff_new_rm_b5_merged | rirv938-anthropic-grpo-_65405_v1 | 6733 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 354.0 | 1.0 | 1307.2 | 1353.66 | 0.53 | 0.99 | rirv938-20k-100p-0ff-ri_70659_v6 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp468_merged | rirv938-20k-100p-0ff-ri_70659_v6 | 6699 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-16 | single | 0.81 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 355.0 | 1.0 | 1307.19 | 1353.66 | 0.52 | 0.99 | rirv938-mistral-24b-bas_54279_v3 | 24B | rirv938/mistral_24b_base_2_dpo_40k_95w_pref_2500_v2 | rirv938-mistral-24b-bas_54279_v3 | 10519 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_base | 2025-03-06 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 356.0 | 1.0 | 1307.18 | 1353.66 | 0.52 | 0.99 | rirv938-20k-100p-0ff-ri_70659_v3 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp468_merged | rirv938-20k-100p-0ff-ri_70659_v3 | 6118 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-16 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 357.0 | 1.0 | 1307.01 | 1353.66 | 0.52 | 0.99 | rirv938-dpo-to-compare-_98349_v1 | 24B | rirv938/dpo_to_compare_to_grpo_10k_cp310_b2_merged | rirv938-dpo-to-compare-_98349_v1 | 8757 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/dpo_to_compare_t | 2025-04-26 | single | 1.44 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 358.0 | 1.0 | 1306.97 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-2_6346_v2 | 13B | rirv938/anthropic_beta_2_40k_2496_bo4_v2 | rirv938-anthropic-beta-2_6346_v2 | 12431 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-31 | single | 1.64 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 359.0 | 1.0 | 1306.94 | 1353.66 | 0.51 | 0.99 | rirv938-mistral-24b-rou_50061_v3 | 24B | rirv938/mistral_24b_round_2_dpo_40k_95w_pref_2500_v2 | rirv938-mistral-24b-rou_50061_v3 | 10296 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-06 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 360.0 | 1.0 | 1306.89 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-cp31_26298_v1 | 13B | rirv938/rinen_grpo_cp312_97ff_ava_bo1_b4_round2_merged | rirv938-rinen-grpo-cp31_26298_v1 | 7401 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp312 | 2025-05-21 | single | | |
rirv938 | 1 | 361.0 | 1.0 | 1306.81 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_49826_v1 | 13B | rirv938/anthropic_grpo_40k_cp1184_95ff_beta6_3_merged | rirv938-anthropic-grpo-_49826_v1 | 10252 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-17 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 362.0 | 1.0 | 1306.8 | 1353.66 | 0.55 | 0.99 | rirv938-rinen-grpo-cp62_73478_v1 | 13B | rirv938/rinen_grpo_cp624_97ff_ava_bo1_b4_80k_merged | rirv938-rinen-grpo-cp62_73478_v1 | 6006 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp624 | 2025-05-21 | single | | |
rirv938 | 1 | 363.5 | 1.0 | 1306.78 | 1353.66 | 0.57 | 0.99 | rirv938-mistral-24b-dpo-_8520_v1 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_2500_instruct_dpo_1_v2 | rirv938-mistral-24b-dpo-_8520_v1 | 8443 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-02-23 | single | 0.76 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 363.5 | 1.0 | 1306.78 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_65100_v1 | 13B | rirv938/anthropic_grpo_40k_cp2368_95ff_beta6_3_merged | rirv938-anthropic-grpo-_65100_v1 | 9127 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-17 | single | 1.65 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 365.0 | 1.0 | 1306.77 | 1353.66 | 0.49 | 0.99 | rirv938-simp-grpo-cp312_69371_v1 | 24B | rirv938/simp_grpo_cp312_2ff_b2_r1_ava_rm_merged | rirv938-simp-grpo-cp312_69371_v1 | 6797 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp312_ | 2025-07-02 | single | 1.37 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 366.0 | 1.0 | 1306.75 | 1353.66 | 0.64 | 0.99 | rirv938-95p-5ff-rirv938-_6463_v1 | 24B | rirv938/95p_5ff_rirv938_95p_5ff_rirv938_66486_v1_cp1248_merged | rirv938-95p-5ff-rirv938-_6463_v1 | 7737 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/95p_5ff_rirv938_ | 2025-04-11 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 367.0 | 1.0 | 1306.74 | 1353.66 | 0.58 | 0.99 | rirv938-slerp-grpo-cp62_11749_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b5_r1_merged | rirv938-slerp-grpo-cp62_11749_v1 | 5615 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-22 | single | | |
rirv938 | 1 | 368.0 | 1.0 | 1306.64 | 1353.66 | 0.52 | 0.99 | rirv938-mistral-24b-bas_54279_v2 | 24B | rirv938/mistral_24b_base_2_dpo_40k_95w_pref_2500_v2 | rirv938-mistral-24b-bas_54279_v2 | 8506 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_base | 2025-03-06 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 369.0 | 1.0 | 1306.6 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-_54778_v3 | 13B | rirv938/anthropic_beta_2_40k_2496_bo8_v2 | rirv938-anthropic-beta-_54778_v3 | 12124 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-31 | single | 1.65 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 370.0 | 1.0 | 1306.57 | 1353.66 | 0.54 | 0.99 | rirv938-100p-0ff-rirv93_35621_v2 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_lex__1090_v2_cp748_merged | rirv938-100p-0ff-rirv93_35621_v2 | 7918 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-21 | single | 0.63 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 371.0 | 1.0 | 1306.51 | 1353.66 | 0.57 | 0.99 | chaiml-slerpv5-reward-d_98061_v1 | 24B | ChaiML/slerpv5_reward_dpo_rl_ff | chaiml-slerpv5-reward-d_98061_v1 | 8661 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerpv5_reward_dp | 2025-06-11 | single | | |
rirv938 | 1 | 372.0 | 1.0 | 1306.47 | 1353.66 | 0.56 | 0.99 | rirv938-mistral-24b-dpo_20225_v1 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_3750_instruct_dpo_1_v2 | rirv938-mistral-24b-dpo_20225_v1 | 6744 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-02-23 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 373.0 | 1.0 | 1306.43 | 1353.66 | 0.54 | 0.99 | rirv938-rinen-grpo-cp31_66645_v1 | 13B | rirv938/rinen_grpo_cp312_97ff_slerp_rm_b4_merged | rirv938-rinen-grpo-cp31_66645_v1 | 8774 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp312 | 2025-05-21 | single | | |
rirv938 | 1 | 374.5 | 1.0 | 1306.4 | 1353.66 | 0.56 | 0.99 | rirv938-1000-sim-100p-0_99519_v1 | 24B | rirv938/1000_sim_100p_0ff_rirv938_mistral_24b_lex__1090_v2_cp124_v9_merged | rirv938-1000-sim-100p-0_99519_v1 | 6938 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/1000_sim_100p_0f | 2025-04-21 | single | 1.45 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 374.5 | 1.0 | 1306.4 | 1353.66 | 0.52 | 0.99 | chaiml-20250411-rob-ava-_6550_v3 | 8B | ChaiML/20250411_rob_ava_reward_300k_safety_threshold_1_2 | chaiml-20250411-rob-ava-_6550_v3 | 5820 | 61115860 | 0.52 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | ChaiML/20250411_rob_ava_ | 2025-05-30 | single | | |
rirv938 | 1 | 376.0 | 1.0 | 1306.37 | 1353.66 | 0.57 | 0.99 | rirv938-5k-98p-2ff-rirv_43370_v1 | 24B | rirv938/5k_98p_2ff_rirv938_mistral_24b_bon_31129_v6_cp468_v4 | rirv938-5k-98p-2ff-rirv_43370_v1 | 7221 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/5k_98p_2ff_rirv9 | 2025-04-01 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 377.0 | 1.0 | 1306.22 | 1353.66 | 0.53 | 0.99 | chaiml-devstral-24b-dpo_14531_v3 | 24B | ChaiML/devstral-24b-dpos1-prefsftgrok-v1-2e-11k-1 | chaiml-devstral-24b-dpo_14531_v3 | 11302 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/devstral-24b-dpos | 2025-07-08 | single | 1.35 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 378.0 | 1.0 | 1306.16 | 1353.66 | 0.5 | 0.99 | rirv938-100p-0ff-rirv938_2517_v2 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_oai_77698_v2_cp374_merged | rirv938-100p-0ff-rirv938_2517_v2 | 5478 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-18 | single | 0.65 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 379.0 | 1.0 | 1306.06 | 1353.66 | 0.56 | 0.99 | rirv938-v9-pref-plus-03-_7925_v2 | 13B | rirv938/v9_pref_plus_03_mistral_1116_v2 | rirv938-v9-pref-plus-03-_7925_v2 | 19062 | 61115860 | 0.56 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/v9_pref_plus_03_ | 2024-12-22 | single | 1.77 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 380.5 | 1.0 | 1305.92 | 1353.66 | 0.57 | 0.99 | rirv938-mistral-24b-rou_70379_v1 | 24B | rirv938/mistral_24b_round_3_dpo_40k_65w_pref_10w_swear_2500_v2 | rirv938-mistral-24b-rou_70379_v1 | 11301 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-08 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 380.5 | 1.0 | 1305.92 | 1353.66 | 0.52 | 0.99 | rirv938-anthropic-grpo-_87408_v1 | 13B | rirv938/anthropic_grpo_40k_cp444_95ff_20ww_v3_merged | rirv938-anthropic-grpo-_87408_v1 | 7964 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-14 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 382.0 | 1.0 | 1305.89 | 1353.66 | 0.57 | 0.99 | rirv938-prefgrok-r2-cp6_85163_v1 | 24B | rirv938/prefgrok_r2_cp624_98ff_b5_v2_merged | rirv938-prefgrok-r2-cp6_85163_v1 | 6994 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_r2_cp62 | 2025-07-09 | single | 1.31 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 383.0 | 1.0 | 1305.78 | 1353.66 | 0.54 | 0.99 | chaiml-0sw-95p-5ff-rine_63828_v5 | 13B | ChaiML/0sw_95p_5ff_rinen0721_dpo_0130_cp3000_v8_merged | chaiml-0sw-95p-5ff-rine_63828_v5 | 6779 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/0sw_95p_5ff_rinen | 2025-05-21 | single | | |
rirv938 | 1 | 384.0 | 1.0 | 1305.72 | 1353.66 | 0.55 | 0.99 | function_befuf_2025-04-18 | | | dpo_data_collection | 7203 | 61115860 | 0.55 | 0.65 | function | | | | | | | 2025-04-18 | single | | |
rirv938 | 1 | 385.0 | 1.0 | 1305.71 | 1353.66 | 0.52 | 0.99 | function_febil_2025-03-28 | | | dpo_data_collection | 6510 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-03-28 | single | | |
rirv938 | 1 | 386.5 | 1.0 | 1305.67 | 1353.66 | 0.57 | 0.99 | rirv938-grpo-to-compare_97129_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp156_with_ff_merged | rirv938-grpo-to-compare_97129_v1 | 8880 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-28 | single | 1.46 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 386.5 | 1.0 | 1305.67 | 1353.66 | 0.65 | 0.99 | function_dijos_2025-04-11 | | | dpo_data_collection | 9355 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-04-11 | single | | |
rirv938 | 1 | 388.5 | 1.0 | 1305.66 | 1353.66 | 0.58 | 0.99 | rirv938-prefgrok-r2-cp3_99593_v1 | 24B | rirv938/prefgrok_r2_cp312_reformat_high_quality_merged | rirv938-prefgrok-r2-cp3_99593_v1 | 7565 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_r2_cp31 | 2025-07-08 | single | 1.29 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 388.5 | 1.0 | 1305.66 | 1353.66 | 0.49 | 0.99 | chaiml-simp-grpo-cp312-_43926_v1 | 24B | ChaiML/simp_grpo_cp312_96ff_b3_r1_12m_US_merged | chaiml-simp-grpo-cp312-_43926_v1 | 7665 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/simp_grpo_cp312_9 | 2025-07-09 | single | 1.58 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 390.0 | 1.0 | 1305.65 | 1353.66 | 0.55 | 0.99 | rirv938-mistral-24b-bas_95787_v1 | 24B | rirv938/mistral_24b_base_2_dpo_40k_85w_pref_20w_swear_2500_v2 | rirv938-mistral-24b-bas_95787_v1 | 10044 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_base | 2025-03-06 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 391.0 | 1.0 | 1305.6 | 1353.66 | 0.5 | 0.99 | chaiml-gy-grpo-cp624-98f_2782_v1 | 24B | ChaiML/gy_grpo_cp624_98ff_b35_r1_merged | chaiml-gy-grpo-cp624-98f_2782_v1 | 7534 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/gy_grpo_cp624_98f | 2025-07-09 | single | 1.62 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 392.0 | 1.0 | 1305.59 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_44019_v4 | 13B | rirv938/anthropic_grpo_40k_cp148_95ff_merged | rirv938-anthropic-grpo-_44019_v4 | 5852 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 393.0 | 1.0 | 1305.58 | 1353.66 | 0.57 | 0.99 | blend_hupub_2025-03-08 | n/a | | rob_ab_test | 8027 | 61115860 | 0.53 | 0.65 | blend | | | | | | | 2025-03-08 | blended | | |
rirv938 | 1 | 394.5 | 1.0 | 1305.51 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp15_72849_v1 | 24B | rirv938/slerp_grpo_cp156_96ff_b4_r1_merged | rirv938-slerp-grpo-cp15_72849_v1 | 6286 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp156 | 2025-05-22 | single | | |
rirv938 | 1 | 394.5 | 1.0 | 1305.51 | 1353.66 | 0.57 | 0.99 | chaiml-slerp-grpo-cp312_10606_v3 | 24B | ChaiML/slerp_grpo_cp312_96ff_b4_r1_lr3_merged | chaiml-slerp-grpo-cp312_10606_v3 | 5543 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerp_grpo_cp312_ | 2025-05-31 | single | | |
rirv938 | 1 | 396.0 | 1.0 | 1305.44 | 1353.66 | 0.56 | 0.99 | blend_fajer_2025-04-14 | n/a | | rob_ab_test | 7861856 | 61115860 | 0.53 | 0.65 | blend | | | | | | | 2025-04-14 | blended | | |
rirv938 | 1 | 397.0 | 1.0 | 1305.35 | 1353.66 | 0.55 | 0.99 | rirv938-0sw-95p-5ff-rin_34350_v1 | 13B | rirv938/0sw_95p_5ff_rinen0721_dpo_0130_cp3000_v8_merge | rirv938-0sw-95p-5ff-rin_34350_v1 | 7092 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/0sw_95p_5ff_rine | 2025-03-19 | single | 1.37 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 398.0 | 1.0 | 1305.29 | 1353.66 | 0.56 | 0.99 | rirv938-grpo-to-compare_34174_v2 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp312_lr8_merged | rirv938-grpo-to-compare_34174_v2 | 8713 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-26 | single | 1.4 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 399.0 | 1.0 | 1305.27 | 1353.66 | 0.57 | 0.99 | rirv938-96p-4ff-chaiml-_93679_v1 | 24B | rirv938/96p_4ff_chaiml_slerpv5_mistral_24540_v17_cp500_merged | rirv938-96p-4ff-chaiml-_93679_v1 | 11128 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_chaiml_s | 2025-06-10 | single | | |
rirv938 | 1 | 400.0 | 1.0 | 1305.24 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp62_62732_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b7_r1_merged | rirv938-slerp-grpo-cp62_62732_v1 | 6510 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-24 | single | | |
rirv938 | 1 | 401.0 | 1.0 | 1305.11 | 1353.66 | 0.59 | 0.99 | rirv938-slerp-grpo-cp31_22331_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b5_r1_merged | rirv938-slerp-grpo-cp31_22331_v1 | 6454 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-22 | single | | |
rirv938 | 1 | 402.0 | 1.0 | 1305.1 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_44658_v1 | 13B | rirv938/anthropic_grpo_40k_cp592_95ff_20ww_merged | rirv938-anthropic-grpo-_44658_v1 | 6228 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.5 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 403.0 | 1.0 | 1305.08 | 1353.66 | 0.53 | 0.99 | blend_lopul_2025-05-15 | n/a | | rob_ab_test | 7745 | 61115860 | 0.52 | 0.65 | blend | | | | | | | 2025-05-15 | blended | | |
rirv938 | 1 | 404.5 | 1.0 | 1305.07 | 1353.66 | 0.57 | 0.99 | rirv938-94p-6ff-rirv938_15029_v1 | 24B | rirv938/94p_6ff_rirv938_1000_sim_100p_0_17599_v1_cp1060_merged | rirv938-94p-6ff-rirv938_15029_v1 | 6333 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-21 | single | 1.46 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 404.5 | 1.0 | 1305.07 | 1353.66 | 0.55 | 0.99 | chaiml-0sw-95p-5ff-rine_63828_v2 | 13B | ChaiML/0sw_95p_5ff_rinen0721_dpo_0130_cp3000_v8_merged | chaiml-0sw-95p-5ff-rine_63828_v2 | 5774 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/0sw_95p_5ff_rinen | 2025-04-28 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 406.0 | 1.0 | 1304.9 | 1353.66 | 0.54 | 0.99 | rirv938-20k-100p-0ff-ri_69584_v1 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp312_v3 | rirv938-20k-100p-0ff-ri_69584_v1 | 5656 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-02 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 407.0 | 1.0 | 1304.86 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp31_41064_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b8_r1_merged | rirv938-slerp-grpo-cp31_41064_v1 | 7871 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-24 | single | | |
rirv938 | 1 | 408.0 | 1.0 | 1304.84 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_79367_v1 | 13B | rirv938/anthropic_grpo_40k_cp3588_96ff_new_rm_b5_merged | rirv938-anthropic-grpo-_79367_v1 | 7375 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-21 | single | | |
rirv938 | 1 | 409.0 | 1.0 | 1304.83 | 1353.66 | 0.57 | 0.99 | blend_laror_2025-04-14 | n/a | | rob_ab_test | 7857876 | 61115860 | 0.53 | 0.65 | blend | | | | | | | 2025-04-14 | blended | | |
rirv938 | 1 | 410.0 | 1.0 | 1304.8 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp46_19195_v1 | 24B | rirv938/slerp_grpo_cp468_96ff_b3_r1_20k_merged | rirv938-slerp-grpo-cp46_19195_v1 | 10061 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp468 | 2025-06-10 | single | | |
rirv938 | 1 | 411.0 | 1.0 | 1304.67 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_82907_v1 | 13B | rirv938/anthropic_grpo_40k_cp1776_95ff_beta6_3_merged | rirv938-anthropic-grpo-_82907_v1 | 10081 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-17 | single | 1.57 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 412.0 | 1.0 | 1304.64 | 1353.66 | 0.54 | 0.99 | chaiml-exp-grpo-cp624-96_5228_v3 | 24B | ChaiML/exp_grpo_cp624_96ff_b6_r1_merged | chaiml-exp-grpo-cp624-96_5228_v3 | 21435 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp_grpo_cp624_96 | 2025-06-05 | single | | |
rirv938 | 1 | 413.0 | 1.0 | 1304.63 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-4_2727_v2 | 13B | rirv938/anthropic_grpo_40k_cp888_95ff_20ww2_merged | rirv938-anthropic-grpo-4_2727_v2 | 7420 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.59 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 414.0 | 1.0 | 1304.6 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_51376_v4 | 13B | rirv938/anthropic_grpo_40k_cp592_95ff_merged | rirv938-anthropic-grpo-_51376_v4 | 6523 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.64 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 415.0 | 1.0 | 1304.57 | 1353.66 | 0.52 | 0.99 | blend_hogis_2025-05-15 | n/a | | rob_ab_test | 6717 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-15 | blended | | |
rirv938 | 1 | 416.0 | 1.0 | 1304.51 | 1353.66 | 0.5 | 0.99 | rirv938-gy-grpo-cp312-9_54074_v1 | 24B | rirv938/gy_grpo_cp312_98ff_b35_r1_merged | rirv938-gy-grpo-cp312-9_54074_v1 | 6652 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/gy_grpo_cp312_98 | 2025-07-02 | single | 1.58 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 417.0 | 1.0 | 1304.4 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_16989_v1 | 13B | rirv938/anthropic_beta_2_40k_3744_bo8_95w_v2 | rirv938-anthropic-beta-_16989_v1 | 13185 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 2.92 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 418.0 | 1.0 | 1304.39 | 1353.66 | 0.54 | 0.99 | rirv938-20250331-reward_78765_v1 | 8B | rirv938/20250331_reward_ablation_bon_256 | rirv938-20250331-reward_78765_v1 | 10139 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 256.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250331_reward_ | 2025-03-31 | single | | |
rirv938 | 1 | 419.0 | 1.0 | 1304.3 | 1353.66 | 0.57 | 0.99 | chaiml-slerpv5-mistral3_24540_v6 | 24B | ChaiML/slerpv5_mistral31_simpo_dpo_dpoold_s2 | chaiml-slerpv5-mistral3_24540_v6 | 5396 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerpv5_mistral31 | 2025-05-22 | single | | |
rirv938 | 1 | 420.0 | 1.0 | 1304.17 | 1353.66 | 0.53 | 0.99 | rirv938-100p-0ff-rirv93_86207_v1 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp312_v3 | rirv938-100p-0ff-rirv93_86207_v1 | 5794 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-02 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 421.0 | 1.0 | 1304.11 | 1353.66 | 0.56 | 0.99 | rirv938-mistral-24b-dpo_54609_v1 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_1250_instruct_dpo_1_v2 | rirv938-mistral-24b-dpo_54609_v1 | 7373 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-02-23 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 422.5 | 1.0 | 1304.09 | 1353.66 | 0.56 | 0.99 | rirv938-tune-mistral-gr_51403_v1 | 24B | rirv938/tune_mistral_grpo_cp592_92ff_v3_run3_merged | rirv938-tune-mistral-gr_51403_v1 | 6324 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-04-30 | single | 1.74 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 422.5 | 1.0 | 1304.09 | 1353.66 | 0.54 | 0.99 | function_nurir_2025-06-12 | | | dpo_data_collection | 11785 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-06-11 | single | | |
rirv938 | 1 | 424.5 | 1.0 | 1304.04 | 1353.66 | 0.51 | 0.99 | rirv938-mistral-24b-rou_50061_v2 | 24B | rirv938/mistral_24b_round_2_dpo_40k_95w_pref_2500_v2 | rirv938-mistral-24b-rou_50061_v2 | 8147 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-06 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 424.5 | 1.0 | 1304.04 | 1353.66 | 0.56 | 0.99 | function_gofas_2025-06-10 | | | dpo_data_collection | 10112 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-06-09 | single | | |
rirv938 | 1 | 426.0 | 1.0 | 1303.98 | 1353.66 | 0.53 | 0.99 | rirv938-20250331-reward_96848_v4 | 8B | rirv938/20250331_reward_ablation_bon | rirv938-20250331-reward_96848_v4 | 9350 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 256.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250331_reward_ | 2025-03-31 | single | | |
rirv938 | 1 | 427.0 | 1.0 | 1303.92 | 1353.66 | 0.49 | 0.99 | rirv938-bold-100p-0ff-ri_7996_v1 | 24B | rirv938/bold_100p_0ff_rirv938_mistral_24b_oai_77698_v2_cp372_merged | rirv938-bold-100p-0ff-ri_7996_v1 | 6411 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/bold_100p_0ff_ri | 2025-04-18 | single | 0.65 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 428.0 | 1.0 | 1303.89 | 1353.66 | 0.57 | 0.99 | rirv938-tune-mistral-gr_66976_v1 | 24B | rirv938/tune_mistral_grpo_cp62_92ff_merged | rirv938-tune-mistral-gr_66976_v1 | 7460 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-04-29 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 429.0 | 1.0 | 1303.86 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp62_11541_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b6_r1_merged | rirv938-slerp-grpo-cp62_11541_v1 | 9074 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-24 | single | | |
rirv938 | 1 | 430.0 | 1.0 | 1303.84 | 1353.66 | 0.61 | 0.99 | function_hadaf_2025-03-07 | | | retune_with_base | 8003 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-03-07 | single | | |
rirv938 | 1 | 431.0 | 1.0 | 1303.83 | 1353.66 | 0.61 | 0.99 | rirv938-anthropic-beta-_64925_v4 | 13B | rirv938/anthropic_beta_2_40k_2496_bo16_v2 | rirv938-anthropic-beta-_64925_v4 | 12087 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-31 | single | 1.75 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 432.0 | 1.0 | 1303.82 | 1353.66 | 0.53 | 0.99 | blend_disal_2025-05-01 | n/a | | rob_ab_test | 9671 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-01 | blended | | |
rirv938 | 1 | 433.0 | 1.0 | 1303.79 | 1353.66 | 0.54 | 0.99 | rirv938-llama-8b-1024-t_67568_v4 | 8B | rirv938/llama_8b_1024_tokens_context_3m_step_11718 | rirv938-llama-8b-1024-t_67568_v4 | 10490 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/llama_8b_1024_to | 2025-02-27 | single | | |
rirv938 | 1 | 434.0 | 1.0 | 1303.75 | 1353.66 | 0.58 | 0.99 | rirv938-mistral-24b-base_6604_v1 | 24B | rirv938/mistral_24b_base_2_dpo_40k_70w_pref_16w_swear_2500_v2 | rirv938-mistral-24b-base_6604_v1 | 9099 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_base | 2025-03-07 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 435.5 | 1.0 | 1303.71 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-4_3092_v4 | 13B | rirv938/anthropic_grpo_40k_cp888_95ff_merged | rirv938-anthropic-grpo-4_3092_v4 | 7456 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.67 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 435.5 | 1.0 | 1303.71 | 1353.66 | 0.57 | 0.99 | rirv938-98p-2ff-rirv938_86941_v1 | 24B | rirv938/98p_2ff_rirv938_mistral_24b_bon_31129_v6_cp625_v4 | rirv938-98p-2ff-rirv938_86941_v1 | 6405 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-01 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 437.0 | 1.0 | 1303.56 | 1353.66 | 0.55 | 0.99 | chaiml-exp-grpo-cp624-96_5228_v1 | 24B | ChaiML/exp_grpo_cp624_96ff_b6_r1_merged | chaiml-exp-grpo-cp624-96_5228_v1 | 5203 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp_grpo_cp624_96 | 2025-05-30 | single | | |
rirv938 | 1 | 438.0 | 1.0 | 1303.54 | 1353.66 | 0.55 | 0.99 | rirv938-80k-98p-2ff-rir_37615_v1 | 24B | rirv938/80k_98p_2ff_rirv938_mistral_24b_bon_82623_v1_cp936_merged | rirv938-80k-98p-2ff-rir_37615_v1 | 7124 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/80k_98p_2ff_rirv | 2025-04-08 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 439.0 | 1.0 | 1303.53 | 1353.66 | 0.53 | 0.99 | rirv938-groksyn-grpo-cp_67088_v3 | 24B | rirv938/groksyn_grpo_cp312_98ff_b35_r1_merged | rirv938-groksyn-grpo-cp_67088_v3 | 8794 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1536.0 | 64.0 | MistralForCausalLM | rirv938/groksyn_grpo_cp3 | 2025-07-07 | single | 0.99 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 440.0 | 1.0 | 1303.52 | 1353.66 | 0.53 | 0.99 | function_subir_2025-06-12 | | | dpo_data_collection | 9847 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-06-11 | single | | |
rirv938 | 1 | 441.5 | 1.0 | 1303.47 | 1353.66 | 0.52 | 0.99 | rirv938-98p-2ff-rirv938_33106_v1 | 24B | rirv938/98p_2ff_rirv938_1000_sim_100p_0_17599_v1_cp1060_merged | rirv938-98p-2ff-rirv938_33106_v1 | 6402 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-21 | single | 1.45 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 441.5 | 1.0 | 1303.47 | 1353.66 | 0.53 | 0.99 | function_pojif_2025-05-31 | | | dpo_data_collection | 6027 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-05-31 | single | | |
rirv938 | 1 | 443.5 | 1.0 | 1303.41 | 1353.66 | 0.56 | 0.99 | rirv938-1000-sim-100p-0_89759_v2 | 24B | rirv938/1000_sim_100p_0ff_rirv938_mistral_24b_lex__1090_v2_cp248_v9_merged | rirv938-1000-sim-100p-0_89759_v2 | 8183 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/1000_sim_100p_0f | 2025-04-21 | single | 1.43 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 443.5 | 1.0 | 1303.41 | 1353.66 | 0.54 | 0.99 | blend_jenet_2025-06-12 | n/a | | rob_ab_test | 8595 | 61115860 | 0.54 | 0.65 | blend | | | | | | | 2025-06-11 | blended | | |
rirv938 | 1 | 445.0 | 1.0 | 1303.38 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp31_62351_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b7_r1_merged | rirv938-slerp-grpo-cp31_62351_v1 | 6588 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-05-24 | single | | |
rirv938 | 1 | 446.5 | 1.0 | 1303.37 | 1353.66 | 0.53 | 0.99 | rirv938-98p-2ff-rirv938_42155_v3 | 24B | rirv938/98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp936_v3 | rirv938-98p-2ff-rirv938_42155_v3 | 7394 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-03-28 | single | 1.26 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 446.5 | 1.0 | 1303.37 | 1353.66 | 0.53 | 0.99 | chaiml-exp14-exp9dpoft-_65674_v6 | 24B | ChaiML/exp14-exp9DPOFt-chaidatav1dpo6k-24B | chaiml-exp14-exp9dpoft-_65674_v6 | 5776 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp14-exp9DPOFt-c | 2025-05-22 | single | | |
rirv938 | 1 | 448.0 | 1.0 | 1303.36 | 1353.66 | 0.58 | 0.99 | rirv938-mistral-24b-bas_69595_v1 | 24B | rirv938/mistral_24b_base_3_dpo_40k_70w_pref_10w_swear_2448_v2 | rirv938-mistral-24b-bas_69595_v1 | 10929 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_base | 2025-03-07 | single | 0.76 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 449.0 | 1.0 | 1303.35 | 1353.66 | 0.56 | 0.99 | rirv938-v9-pref-plus-03-_4881_v1 | 13B | rirv938/v9_pref_plus_03_mistral_558_v2 | rirv938-v9-pref-plus-03-_4881_v1 | 28566 | 61115860 | 0.55 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/v9_pref_plus_03_ | 2024-12-22 | single | 1.77 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 450.0 | 1.0 | 1303.33 | 1353.66 | 0.52 | 0.99 | rirv938-mistral-24b-rou_30981_v1 | 24B | rirv938/mistral_24b_round_2_dpo_40k_95w_pref_1250_v2 | rirv938-mistral-24b-rou_30981_v1 | 8713 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-05 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 451.0 | 1.0 | 1303.29 | 1353.66 | 0.58 | 0.99 | chaiml-slerpv5-mistral3_24540_v5 | 24B | ChaiML/slerpv5_mistral31_simpo_dpo_dpoold_s2 | chaiml-slerpv5-mistral3_24540_v5 | 5676 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerpv5_mistral31 | 2025-05-22 | single | | |
rirv938 | 1 | 452.0 | 1.0 | 1303.28 | 1353.66 | 0.56 | 0.99 | rirv938-grpo-to-compare_34174_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp312_lr8_merged | rirv938-grpo-to-compare_34174_v1 | 11379 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-26 | single | 1.45 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 453.0 | 1.0 | 1303.22 | 1353.66 | 0.53 | 0.99 | rirv938-llama-8b-256-to_50255_v5 | 8B | rirv938/llama_8b_256_tokens_context_3m_step_11718 | rirv938-llama-8b-256-to_50255_v5 | 9343 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 256.0 | 1.0 | LlamaForSequenceClassification | rirv938/llama_8b_256_tok | 2025-02-27 | single | | |
rirv938 | 1 | 454.0 | 1.0 | 1303.18 | 1353.66 | 0.56 | 0.99 | rirv938-5k-98p-2ff-rirv_20793_v1 | 24B | rirv938/5k_98p_2ff_rirv938_mistral_24b_bon_31129_v6_cp780_v4 | rirv938-5k-98p-2ff-rirv_20793_v1 | 7261 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/5k_98p_2ff_rirv9 | 2025-04-01 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 455.0 | 1.0 | 1303.15 | 1353.66 | 0.58 | 0.99 | rirv938-prefgrok-r2-cp3_32680_v1 | 24B | rirv938/prefgrok_r2_cp312_reformat_low_quality_merged | rirv938-prefgrok-r2-cp3_32680_v1 | 8479 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_r2_cp31 | 2025-07-08 | single | 1.33 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 456.0 | 1.0 | 1303.03 | 1353.66 | 0.53 | 0.99 | rirv938-llama-8b-1024-t_67568_v2 | 8B | rirv938/llama_8b_1024_tokens_context_3m_step_11718 | rirv938-llama-8b-1024-t_67568_v2 | 6192 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 256.0 | 1.0 | LlamaForSequenceClassification | rirv938/llama_8b_1024_to | 2025-02-27 | single | | |
rirv938 | 1 | 457.0 | 1.0 | 1302.99 | 1353.66 | 0.58 | 0.99 | rirv938-anthropic-beta-_39249_v1 | 13B | rirv938/anthropic_beta_2_40k_1248_bo8_100w_v2 | rirv938-anthropic-beta-_39249_v1 | 12210 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 1.73 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 458.0 | 1.0 | 1302.96 | 1353.66 | 0.56 | 0.99 | rirv938-1000-sim-100p-0_89759_v1 | 24B | rirv938/1000_sim_100p_0ff_rirv938_mistral_24b_lex__1090_v2_cp248_v9_merged | rirv938-1000-sim-100p-0_89759_v1 | 7904 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/1000_sim_100p_0f | 2025-04-21 | single | 1.45 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 459.0 | 1.0 | 1302.87 | 1353.66 | 0.54 | 0.99 | rirv938-mistral-24b-rou_91022_v1 | 24B | rirv938/mistral_24b_round_2_dpo_40k_85w_pref_20w_swear_2500_v2 | rirv938-mistral-24b-rou_91022_v1 | 11624 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-06 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 460.0 | 1.0 | 1302.79 | 1353.66 | 0.59 | 0.99 | rirv938-v10-pref-plus-03_8807_v1 | 13B | rirv938/v10_pref_plus_03_mistral_1116_v2 | rirv938-v10-pref-plus-03_8807_v1 | 28153 | 61115860 | 0.56 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/v10_pref_plus_03 | 2024-12-23 | single | 1.73 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 461.0 | 1.0 | 1302.76 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-2_60007_v1 | 13B | rirv938/anthropic_40k_2496_bo8_85w_b4_2xlora_lr4_v2 | rirv938-anthropic-40k-2_60007_v1 | 19425 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2025-01-01 | single | 1.62 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 462.0 | 1.0 | 1302.73 | 1353.66 | 0.55 | 0.99 | rirv938-rinen-grpo-cp31_76768_v1 | 13B | rirv938/rinen_grpo_cp312_97ff_mixed_rm_b4_merged | rirv938-rinen-grpo-cp31_76768_v1 | 6580 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp312 | 2025-05-21 | single | | |
rirv938 | 1 | 463.0 | 1.0 | 1302.72 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-cp15_91180_v1 | 13B | rirv938/rinen_grpo_cp1560_97ff_ava_bo1_b4_80k_merged | rirv938-rinen-grpo-cp15_91180_v1 | 7389 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp156 | 2025-05-21 | single | | |
rirv938 | 1 | 464.0 | 1.0 | 1302.68 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_88254_v1 | 13B | rirv938/anthropic_beta_2_40k_2496_bo8_100w_b4_v2 | rirv938-anthropic-beta-_88254_v1 | 12416 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 1.74 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 465.0 | 1.0 | 1302.6 | 1353.66 | 0.57 | 0.99 | rirv938-prefgrok-r2-cp3_99593_v2 | 24B | rirv938/prefgrok_r2_cp312_reformat_high_quality_merged | rirv938-prefgrok-r2-cp3_99593_v2 | 7387 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_r2_cp31 | 2025-07-08 | single | 1.33 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 466.0 | 1.0 | 1302.53 | 1353.66 | 0.53 | 0.99 | rirv938-groksyn-grpo-cp_95280_v1 | 24B | rirv938/groksyn_grpo_cp312_98ff_b35_r1_reformat_merged | rirv938-groksyn-grpo-cp_95280_v1 | 6582 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/groksyn_grpo_cp3 | 2025-07-07 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 467.0 | 1.0 | 1302.44 | 1353.66 | 0.56 | 0.99 | function_ketal_2025-01-27 | | | retune_with_base | 7554 | 61115860 | 0.55 | 0.65 | function | | | | | | | 2025-01-27 | single | | |
rirv938 | 1 | 468.0 | 1.0 | 1302.43 | 1353.66 | 0.54 | 0.99 | blend_perok_2025-06-12 | n/a | | rob_ab_test | 9142 | 61115860 | 0.54 | 0.65 | blend | | | | | | | 2025-06-11 | blended | | |
rirv938 | 1 | 469.0 | 1.0 | 1302.31 | 1353.66 | 0.57 | 0.99 | rirv938-prefgrok-r2-cp3_29730_v2 | 24B | rirv938/prefgrok_r2_cp312_98ff_b5_merged | rirv938-prefgrok-r2-cp3_29730_v2 | 7825 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_r2_cp31 | 2025-07-09 | single | 1.36 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 470.5 | 1.0 | 1302.29 | 1353.66 | 0.54 | 0.99 | rirv938-groksyn-grpo-cp_55837_v3 | 24B | rirv938/groksyn_grpo_cp624_98ff_b35_r1_merged | rirv938-groksyn-grpo-cp_55837_v3 | 8599 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1536.0 | 64.0 | MistralForCausalLM | rirv938/groksyn_grpo_cp6 | 2025-07-07 | single | 1.02 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 470.5 | 1.0 | 1302.29 | 1353.66 | 0.52 | 0.99 | rirv938-99p-1ff-nischayd_7844_v2 | 24B | rirv938/99p_1ff_nischaydnk_exp14_exp9dp_94555_v6_cp500_merged | rirv938-99p-1ff-nischayd_7844_v2 | 21811 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/99p_1ff_nischayd | 2025-06-08 | single | | |
rirv938 | 1 | 472.0 | 1.0 | 1302.28 | 1353.66 | 0.0 | 0.99 | function_belal_2025-06-25 | | | dpo_data_collection | 1917 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-06-25 | single | | |
rirv938 | 1 | 473.0 | 1.0 | 1302.25 | 1353.66 | 0.53 | 0.99 | nischaydnk-exp14-exp9dp_94555_v5 | 24B | NischayDnk/exp14-exp9DPOft-Chaidatav1dpo6k-Mistral24B | nischaydnk-exp14-exp9dp_94555_v5 | 6894 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | NischayDnk/exp14-exp9DPO | 2025-04-10 | single | 0.64 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 474.0 | 1.0 | 1302.14 | 1353.66 | 0.5 | 0.99 | rirv938-100p-0ff-rirv938_1567_v1 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_oai_77698_v1_cp374_merged | rirv938-100p-0ff-rirv938_1567_v1 | 6541 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-18 | single | 0.64 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 475.0 | 1.0 | 1302.12 | 1353.66 | 0.55 | 0.99 | rirv938-rinen-grpo-cp15_53211_v1 | 13B | rirv938/rinen_grpo_cp156_97ff_old_prompts_merged | rirv938-rinen-grpo-cp15_53211_v1 | 5942 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp156 | 2025-05-21 | single | | |
rirv938 | 1 | 476.0 | 1.0 | 1302.07 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_74526_v1 | 13B | rirv938/anthropic_grpo_40k_cp592_95ff_beta6_3_merged | rirv938-anthropic-grpo-_74526_v1 | 9684 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-17 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 477.0 | 1.0 | 1302.03 | 1353.66 | 0.49 | 0.99 | rirv938-simp-grpo-cp624_96435_v1 | 24B | rirv938/simp_grpo_cp624_96ff_b3_r1_12m_US_merged | rirv938-simp-grpo-cp624_96435_v1 | 9118 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp624_ | 2025-06-30 | single | 1.61 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 478.0 | 1.0 | 1301.95 | 1353.66 | 0.53 | 0.99 | chaiml-20250611-retune-u_1558_v1 | 8B | ChaiML/20250611_retune_US_7_to_13_seconds | chaiml-20250611-retune-u_1558_v1 | 8424 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | ChaiML/20250611_retune_U | 2025-06-11 | single | | |
rirv938 | 1 | 479.0 | 1.0 | 1301.89 | 1353.66 | 0.55 | 0.99 | blend_libok_2025-05-01 | n/a | | rob_ab_test | 9098 | 61115860 | 0.52 | 0.65 | blend | | | | | | | 2025-05-01 | blended | | |
rirv938 | 1 | 480.0 | 1.0 | 1301.65 | 1353.66 | 0.64 | 0.99 | rirv938-95p-5ff-rirv938_10719_v1 | 24B | rirv938/95p_5ff_rirv938_95p_5ff_rirv938_66486_v1_cp624_merged | rirv938-95p-5ff-rirv938_10719_v1 | 7737 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/95p_5ff_rirv938_ | 2025-04-11 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 481.0 | 1.0 | 1301.64 | 1353.66 | 0.57 | 0.99 | rirv938-prefgrok-r2-cp3_47407_v1 | 24B | rirv938/prefgrok_r2_cp312_98ff_b5_v2_merged | rirv938-prefgrok-r2-cp3_47407_v1 | 7425 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_r2_cp31 | 2025-07-09 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 482.0 | 1.0 | 1301.62 | 1353.66 | 0.63 | 0.99 | rirv938-96p-4ff-chaiml-_52095_v1 | 24B | rirv938/96p_4ff_chaiml_slerpv5_mistral3_24540_v2_cp1452_merged | rirv938-96p-4ff-chaiml-_52095_v1 | 20235 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_chaiml_s | 2025-06-07 | single | | |
rirv938 | 1 | 483.0 | 1.0 | 1301.59 | 1353.66 | 0.51 | 0.99 | rirv938-mistral-24b-rou_50061_v1 | 24B | rirv938/mistral_24b_round_2_dpo_40k_95w_pref_2500_v2 | rirv938-mistral-24b-rou_50061_v1 | 7640 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-05 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 484.5 | 1.0 | 1301.55 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_75151_v1 | 13B | rirv938/anthropic_beta_2_40k_2496_bo8_95w_v2 | rirv938-anthropic-beta-_75151_v1 | 13843 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 2.98 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 484.5 | 1.0 | 1301.55 | 1353.66 | 0.52 | 0.99 | chaiml-llama-8b-multihe_54063_v2 | 8B | ChaiML/llama_8b_multihead_204m_preference | chaiml-llama-8b-multihe_54063_v2 | 6034 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 1024.0 | 1.0 | LlamaForSequenceClassification | ChaiML/llama_8b_multihea | 2025-02-27 | single | | |
rirv938 | 1 | 486.0 | 1.0 | 1301.46 | 1353.66 | 0.52 | 0.99 | chaiml-20250411-rob-ava-_6550_v2 | 8B | ChaiML/20250411_rob_ava_reward_300k_safety_threshold_1_2 | chaiml-20250411-rob-ava-_6550_v2 | 5969 | 61115860 | 0.51 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | ChaiML/20250411_rob_ava_ | 2025-05-30 | single | | |
rirv938 | 1 | 487.0 | 1.0 | 1301.43 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_62978_v1 | 13B | rirv938/anthropic_grpo_40k_cp1184_95ff_6ww_v2_merged | rirv938-anthropic-grpo-_62978_v1 | 7776 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.59 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 488.0 | 1.0 | 1301.22 | 1353.66 | 0.53 | 0.99 | chaiml-20250611-retune-_68276_v1 | 8B | ChaiML/20250611_retune_app_for_week_less_swears | chaiml-20250611-retune-_68276_v1 | 7247 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | ChaiML/20250611_retune_a | 2025-06-11 | single | | |
rirv938 | 1 | 489.0 | 1.0 | 1301.21 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp15_79826_v2 | 24B | rirv938/slerp_grpo_cp156_96ff_b4_r1_lr3_merged | rirv938-slerp-grpo-cp15_79826_v2 | 5474 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp156 | 2025-05-23 | single | | |
rirv938 | 1 | 491.0 | 1.0 | 1301.14 | 1353.66 | 0.54 | 0.99 | rirv938-mistral-24b-bas_95787_v2 | 24B | rirv938/mistral_24b_base_2_dpo_40k_85w_pref_20w_swear_2500_v2 | rirv938-mistral-24b-bas_95787_v2 | 9999 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_base | 2025-03-06 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 491.0 | 1.0 | 1301.14 | 1353.66 | 0.54 | 0.99 | rirv938-datamix-v2-cp624_3841_v1 | 24B | rirv938/datamix_v2_cp624_98ff_b35_r1_reformat_high_quality_merged | rirv938-datamix-v2-cp624_3841_v1 | 10940 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/datamix_v2_cp624 | 2025-07-08 | single | 1.36 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 491.0 | 1.0 | 1301.14 | 1353.66 | 0.51 | 0.99 | rirv938-99p-1ff-nischay_62699_v2 | 24B | rirv938/99p_1ff_nischaydnk_exp14_exp9dp_94555_v6_cp1000_merged | rirv938-99p-1ff-nischay_62699_v2 | 15123 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/99p_1ff_nischayd | 2025-06-08 | single | | |
rirv938 | 1 | 493.0 | 1.0 | 1301.1 | 1353.66 | 0.41 | 0.99 | rirv938-b4-98p-2ff-rirv_19085_v2 | 24B | rirv938/b4_98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp936_v3 | rirv938-b4-98p-2ff-rirv_19085_v2 | 7215 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/b4_98p_2ff_rirv9 | 2025-03-28 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 494.0 | 1.0 | 1301.08 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp54_69036_v1 | 24B | rirv938/slerp_grpo_cp546_96ff_b3_r1_20k_merged | rirv938-slerp-grpo-cp54_69036_v1 | 8971 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp546 | 2025-06-10 | single | | |
rirv938 | 1 | 495.0 | 1.0 | 1301.07 | 1353.66 | 0.6 | 0.99 | rirv938-mistral-24b-dpo_29487_v1 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_1250_instruct_dpo_2_v2 | rirv938-mistral-24b-dpo_29487_v1 | 6139 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-02-23 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 496.0 | 1.0 | 1301.06 | 1353.66 | 0.55 | 0.99 | function_lehul_2025-03-08 | | | retune_with_base | 8796 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-03-08 | single | | |
rirv938 | 1 | 497.0 | 1.0 | 1301.0 | 1353.66 | 0.54 | 0.99 | chaiml-groksyn-grpo-cp3_82161_v1 | 24B | ChaiML/groksyn_grpo_cp312_98ff_b35_r1_merged | chaiml-groksyn-grpo-cp3_82161_v1 | 9672 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/groksyn_grpo_cp31 | 2025-07-09 | single | 1.36 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 498.0 | 1.0 | 1300.99 | 1353.66 | 0.53 | 0.99 | function_ragun_2025-06-12 | | | dpo_data_collection | 10873 | 61115860 | 0.55 | 0.65 | function | | | | | | | 2025-06-11 | single | | |
rirv938 | 1 | 499.0 | 1.0 | 1300.96 | 1353.66 | 0.53 | 0.99 | rirv938-20250521-rm-exp_v1 | 8B | rirv938/20250521_rm_exp | rirv938-20250521-rm-exp_v1 | 13159 | 61115860 | 0.54 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250521_rm_exp | 2025-06-08 | single | | |
rirv938 | 1 | 500.0 | 1.0 | 1300.91 | 1353.66 | 0.63 | 0.99 | rirv938-96p-4ff-chaiml-_75685_v1 | 24B | rirv938/96p_4ff_chaiml_slerpv5_mistral3_24540_v2_cp968_merged | rirv938-96p-4ff-chaiml-_75685_v1 | 20152 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_chaiml_s | 2025-06-07 | single | | |
rirv938 | 1 | 501.0 | 1.0 | 1300.82 | 1353.66 | 0.55 | 0.99 | rirv938-mistral-24b-rou_50261_v1 | 24B | rirv938/mistral_24b_round_3_dpo_40k_70w_pref_10w_swear_2500_v2 | rirv938-mistral-24b-rou_50261_v1 | 11334 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-07 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 502.0 | 1.0 | 1300.75 | 1353.66 | 0.5 | 0.99 | rirv938-simp-grpo-cp312_57442_v1 | 24B | rirv938/simp_grpo_cp312_96ff_b1_r1_merged | rirv938-simp-grpo-cp312_57442_v1 | 8659 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp312_ | 2025-06-10 | single | | |
rirv938 | 1 | 503.0 | 1.0 | 1300.7 | 1353.66 | 0.53 | 0.99 | rirv938-dpo-to-compare-_42409_v2 | 24B | rirv938/dpo_to_compare_to_grpo_10k_cp620_merged | rirv938-dpo-to-compare-_42409_v2 | 9700 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/dpo_to_compare_t | 2025-04-25 | single | 1.45 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 504.0 | 1.0 | 1300.66 | 1353.66 | 0.48 | 0.99 | rirv938-simp-grpo-cp624_58266_v1 | 24B | rirv938/simp_grpo_cp624_2ff_b2_r1_ava_rm_merged | rirv938-simp-grpo-cp624_58266_v1 | 6687 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp624_ | 2025-07-02 | single | 1.62 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 505.0 | 1.0 | 1300.62 | 1353.66 | 0.51 | 0.99 | rirv938-simp-grpo-cp624_75422_v1 | 24B | rirv938/simp_grpo_cp624_96ff_b3_r1_merged | rirv938-simp-grpo-cp624_75422_v1 | 9769 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp624_ | 2025-06-11 | single | | |
rirv938 | 1 | 506.0 | 1.0 | 1300.56 | 1353.66 | 0.59 | 0.99 | function_kimar_2025-06-07 | | | dpo_data_collection | 10613 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-06-07 | single | | |
rirv938 | 1 | 507.0 | 1.0 | 1300.51 | 1353.66 | 0.52 | 0.99 | chaiml-llama-8b-multihe_54063_v1 | 8B | ChaiML/llama_8b_multihead_204m_preference | chaiml-llama-8b-multihe_54063_v1 | 6285 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 256.0 | 1.0 | LlamaForSequenceClassification | ChaiML/llama_8b_multihea | 2025-02-27 | single | | |
rirv938 | 1 | 508.0 | 1.0 | 1300.45 | 1353.66 | 0.53 | 0.99 | rirv938-mistral-24b-rou_67411_v1 | 24B | rirv938/mistral_24b_round_2_dpo_40k_95w_pref_25w_swear_2500_v2 | rirv938-mistral-24b-rou_67411_v1 | 9426 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-06 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 509.0 | 1.0 | 1300.44 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-4_2727_v3 | 13B | rirv938/anthropic_grpo_40k_cp888_95ff_20ww2_merged | rirv938-anthropic-grpo-4_2727_v3 | 7135 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 510.0 | 1.0 | 1300.39 | 1353.66 | 0.52 | 0.99 | function_leguf_2025-03-18 | | | dpo_data_collection | 7759 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-03-17 | single | | |
rirv938 | 1 | 511.0 | 1.0 | 1300.25 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-beta-4-4_29933_v2 | 13B | rirv938/nitral_beta_4_40k_2496_v2 | rirv938-nitral-beta-4-4_29933_v2 | 15259 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/nitral_beta_4_40 | 2025-01-06 | single | 1.7 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 512.0 | 1.0 | 1300.22 | 1353.66 | 0.54 | 0.99 | chaiml-exp14-exp9dpoft_65674_v12 | 24B | ChaiML/exp14-exp9DPOFt-chaidatav1dpo6k-24B | chaiml-exp14-exp9dpoft_65674_v12 | 5664 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp14-exp9DPOFt-c | 2025-05-31 | single | | |
rirv938 | 1 | 513.0 | 1.0 | 1300.16 | 1353.66 | 0.54 | 0.99 | function_budes_2025-02-27 | | | retune_with_base | 5701 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-02-27 | single | | |
rirv938 | 1 | 514.0 | 1.0 | 1300.06 | 1353.66 | 0.63 | 0.99 | rirv938-0sw-90p-10ff-ri_52696_v1 | 13B | rirv938/0sw_90p_10ff_rinen0721_dpo_0130_cp3000_v8_merge | rirv938-0sw-90p-10ff-ri_52696_v1 | 7859 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/0sw_90p_10ff_rin | 2025-03-19 | single | 1.35 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 515.0 | 1.0 | 1300.05 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-24_7081_v1 | 13B | rirv938/anthropic_40k_2496_bo8_80w_no_filter_v2 | rirv938-anthropic-40k-24_7081_v1 | 20027 | 61115860 | 0.55 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2025-01-01 | single | 1.71 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 516.0 | 1.0 | 1300.04 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-cp15_10147_v1 | 13B | rirv938/rinen_grpo_cp156_97ff_ava_bo1_b4_round2_merged | rirv938-rinen-grpo-cp15_10147_v1 | 7299 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp156 | 2025-05-21 | single | | |
rirv938 | 1 | 517.0 | 1.0 | 1299.88 | 1353.66 | 0.5 | 0.99 | rirv938-bold-100p-0ff-r_37254_v1 | 24B | rirv938/bold_100p_0ff_rirv938_mistral_24b_oai_77698_v2_cp248_merged | rirv938-bold-100p-0ff-r_37254_v1 | 6469 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/bold_100p_0ff_ri | 2025-04-18 | single | 0.66 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 518.0 | 1.0 | 1299.83 | 1353.66 | 0.54 | 0.99 | chaiml-anthropic-grpo-4_66492_v4 | 13B | ChaiML/anthropic_grpo_40k_cp1184_95ff | chaiml-anthropic-grpo-4_66492_v4 | 6557 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/anthropic_grpo_40 | 2025-05-13 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 519.0 | 1.0 | 1299.82 | 1353.66 | 0.0 | 0.99 | chaiml-llama-8b-multih_78780_v25 | 8B | ChaiML/llama_8b_multihead_204m_512_v3_tokens_step_398208 | chaiml-llama-8b-multih_78780_v25 | 5999 | 61115860 | 0.55 | 0.65 | basic | | 1.0 | 2048.0 | 1.0 | MultiHeadLlamaClassifier | ChaiML/llama_8b_multihea | 2025-02-12 | single | | |
rirv938 | 1 | 520.0 | 1.0 | 1299.78 | 1353.66 | 0.55 | 0.99 | rirv938-llama-8b-multih_77470_v5 | 8B | rirv938/llama_8b_multihead_22m_256_tokens_step_15036_safety_oversampled | rirv938-llama-8b-multih_77470_v5 | 8750 | 61115860 | 0.55 | 0.65 | basic | | 1.0 | 256.0 | 1.0 | MultiHeadLlamaClassifier | rirv938/llama_8b_multihe | 2025-01-27 | single | | |
rirv938 | 1 | 521.0 | 1.0 | 1299.76 | 1353.66 | 0.53 | 0.99 | rirv938-mistral-24b-bas_90162_v2 | 24B | rirv938/mistral_24b_base_2_dpo_40k_95w_pref_1250_v2 | rirv938-mistral-24b-bas_90162_v2 | 7679 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_base | 2025-03-05 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 522.0 | 1.0 | 1299.72 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_74918_v3 | 13B | rirv938/anthropic_grpo_40k_cp1184_95ff_20ww_merged | rirv938-anthropic-grpo-_74918_v3 | 7544 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.67 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 523.0 | 1.0 | 1299.7 | 1353.66 | 0.54 | 0.99 | function_damif_2025-06-12 | | | dpo_data_collection | 8118 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-06-11 | single | | |
rirv938 | 1 | 524.0 | 1.0 | 1299.69 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-2_32301_v2 | 13B | rirv938/anthropic_40k_2496_bo8_85w_b4_2xlora_v2 | rirv938-anthropic-40k-2_32301_v2 | 15559 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2025-01-01 | single | 1.7 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 525.0 | 1.0 | 1299.68 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp31_49842_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b2_r1_20k_merged | rirv938-slerp-grpo-cp31_49842_v1 | 9697 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-06-10 | single | | |
rirv938 | 1 | 526.0 | 1.0 | 1299.59 | 1353.66 | 0.49 | 0.99 | rirv938-simp-grpo-cp312-_8272_v1 | 24B | rirv938/simp_grpo_cp312_98ff_b3_r2_12m_US_merged | rirv938-simp-grpo-cp312-_8272_v1 | 9866 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp312_ | 2025-06-30 | single | 1.62 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 527.0 | 1.0 | 1299.48 | 1353.66 | 0.6 | 0.99 | function_dutat_2025-04-01 | | | dpo_data_collection | 8533 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-04-01 | single | | |
rirv938 | 1 | 528.0 | 1.0 | 1299.46 | 1353.66 | 0.57 | 0.99 | rirv938-tune-mistral-gr_71092_v2 | 24B | rirv938/tune_mistral_grpo_cp296_92ff_v3_run_merged | rirv938-tune-mistral-gr_71092_v2 | 9025 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-04-30 | single | 1.75 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 529.0 | 1.0 | 1299.45 | 1353.66 | 0.51 | 0.99 | blend_jegan_2025-05-15 | n/a | | rob_ab_test | 8247 | 61115860 | 0.52 | 0.65 | blend | | | | | | | 2025-05-15 | blended | | |
rirv938 | 1 | 530.5 | 1.0 | 1299.44 | 1353.66 | 0.56 | 0.99 | rirv938-rinen-grpo-cp15_48820_v1 | 13B | rirv938/rinen_grpo_cp156_97ff_slerp_rm_b4_merged | rirv938-rinen-grpo-cp15_48820_v1 | 6608 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_cp156 | 2025-05-21 | single | | |
rirv938 | 1 | 530.5 | 1.0 | 1299.44 | 1353.66 | 0.53 | 0.99 | blend_nohis_2025-05-01 | n/a | | rob_ab_test | 9413 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-01 | blended | | |
rirv938 | 1 | 532.5 | 1.0 | 1299.41 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_23095_v1 | 13B | rirv938/anthropic_grpo_40k_cp296_95ff_20ww_merged | rirv938-anthropic-grpo-_23095_v1 | 6033 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.58 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 532.5 | 1.0 | 1299.41 | 1353.66 | 0.54 | 0.99 | rirv938-100p-0ff-rirv93_35621_v3 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_lex__1090_v2_cp748_merged | rirv938-100p-0ff-rirv93_35621_v3 | 7600 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-21 | single | 0.64 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 534.0 | 1.0 | 1299.33 | 1353.66 | 0.54 | 0.99 | function_bisem_2025-02-27 | | | retune_with_base | 6113 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-02-27 | single | | |
rirv938 | 1 | 535.0 | 1.0 | 1299.3 | 1353.66 | 0.59 | 0.99 | rirv938-mistral-12b-dpo_17482_v1 | 13B | rirv938/mistral_12b_dpo_40k_1187_96_output_tokens_much_ff_v2 | rirv938-mistral-12b-dpo_17482_v1 | 5682 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 96.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.03 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 536.5 | 1.0 | 1299.28 | 1353.66 | 0.49 | 0.99 | rirv938-simp-grpo-cp312_84936_v1 | 24B | rirv938/simp_grpo_cp312_2ff_b35_r1_ava_rm_merged | rirv938-simp-grpo-cp312_84936_v1 | 6254 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp312_ | 2025-07-02 | single | 1.62 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 536.5 | 1.0 | 1299.28 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp39_81606_v1 | 24B | rirv938/slerp_grpo_cp390_96ff_b3_r1_20k_merged | rirv938-slerp-grpo-cp39_81606_v1 | 12489 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp390 | 2025-06-10 | single | | |
rirv938 | 1 | 538.0 | 1.0 | 1299.27 | 1353.66 | 0.49 | 0.99 | rirv938-simp-grpo-cp624_37437_v1 | 24B | rirv938/simp_grpo_cp624_98ff_b3_r2_12m_US_merged | rirv938-simp-grpo-cp624_37437_v1 | 6971 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp624_ | 2025-06-30 | single | 1.62 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 539.0 | 1.0 | 1299.18 | 1353.66 | 0.5 | 0.99 | rirv938-simp-grpo-cp468_37238_v1 | 24B | rirv938/simp_grpo_cp468_96ff_b1_r1_merged | rirv938-simp-grpo-cp468_37238_v1 | 8724 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp468_ | 2025-06-10 | single | | |
rirv938 | 1 | 540.5 | 1.0 | 1299.16 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_74918_v2 | 13B | rirv938/anthropic_grpo_40k_cp1184_95ff_20ww_merged | rirv938-anthropic-grpo-_74918_v2 | 8750 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.61 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 540.5 | 1.0 | 1299.16 | 1353.66 | 0.5 | 0.99 | rirv938-99p-1ff-nischay_62699_v1 | 24B | rirv938/99p_1ff_nischaydnk_exp14_exp9dp_94555_v6_cp1000_merged | rirv938-99p-1ff-nischay_62699_v1 | 11184 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/99p_1ff_nischayd | 2025-06-08 | single | | |
rirv938 | 1 | 542.5 | 1.0 | 1299.13 | 1353.66 | 0.59 | 0.99 | rirv938-lr-2-mistral-1116-v2_v1 | 13B | rirv938/lr_2_mistral_1116_v2 | rirv938-lr-2-mistral-1116-v2_v1 | 15244 | 61115860 | 0.55 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/lr_2_mistral_111 | 2024-12-21 | single | 1.81 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 542.5 | 1.0 | 1299.13 | 1353.66 | 0.53 | 0.99 | rirv938-98p-2ff-rirv938_83757_v1 | 24B | rirv938/98p_2ff_rirv938_1000_sim_100p_0_17599_v1_cp530_merged | rirv938-98p-2ff-rirv938_83757_v1 | 6482 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-21 | single | 1.44 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 544.0 | 1.0 | 1299.03 | 1353.66 | 0.54 | 0.99 | blend_diful_2025-05-01 | n/a | | rob_ab_test | 10129 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-01 | blended | | |
rirv938 | 1 | 545.0 | 1.0 | 1298.93 | 1353.66 | 0.53 | 0.99 | rirv938-gy-rerank-grpo-_99051_v1 | 24B | rirv938/gy_rerank_grpo_cp624_98ff_b35_r1_merged | rirv938-gy-rerank-grpo-_99051_v1 | 7463 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/gy_rerank_grpo_c | 2025-07-03 | single | 1.56 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 546.0 | 1.0 | 1298.92 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_98044_v1 | 13B | rirv938/anthropic_grpo_40k_cp148_95ff_6ww_v2_merged | rirv938-anthropic-grpo-_98044_v1 | 6952 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.61 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 547.0 | 1.0 | 1298.9 | 1353.66 | 0.57 | 0.99 | rirv938-1000-sim-100p-0_76073_v1 | 24B | rirv938/1000_sim_100p_0ff_rirv938_mistral_24b_lex__1090_v2_cp372_v9_merged | rirv938-1000-sim-100p-0_76073_v1 | 7514 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/1000_sim_100p_0f | 2025-04-21 | single | 1.44 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 548.0 | 1.0 | 1298.86 | 1353.66 | 0.54 | 0.99 | rirv938-gy-rerank-grpo-_87392_v1 | 24B | rirv938/gy_rerank_grpo_cp312_98ff_b35_r1_merged | rirv938-gy-rerank-grpo-_87392_v1 | 7439 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/gy_rerank_grpo_c | 2025-07-03 | single | 1.62 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 549.0 | 1.0 | 1298.81 | 1353.66 | 0.56 | 0.99 | rirv938-prefgrok-r2-cp62_5963_v2 | 24B | rirv938/prefgrok_r2_cp624_98ff_b5_merged | rirv938-prefgrok-r2-cp62_5963_v2 | 8377 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_r2_cp62 | 2025-07-09 | single | 1.36 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 550.0 | 1.0 | 1298.79 | 1353.66 | 0.54 | 0.99 | rirv938-mistral-24b-base_5319_v1 | 24B | rirv938/mistral_24b_base_2_dpo_40k_95w_pref_25w_swear_2500_v2 | rirv938-mistral-24b-base_5319_v1 | 10819 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_base | 2025-03-06 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 551.0 | 1.0 | 1298.73 | 1353.66 | 0.6 | 0.99 | rirv938-mistral-24b-rou_41210_v2 | 24B | rirv938/mistral_24b_round_2_dpo_40k_70w_pref_16w_swear_2500_v2 | rirv938-mistral-24b-rou_41210_v2 | 8916 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-07 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 552.0 | 1.0 | 1298.68 | 1353.66 | 0.54 | 0.99 | function_nilun_2025-02-27 | | | retune_with_base | 7653 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-02-27 | single | | |
rirv938 | 1 | 553.0 | 1.0 | 1298.67 | 1353.66 | 0.42 | 0.99 | rirv938-b4-98p-2ff-rirv9_6187_v1 | 24B | rirv938/b4_98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp624_v3 | rirv938-b4-98p-2ff-rirv9_6187_v1 | 7431 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/b4_98p_2ff_rirv9 | 2025-03-28 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 554.0 | 1.0 | 1298.6 | 1353.66 | 0.53 | 0.99 | rirv938-datamix-cp624-98_9661_v1 | 24B | rirv938/datamix_cp624_98ff_b35_r1_reformat_high_quality_merged | rirv938-datamix-cp624-98_9661_v1 | 11103 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/datamix_cp624_98 | 2025-07-08 | single | 1.32 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 555.0 | 1.0 | 1298.57 | 1353.66 | 0.5 | 0.99 | rirv938-99p-1ff-nischayd_7844_v1 | 24B | rirv938/99p_1ff_nischaydnk_exp14_exp9dp_94555_v6_cp500_merged | rirv938-99p-1ff-nischayd_7844_v1 | 12480 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/99p_1ff_nischayd | 2025-06-08 | single | | |
rirv938 | 1 | 556.0 | 1.0 | 1298.54 | 1353.66 | 0.5 | 0.99 | chaiml-mistral31-24b-s_69496_v11 | 24B | ChaiML/mistral31-24b-simpoexp1-s1-new-sft-retryv2top20lex-2e | chaiml-mistral31-24b-s_69496_v11 | 6396 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/mistral31-24b-sim | 2025-06-17 | single | | |
rirv938 | 1 | 557.0 | 1.0 | 1298.5 | 1353.66 | 0.53 | 0.99 | rirv938-mistral-24b-bas_90162_v1 | 24B | rirv938/mistral_24b_base_2_dpo_40k_95w_pref_1250_v2 | rirv938-mistral-24b-bas_90162_v1 | 7764 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_base | 2025-03-05 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 558.0 | 1.0 | 1298.46 | 1353.66 | 0.56 | 0.99 | chaiml-slerp-grpo-cp312_10606_v1 | 24B | ChaiML/slerp_grpo_cp312_96ff_b4_r1_lr3_merged | chaiml-slerp-grpo-cp312_10606_v1 | 5722 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerp_grpo_cp312_ | 2025-05-30 | single | | |
rirv938 | 1 | 560.0 | 1.0 | 1298.43 | 1353.66 | 0.55 | 0.99 | rirv938-dpo-to-compare-_12851_v1 | 24B | rirv938/dpo_to_compare_to_grpo_10k_cp310_merged | rirv938-dpo-to-compare-_12851_v1 | 6449 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/dpo_to_compare_t | 2025-04-25 | single | 1.46 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 560.0 | 1.0 | 1298.43 | 1353.66 | 0.0 | 0.99 | rirv938-anthropic-beta-_64925_v1 | 13B | rirv938/anthropic_beta_2_40k_2496_bo16_v2 | rirv938-anthropic-beta-_64925_v1 | 10724 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-29 | single | 2.97 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 560.0 | 1.0 | 1298.43 | 1353.66 | 0.48 | 0.99 | rirv938-100p-0ff-rirv93_43678_v1 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_oai_77698_v2_cp748_merged | rirv938-100p-0ff-rirv93_43678_v1 | 6266 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-18 | single | 0.63 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 562.0 | 1.0 | 1298.39 | 1353.66 | 0.55 | 0.99 | chaiml-gy-exp61-dpo-exp_29395_v3 | 24B | ChaiML/gy-exp61-dpo-exp32ep8s2-gy-datamix-v2.5-orig-safe-grok-rerank-agreement-ep1 | chaiml-gy-exp61-dpo-exp_29395_v3 | 5606 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/gy-exp61-dpo-exp3 | 2025-07-03 | single | 1.62 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 563.0 | 1.0 | 1298.36 | 1353.66 | 0.55 | 0.99 | rirv938-mistral-12b-dpo_13301_v1 | 13B | rirv938/mistral_12b_dpo_40k_1187_64_output_tokens_v2 | rirv938-mistral-12b-dpo_13301_v1 | 5584 | 61115860 | 0.56 | 0.65 | basic | | 8.0 | 768.0 | 96.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.03 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 564.5 | 1.0 | 1298.32 | 1353.66 | 0.5 | 0.99 | rirv938-simp-grpo-cp312_54334_v1 | 24B | rirv938/simp_grpo_cp312_96ff_b3_r1_merged | rirv938-simp-grpo-cp312_54334_v1 | 9751 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp312_ | 2025-06-11 | single | | |
rirv938 | 1 | 564.5 | 1.0 | 1298.32 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-2_43413_v3 | 13B | rirv938/anthropic_40k_2496_bo8_85w_b4_l1_v2 | rirv938-anthropic-40k-2_43413_v3 | 12851 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2025-01-01 | single | 1.67 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 566.0 | 1.0 | 1298.31 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-4_2727_v1 | 13B | rirv938/anthropic_grpo_40k_cp888_95ff_20ww2_merged | rirv938-anthropic-grpo-4_2727_v1 | 6926 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-14 | single | 1.62 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 567.0 | 1.0 | 1298.29 | 1353.66 | 0.53 | 0.99 | rirv938-20k-100p-0ff-ri_70659_v7 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp468_merged | rirv938-20k-100p-0ff-ri_70659_v7 | 7623 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-16 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 568.0 | 1.0 | 1298.28 | 1353.66 | 0.49 | 0.99 | rirv938-mistral-24b-rou_62864_v1 | 24B | rirv938/mistral_24b_round_2_b_dpo_40k_95w_pref_2500_v2 | rirv938-mistral-24b-rou_62864_v1 | 9982 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-05 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 569.0 | 1.0 | 1298.26 | 1353.66 | 0.53 | 0.99 | chaiml-20250611-retune-_50947_v1 | 8B | ChaiML/20250611_retune_long_user_messages | chaiml-20250611-retune-_50947_v1 | 8545 | 61115860 | 0.52 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | ChaiML/20250611_retune_l | 2025-06-11 | single | | |
rirv938 | 1 | 570.0 | 1.0 | 1298.24 | 1353.66 | 0.57 | 0.99 | rirv938-grpo-to-compare-_1872_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp78_with_ff_merged | rirv938-grpo-to-compare-_1872_v1 | 8600 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-28 | single | 1.43 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 571.0 | 1.0 | 1298.22 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-2_69835_v2 | 13B | rirv938/anthropic_40k_2496_bo8_85w_b4_l2_v2 | rirv938-anthropic-40k-2_69835_v2 | 12295 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2025-01-01 | single | 1.7 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 572.0 | 1.0 | 1298.21 | 1353.66 | 0.54 | 0.99 | function_lemof_2025-04-21 | | | dpo_data_collection | 7852 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-04-21 | single | | |
rirv938 | 1 | 573.0 | 1.0 | 1298.19 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp62_55821_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b4_r1_lr3_merged | rirv938-slerp-grpo-cp62_55821_v1 | 5477 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-23 | single | | |
rirv938 | 1 | 574.0 | 1.0 | 1298.08 | 1353.66 | 0.57 | 0.99 | rirv938-prefgrok-r2-cp3_29730_v1 | 24B | rirv938/prefgrok_r2_cp312_98ff_b5_merged | rirv938-prefgrok-r2-cp3_29730_v1 | 8747 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_r2_cp31 | 2025-07-08 | single | 1.36 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 575.5 | 1.0 | 1298.04 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp31_93207_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b3_r1_merged | rirv938-slerp-grpo-cp31_93207_v1 | 8335 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-06-09 | single | | |
rirv938 | 1 | 575.5 | 1.0 | 1298.04 | 1353.66 | 0.52 | 0.99 | blend_beris_2025-05-02 | n/a | | rob_ab_test | 20532 | 61115860 | 0.53 | 0.65 | blend | | | | | | | 2025-05-02 | blended | | |
rirv938 | 1 | 577.0 | 1.0 | 1298.03 | 1353.66 | 0.47 | 0.99 | rirv938-mistral-24b-dpo_42604_v1 | 24B | rirv938/mistral_24b_dpo_kl_10k_beta2_1560_v3 | rirv938-mistral-24b-dpo_42604_v1 | 8307 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-25 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 578.0 | 1.0 | 1297.98 | 1353.66 | 0.56 | 0.99 | rirv938-tune-mistral-gr_80586_v1 | 24B | rirv938/tune_mistral_grpo_cp62_92ff_v2_merged | rirv938-tune-mistral-gr_80586_v1 | 7468 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-04-29 | single | 1.71 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 579.0 | 1.0 | 1297.97 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_12207_v1 | 13B | rirv938/anthropic_grpo_40k_cp156_96ff_new_rm_b5_merged | rirv938-anthropic-grpo-_12207_v1 | 7979 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 580.0 | 1.0 | 1297.94 | 1353.66 | 0.51 | 0.99 | blend_midaf_2025-05-15 | n/a | | rob_ab_test | 6266 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-15 | blended | | |
rirv938 | 1 | 581.0 | 1.0 | 1297.89 | 1353.66 | 0.57 | 0.99 | rirv938-prefgrok-cp312-_47258_v1 | 24B | rirv938/prefgrok_cp312_98ff_b35_r1_reformat_high_quality_merged | rirv938-prefgrok-cp312-_47258_v1 | 6975 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_cp312_9 | 2025-07-07 | single | 1.32 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 582.0 | 1.0 | 1297.88 | 1353.66 | 0.53 | 0.99 | rirv938-0sw-99p-1ff-rir_73127_v1 | 24B | rirv938/0sw_99p_1ff_rirv938_mistral_24b_dpo_43074_v1_cp156_v3 | rirv938-0sw-99p-1ff-rir_73127_v1 | 6666 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_99p_1ff_rirv | 2025-03-25 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 583.0 | 1.0 | 1297.86 | 1353.66 | 0.58 | 0.99 | function_noget_2025-02-24 | | | retune_with_base | 6577 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-02-24 | single | | |
rirv938 | 1 | 584.0 | 1.0 | 1297.83 | 1353.66 | 0.51 | 0.99 | rirv938-20k-100p-0ff-ri_70659_v2 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp468_merged | rirv938-20k-100p-0ff-ri_70659_v2 | 6516 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-16 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 585.0 | 1.0 | 1297.81 | 1353.66 | 0.5 | 0.99 | rirv938-100p-0ff-rirv93_42333_v1 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_oai_77698_v1_cp748_merged | rirv938-100p-0ff-rirv93_42333_v1 | 6437 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-18 | single | 0.64 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 586.0 | 1.0 | 1297.69 | 1353.66 | 0.57 | 0.99 | chaiml-panflute-v2-rirv_49668_v1 | 24B | ChaiML/panflute_v2_rirv938_20250423 | chaiml-panflute-v2-rirv_49668_v1 | 12188 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/panflute_v2_rirv9 | 2025-04-22 | single | 1.46 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 587.0 | 1.0 | 1297.67 | 1353.66 | 0.58 | 0.99 | rirv938-mistral-24b-rou_70379_v2 | 24B | rirv938/mistral_24b_round_3_dpo_40k_65w_pref_10w_swear_2500_v2 | rirv938-mistral-24b-rou_70379_v2 | 11952 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-08 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 588.0 | 1.0 | 1297.65 | 1353.66 | 0.53 | 0.99 | blend_mulos_2025-06-12 | n/a | | rob_ab_test | 8766 | 61115860 | 0.54 | 0.65 | blend | | | | | | | 2025-06-11 | blended | | |
rirv938 | 1 | 589.0 | 1.0 | 1297.64 | 1353.66 | 0.52 | 0.99 | blend_rumum_2025-05-15 | n/a | | rob_ab_test | 5877 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-15 | blended | | |
rirv938 | 1 | 590.0 | 1.0 | 1297.6 | 1353.66 | 0.56 | 0.99 | rirv938-tune-mistral-gr_43026_v1 | 24B | rirv938/tune_mistral_grpo_cp888_92ff_v3_run3_merged | rirv938-tune-mistral-gr_43026_v1 | 7604 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-04-30 | single | 1.74 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 591.0 | 1.0 | 1297.55 | 1353.66 | 0.52 | 0.99 | rirv938-snug-grpo-40k-c_63788_v2 | 13B | rirv938/snug_grpo_40k_cp1184_93ff_b_merged | rirv938-snug-grpo-40k-c_63788_v2 | 6337 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/snug_grpo_40k_cp | 2025-05-01 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 592.0 | 1.0 | 1297.53 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-40k-936-v2_v1 | 13B | rirv938/nitral_40k_936_v2 | rirv938-nitral-40k-936-v2_v1 | 16867 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_936_v | 2024-12-27 | single | 2.93 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 593.5 | 1.0 | 1297.51 | 1353.66 | 0.51 | 0.99 | rirv938-mistral-24b-dpo_18325_v1 | 24B | rirv938/mistral_24b_dpo_kl_40k_beta4_5000_v3 | rirv938-mistral-24b-dpo_18325_v1 | 6337 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-24 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 593.5 | 1.0 | 1297.51 | 1353.66 | 0.53 | 0.99 | blend_tules_2025-05-01 | n/a | | rob_ab_test | 10253 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-01 | blended | | |
rirv938 | 1 | 595.0 | 1.0 | 1297.48 | 1353.66 | 0.53 | 0.99 | rirv938-datamix-cp312-9_93070_v1 | 24B | rirv938/datamix_cp312_98ff_b35_r1_reformat_high_quality_merged | rirv938-datamix-cp312-9_93070_v1 | 10774 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/datamix_cp312_98 | 2025-07-08 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 596.0 | 1.0 | 1297.39 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-18k-837-v2_v1 | 13B | rirv938/nitral_18k_837_v2 | rirv938-nitral-18k-837-v2_v1 | 27844 | 61115860 | 0.55 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_18k_837_v | 2024-12-27 | single | 2.93 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 597.0 | 1.0 | 1297.36 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-18k-1116-v2_v1 | 13B | rirv938/nitral_18k_1116_v2 | rirv938-nitral-18k-1116-v2_v1 | 26443 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_18k_1116_ | 2024-12-27 | single | 2.95 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 598.0 | 1.0 | 1297.25 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-3_48066_v1 | 13B | rirv938/anthropic_40k_3744_bo8_85w_b4_l1_v2 | rirv938-anthropic-40k-3_48066_v1 | 10689 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_37 | 2024-12-31 | single | 1.76 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 599.0 | 1.0 | 1297.24 | 1353.66 | 0.54 | 0.99 | function_gihor_2025-04-18 | | | dpo_data_collection | 7979 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-04-18 | single | | |
rirv938 | 1 | 600.0 | 1.0 | 1297.16 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-beta-4-4_29933_v1 | 13B | rirv938/nitral_beta_4_40k_2496_v2 | rirv938-nitral-beta-4-4_29933_v1 | 30487 | 61115860 | 0.55 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_beta_4_40 | 2024-12-27 | single | 2.94 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 601.0 | 1.0 | 1297.14 | 1353.66 | 0.57 | 0.99 | rirv938-prefgrok-cp624-_38902_v1 | 24B | rirv938/prefgrok_cp624_98ff_b35_r1_reformat_merged | rirv938-prefgrok-cp624-_38902_v1 | 7969 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_cp624_9 | 2025-07-07 | single | 1.29 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 602.0 | 1.0 | 1297.08 | 1353.66 | 0.57 | 0.99 | rirv938-prefgrok-cp624-_37030_v1 | 24B | rirv938/prefgrok_cp624_98ff_b35_r1_reformat_high_quality_merged | rirv938-prefgrok-cp624-_37030_v1 | 6984 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_cp624_9 | 2025-07-07 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 603.0 | 1.0 | 1296.99 | 1353.66 | 0.57 | 0.99 | rirv938-tune-mistral-gr_71092_v1 | 24B | rirv938/tune_mistral_grpo_cp296_92ff_v3_run_merged | rirv938-tune-mistral-gr_71092_v1 | 9277 | 61115860 | 0.48 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-04-30 | single | 1.75 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 604.0 | 1.0 | 1296.92 | 1353.66 | 0.57 | 0.99 | chaiml-slerp-grpo-cp312_20135_v3 | 24B | ChaiML/slerp_grpo_cp312_96ff_b6_r1_merged | chaiml-slerp-grpo-cp312_20135_v3 | 5919 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerp_grpo_cp312_ | 2025-05-31 | single | | |
rirv938 | 1 | 605.0 | 1.0 | 1296.91 | 1353.66 | 0.51 | 0.99 | chaiml-mistral31-24b-s_69496_v18 | 24B | ChaiML/mistral31-24b-simpoexp1-s1-new-sft-retryv2top20lex-2e | chaiml-mistral31-24b-s_69496_v18 | 9984 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/mistral31-24b-sim | 2025-07-08 | single | 1.63 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 606.0 | 1.0 | 1296.88 | 1353.66 | 0.53 | 0.99 | chaiml-20250611-retune-_48497_v2 | 8B | ChaiML/20250611_retune_subscribed | chaiml-20250611-retune-_48497_v2 | 8835 | 61115860 | 0.52 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | ChaiML/20250611_retune_s | 2025-06-11 | single | | |
rirv938 | 1 | 607.0 | 1.0 | 1296.85 | 1353.66 | 0.55 | 0.99 | blend_behib_2025-04-14 | n/a | | rob_ab_test | 7433 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-04-14 | blended | | |
rirv938 | 1 | 608.0 | 1.0 | 1296.83 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-4_71094_v1 | 13B | rirv938/anthropic_40k_4992_bo8_85w_b4_l1_v2 | rirv938-anthropic-40k-4_71094_v1 | 15023 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_49 | 2024-12-31 | single | 1.74 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 609.0 | 1.0 | 1296.75 | 1353.66 | 0.62 | 0.99 | rirv938-96p-4ff-chaiml-_65011_v1 | 24B | rirv938/96p_4ff_chaiml_slerpv5_mistral3_24540_v2_cp484_merged | rirv938-96p-4ff-chaiml-_65011_v1 | 20206 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_chaiml_s | 2025-06-07 | single | | |
rirv938 | 1 | 610.0 | 1.0 | 1296.72 | 1353.66 | 0.55 | 0.99 | blend_nibul_2025-04-14 | n/a | | rob_ab_test | 5702 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-04-14 | blended | | |
rirv938 | 1 | 611.0 | 1.0 | 1296.58 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_53872_v1 | 13B | rirv938/anthropic_grpo_40k_cp234_95ff_baseline_merged | rirv938-anthropic-grpo-_53872_v1 | 6384 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.47 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 612.0 | 1.0 | 1296.54 | 1353.66 | 0.51 | 0.99 | chaiml-gy-exp63-dpo-exp_33117_v3 | 24B | ChaiML/gy-exp63-dpo-exp32ep8s2-pref-grok3-sub-nis-majib-30jun-ep1 | chaiml-gy-exp63-dpo-exp_33117_v3 | 6195 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/gy-exp63-dpo-exp3 | 2025-07-02 | single | 1.62 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 613.0 | 1.0 | 1296.46 | 1353.66 | 0.49 | 0.99 | rirv938-simp-grpo-cp156_13555_v1 | 24B | rirv938/simp_grpo_cp156_96ff_b3_r1_12m_US_merged | rirv938-simp-grpo-cp156_13555_v1 | 8595 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp156_ | 2025-06-30 | single | 1.62 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 614.0 | 1.0 | 1296.39 | 1353.66 | 0.56 | 0.99 | rinen0721-dpo-0130-cp3000_v16 | 13B | rinen0721/dpo-0130-cp3000 | rinen0721-dpo-0130-cp3000_v16 | 7453 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rinen0721/dpo-0130-cp300 | 2025-05-15 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 615.5 | 1.0 | 1296.38 | 1353.66 | 0.45 | 0.99 | rirv938-b4-98p-2ff-rirv_55455_v1 | 24B | rirv938/b4_98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp312_v3 | rirv938-b4-98p-2ff-rirv_55455_v1 | 6400 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/b4_98p_2ff_rirv9 | 2025-03-28 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 615.5 | 1.0 | 1296.38 | 1353.66 | 0.51 | 0.99 | chaiml-anthropic-40k-24_11629_v8 | 13B | ChaiML/anthropic_40k_2496_bo8_85w_b4_l1_merged | chaiml-anthropic-40k-24_11629_v8 | 6508 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/anthropic_40k_249 | 2025-05-14 | single | 1.57 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 617.5 | 1.0 | 1296.27 | 1353.66 | 0.54 | 0.99 | rirv938-groksyn-grpo-cp_67088_v2 | 24B | rirv938/groksyn_grpo_cp312_98ff_b35_r1_merged | rirv938-groksyn-grpo-cp_67088_v2 | 8355 | 61115860 | 0.51 | 0.65 | basic | | 6.0 | 1536.0 | 64.0 | MistralForCausalLM | rirv938/groksyn_grpo_cp3 | 2025-07-07 | single | 1.08 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 617.5 | 1.0 | 1296.27 | 1353.66 | 0.0 | 0.99 | function_lihef_2025-06-25 | | | dpo_data_collection | 1720 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-06-25 | single | | |
rirv938 | 1 | 619.0 | 1.0 | 1296.19 | 1353.66 | 0.6 | 0.99 | rirv938-mistral-24b-bas_75050_v1 | 24B | rirv938/mistral_24b_base_2_dpo_40k_65w_pref_16w_swear_2500_v2 | rirv938-mistral-24b-bas_75050_v1 | 13206 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_base | 2025-03-07 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 620.5 | 1.0 | 1296.15 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-1_20446_v1 | 13B | rirv938/anthropic_40k_1248_bo8_80w_no_filter_v2 | rirv938-anthropic-40k-1_20446_v1 | 24194 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_12 | 2025-01-01 | single | 1.68 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 620.5 | 1.0 | 1296.15 | 1353.66 | 0.55 | 0.99 | chaiml-0sw-95p-5ff-rine_63828_v6 | 13B | ChaiML/0sw_95p_5ff_rinen0721_dpo_0130_cp3000_v8_merged | chaiml-0sw-95p-5ff-rine_63828_v6 | 5632 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/0sw_95p_5ff_rinen | 2025-05-21 | single | | |
rirv938 | 1 | 622.0 | 1.0 | 1296.12 | 1353.66 | 0.53 | 0.99 | rirv938-groksyn-r2-cp312_2112_v1 | 24B | rirv938/groksyn_r2_cp312_98ff_b4_merged | rirv938-groksyn-r2-cp312_2112_v1 | 5561 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/groksyn_r2_cp312 | 2025-07-08 | single | 1.37 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 623.0 | 1.0 | 1296.08 | 1353.66 | 0.53 | 0.99 | rirv938-groksyn-grpo-cp_93910_v1 | 24B | rirv938/groksyn_grpo_cp624_98ff_b35_r1_reformat_merged | rirv938-groksyn-grpo-cp_93910_v1 | 6203 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/groksyn_grpo_cp6 | 2025-07-07 | single | 1.37 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 624.0 | 1.0 | 1296.06 | 1353.66 | 0.55 | 0.99 | blend_habos_2025-05-01 | n/a | | rob_ab_test | 10420 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-01 | blended | | |
rirv938 | 1 | 625.0 | 1.0 | 1296.01 | 1353.66 | 0.6 | 0.99 | rirv938-mistral-24b-grp_67535_v1 | 24B | rirv938/mistral_24b_grpo_40k_cp888_92ff_ww_merged | rirv938-mistral-24b-grp_67535_v1 | 5982 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-05-15 | single | 1.71 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 626.0 | 1.0 | 1295.96 | 1353.66 | 0.45 | 0.99 | rirv938-0sw-98p-2ff-rir_54684_v1 | 24B | rirv938/0sw_98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp312_v2 | rirv938-0sw-98p-2ff-rir_54684_v1 | 8268 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_98p_2ff_rirv | 2025-03-26 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 627.0 | 1.0 | 1295.95 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_90974_v1 | 13B | rirv938/anthropic_grpo_40k_cp888_95ff_20ww_merged | rirv938-anthropic-grpo-_90974_v1 | 6160 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.59 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 628.0 | 1.0 | 1295.87 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-2_57918_v1 | 13B | rirv938/anthropic_40k_2496_bo8_85w_b4_2xlora_2xlr_v2 | rirv938-anthropic-40k-2_57918_v1 | 12640 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2025-01-01 | single | 1.8 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 629.5 | 1.0 | 1295.85 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-40k-2500_91342_v1 | 13B | rirv938/nitral_40k_2500_13ff_40w_bo32_no_swearing_v2 | rirv938-nitral-40k-2500_91342_v1 | 6948 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_2500_ | 2025-02-03 | single | | |
rirv938 | 1 | 629.5 | 1.0 | 1295.85 | 1353.66 | 0.54 | 0.99 | function_japut_2025-05-22 | | | dpo_data_collection | 7894 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-05-21 | single | | |
rirv938 | 1 | 631.0 | 1.0 | 1295.82 | 1353.66 | 0.52 | 0.99 | rirv938-anthropic-grpo-_62054_v1 | 13B | rirv938/anthropic_grpo_40k_cp296_95ff_60ww_merged | rirv938-anthropic-grpo-_62054_v1 | 7014 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-14 | single | 1.64 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 632.0 | 1.0 | 1295.79 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp62_67411_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b8_r1_merged | rirv938-slerp-grpo-cp62_67411_v1 | 7676 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-05-24 | single | | |
rirv938 | 1 | 633.0 | 1.0 | 1295.75 | 1353.66 | 0.58 | 0.99 | rirv938-mistral-12b-dpo_75616_v1 | 13B | rirv938/mistral_12b_dpo_40k_2374_96_output_tokens_v2 | rirv938-mistral-12b-dpo_75616_v1 | 6043 | 61115860 | 0.59 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.55 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 634.0 | 1.0 | 1295.74 | 1353.66 | 0.54 | 0.99 | function_mesam_2025-05-22 | | | dpo_data_collection | 5409 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-05-21 | single | | |
rirv938 | 1 | 635.0 | 1.0 | 1295.73 | 1353.66 | 0.55 | 0.99 | chaiml-0sw-95p-5ff-rine_63828_v3 | 13B | ChaiML/0sw_95p_5ff_rinen0721_dpo_0130_cp3000_v8_merged | chaiml-0sw-95p-5ff-rine_63828_v3 | 5748 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/0sw_95p_5ff_rinen | 2025-04-28 | single | 1.35 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 636.0 | 1.0 | 1295.71 | 1353.66 | 0.59 | 0.99 | rirv938-mistral-24b-rou_41210_v3 | 24B | rirv938/mistral_24b_round_2_dpo_40k_70w_pref_16w_swear_2500_v2 | rirv938-mistral-24b-rou_41210_v3 | 8997 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-07 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 637.0 | 1.0 | 1295.59 | 1353.66 | 0.54 | 0.99 | function_legor_2025-02-27 | | | retune_with_base | 6093 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-02-27 | single | | |
rirv938 | 1 | 638.0 | 1.0 | 1295.58 | 1353.66 | 0.52 | 0.99 | blend_puton_2025-05-15 | n/a | | rob_ab_test | 7480 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-15 | blended | | |
rirv938 | 1 | 639.0 | 1.0 | 1295.57 | 1353.66 | 0.44 | 0.99 | rirv938-mistral-24b-dpo_36894_v1 | 24B | rirv938/mistral_24b_dpo_kl_10k_beta1_1560_v3 | rirv938-mistral-24b-dpo_36894_v1 | 9116 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-25 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 640.0 | 1.0 | 1295.49 | 1353.66 | 0.58 | 0.99 | chaiml-nitral-beta-4-40_74489_v4 | 13B | ChaiML/nitral_beta_4_40k_2496_v2 | chaiml-nitral-beta-4-40_74489_v4 | 5901 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/nitral_beta_4_40k | 2025-01-30 | single | | |
rirv938 | 1 | 641.0 | 1.0 | 1295.47 | 1353.66 | 0.55 | 0.99 | rinen0721-dpo-0130-cp3000_v18 | 13B | rinen0721/dpo-0130-cp3000 | rinen0721-dpo-0130-cp3000_v18 | 6698 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rinen0721/dpo-0130-cp300 | 2025-05-21 | single | | |
rirv938 | 1 | 642.0 | 1.0 | 1295.44 | 1353.66 | 0.54 | 0.99 | rirv938-20250331-reward_29517_v1 | 8B | rirv938/20250331_reward_ablation_random_512_old | rirv938-20250331-reward_29517_v1 | 9256 | 61115860 | 0.52 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250331_reward_ | 2025-03-31 | single | | |
rirv938 | 1 | 643.0 | 1.0 | 1295.39 | 1353.66 | 0.57 | 0.99 | rirv938-grpo-to-compare-_1872_v2 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp78_with_ff_merged | rirv938-grpo-to-compare-_1872_v2 | 7981 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-28 | single | 1.47 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 644.0 | 1.0 | 1295.31 | 1353.66 | 0.57 | 0.99 | function_kurot_2025-04-20 | | | dpo_data_collection | 6546 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-04-19 | single | | |
rirv938 | 1 | 645.0 | 1.0 | 1295.3 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-2_57918_v3 | 13B | rirv938/anthropic_40k_2496_bo8_85w_b4_2xlora_2xlr_v2 | rirv938-anthropic-40k-2_57918_v3 | 19589 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2025-01-01 | single | 1.68 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 646.0 | 1.0 | 1295.25 | 1353.66 | 0.53 | 0.99 | function_rifal_2025-06-25 | | | dpo_data_collection | 7930 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-06-25 | single | | |
rirv938 | 1 | 647.0 | 1.0 | 1295.2 | 1353.66 | 0.53 | 0.99 | blend_dubes_2025-07-09 | n/a | | rob_ab_test | 6551 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-07-09 | blended | | |
rirv938 | 1 | 648.0 | 1.0 | 1295.15 | 1353.66 | 0.0 | 0.99 | chaiml-llama-8b-multih_78780_v28 | 8B | ChaiML/llama_8b_multihead_204m_512_v3_tokens_step_398208 | chaiml-llama-8b-multih_78780_v28 | 5392 | 61115860 | 0.55 | 0.65 | basic | | 1.0 | 2048.0 | 1.0 | MultiHeadLlamaClassifier | ChaiML/llama_8b_multihea | 2025-02-13 | single | | |
rirv938 | 1 | 649.0 | 1.0 | 1295.14 | 1353.66 | 0.53 | 0.99 | blend_bojit_2025-05-15 | n/a | | rob_ab_test | 5914 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-15 | blended | | |
rirv938 | 1 | 650.0 | 1.0 | 1295.07 | 1353.66 | 0.55 | 0.99 | blend_legal_2025-04-03 | n/a | | rob_ab_test | 5912 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-04-03 | blended | | |
rirv938 | 1 | 651.0 | 1.0 | 1295.06 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_90264_v1 | 13B | rirv938/anthropic_grpo_40k_cp1716_96ff_new_rm_b5_merged | rirv938-anthropic-grpo-_90264_v1 | 5682 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-20 | single | | |
rirv938 | 1 | 652.0 | 1.0 | 1294.99 | 1353.66 | 0.53 | 0.99 | chaiml-exp14-exp9dpoft_65674_v14 | 24B | ChaiML/exp14-exp9DPOFt-chaidatav1dpo6k-24B | chaiml-exp14-exp9dpoft_65674_v14 | 10124 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp14-exp9DPOFt-c | 2025-06-08 | single | | |
rirv938 | 1 | 653.5 | 1.0 | 1294.9 | 1353.66 | 0.51 | 0.99 | rirv938-snug-grpo-40k-c_14141_v1 | 13B | rirv938/snug_grpo_40k_cp888_93ff_b_merged | rirv938-snug-grpo-40k-c_14141_v1 | 5543 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/snug_grpo_40k_cp | 2025-05-01 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 653.5 | 1.0 | 1294.9 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-beta-40k_87408_v1 | 13B | rirv938/nitral_beta_40k_2496_v2 | rirv938-nitral-beta-40k_87408_v1 | 14678 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_beta_40k_ | 2024-12-27 | single | 2.97 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 655.0 | 1.0 | 1294.86 | 1353.66 | 0.48 | 0.99 | rirv938-grpo-20250711-c_63518_v2 | 24B | rirv938/grpo_20250711_cp312_sid_mistral_24b_dpo_40k__merged | rirv938-grpo-20250711-c_63518_v2 | 8605 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_20250711_cp | 2025-07-11 | single | 1.37 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 656.0 | 1.0 | 1294.76 | 1353.66 | 0.57 | 0.99 | blend_musik_2025-04-14 | n/a | | rob_ab_test | 5668 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-04-14 | blended | | |
rirv938 | 1 | 657.0 | 1.0 | 1294.59 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-beta-40k_76570_v1 | 13B | rirv938/nitral_beta_40k_936_v2 | rirv938-nitral-beta-40k_76570_v1 | 13854 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_beta_40k_ | 2024-12-27 | single | 2.83 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 658.0 | 1.0 | 1294.45 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-2_57918_v2 | 13B | rirv938/anthropic_40k_2496_bo8_85w_b4_2xlora_2xlr_v2 | rirv938-anthropic-40k-2_57918_v2 | 11524 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2025-01-01 | single | 1.74 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 659.0 | 1.0 | 1294.41 | 1353.66 | 0.53 | 0.99 | chaiml-20250411-rob-ava-_6550_v5 | 8B | ChaiML/20250411_rob_ava_reward_300k_safety_threshold_1_2 | chaiml-20250411-rob-ava-_6550_v5 | 9712 | 61115860 | 0.51 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | ChaiML/20250411_rob_ava_ | 2025-06-11 | single | | |
rirv938 | 1 | 661.0 | 1.0 | 1294.4 | 1353.66 | 0.54 | 0.99 | blend_gilen_2025-04-23 | n/a | | rob_ab_test | 8546 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-04-23 | blended | | |
rirv938 | 1 | 661.0 | 1.0 | 1294.4 | 1353.66 | 0.58 | 0.99 | rirv938-5k-98p-2ff-rirv_32450_v1 | 24B | rirv938/5k_98p_2ff_rirv938_mistral_24b_bon_31129_v6_cp156_v4 | rirv938-5k-98p-2ff-rirv_32450_v1 | 7234 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/5k_98p_2ff_rirv9 | 2025-04-01 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 661.0 | 1.0 | 1294.4 | 1353.66 | 0.5 | 0.99 | chaiml-mistral31-24b-si_69496_v7 | 24B | ChaiML/mistral31-24b-simpoexp1-s1-new-sft-retryv2top20lex-2e | chaiml-mistral31-24b-si_69496_v7 | 8020 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/mistral31-24b-sim | 2025-06-10 | single | | |
rirv938 | 1 | 663.0 | 1.0 | 1294.39 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp31_12029_v1 | 24B | rirv938/slerp_grpo_cp312_96ff_b3_r1_20k_merged | rirv938-slerp-grpo-cp31_12029_v1 | 9459 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp312 | 2025-06-10 | single | | |
rirv938 | 1 | 664.0 | 1.0 | 1294.38 | 1353.66 | 0.55 | 0.99 | chaiml-rinen-grpo-cp312_62363_v1 | 13B | ChaiML/rinen_grpo_cp312_97ff_ava_bo1_b4_merged | chaiml-rinen-grpo-cp312_62363_v1 | 5544 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/rinen_grpo_cp312_ | 2025-05-30 | single | | |
rirv938 | 1 | 665.0 | 1.0 | 1294.28 | 1353.66 | 0.57 | 0.99 | function_tumob_2025-03-08 | | | retune_with_base | 8973 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-03-08 | single | | |
rirv938 | 1 | 666.0 | 1.0 | 1294.24 | 1353.66 | 0.54 | 0.99 | rirv938-100p-0ff-rirv93_34920_v2 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_lex__1090_v2_cp374_merged | rirv938-100p-0ff-rirv93_34920_v2 | 8515 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-21 | single | 0.63 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 667.0 | 1.0 | 1294.16 | 1353.66 | 0.55 | 0.99 | blend_dahir_2025-03-08 | n/a | | rob_ab_test | 8986 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-03-08 | blended | | |
rirv938 | 1 | 668.0 | 1.0 | 1294.15 | 1353.66 | 0.53 | 0.99 | rirv938-anthropic-grpo-_83925_v1 | 13B | rirv938/anthropic_grpo_40k_cp60_98ff_g2b15_merged | rirv938-anthropic-grpo-_83925_v1 | 9055 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-18 | single | 1.65 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 669.0 | 1.0 | 1294.12 | 1353.66 | 0.54 | 0.99 | chaiml-mistral32-sftexp1_2523_v5 | 24B | ChaiML/mistral32-sftexp1-s1-groksyn30jun-full-4e-top750 | chaiml-mistral32-sftexp1_2523_v5 | 9005 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1536.0 | 64.0 | MistralForCausalLM | ChaiML/mistral32-sftexp1 | 2025-07-07 | single | 1.02 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 670.5 | 1.0 | 1294.1 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_62301_v1 | 13B | rirv938/anthropic_grpo_40k_cp148_95ff_60ww_merged | rirv938-anthropic-grpo-_62301_v1 | 6321 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-14 | single | 1.59 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 670.5 | 1.0 | 1294.1 | 1353.66 | 0.56 | 0.99 | blend_fapum_2025-04-03 | n/a | | rob_ab_test | 6147 | 61115860 | 0.49 | 0.65 | blend | | | | | | | 2025-04-03 | blended | | |
rirv938 | 1 | 672.5 | 1.0 | 1294.06 | 1353.66 | 0.49 | 0.99 | rirv938-simp-grpo-cp624_22822_v1 | 24B | rirv938/simp_grpo_cp624_96ff_b1_r1_merged | rirv938-simp-grpo-cp624_22822_v1 | 8655 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp624_ | 2025-06-10 | single | | |
rirv938 | 1 | 672.5 | 1.0 | 1294.06 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-2_32301_v1 | 13B | rirv938/anthropic_40k_2496_bo8_85w_b4_2xlora_v2 | rirv938-anthropic-40k-2_32301_v1 | 20370 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2025-01-01 | single | 1.82 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 674.5 | 1.0 | 1294.04 | 1353.66 | 0.66 | 0.99 | rirv938-95p-5ff-rirv938_66486_v1 | 24B | rirv938/95p_5ff_rirv938_mistral_24b_oai_34522_v1_cp1000_merged | rirv938-95p-5ff-rirv938_66486_v1 | 8107 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/95p_5ff_rirv938_ | 2025-04-11 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 674.5 | 1.0 | 1294.04 | 1353.66 | 0.54 | 0.99 | rirv938-datamix-v2-cp31_32080_v1 | 24B | rirv938/datamix_v2_cp312_98ff_b35_r1_reformat_high_quality_merged | rirv938-datamix-v2-cp31_32080_v1 | 11084 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/datamix_v2_cp312 | 2025-07-08 | single | 1.35 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 676.0 | 1.0 | 1294.03 | 1353.66 | 0.57 | 0.99 | rirv938-mistral-24b-rou_85599_v1 | 24B | rirv938/mistral_24b_round_3_dpo_40k_60w_pref_10w_swear_2500_v2 | rirv938-mistral-24b-rou_85599_v1 | 10961 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-08 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 677.0 | 1.0 | 1294.02 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-4_1326_v1 | 13B | rirv938/anthropic_grpo_40k_cp148_95ff_20ww_merged | rirv938-anthropic-grpo-4_1326_v1 | 6192 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.59 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 678.5 | 1.0 | 1294.0 | 1353.66 | 0.58 | 0.99 | rirv938-mistral-24b-grp_39559_v2 | 24B | rirv938/mistral_24b_grpo_40k_cp148_95ff_merged | rirv938-mistral-24b-grp_39559_v2 | 8569 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-04-28 | single | 1.47 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 678.5 | 1.0 | 1294.0 | 1353.66 | 0.55 | 0.99 | chaiml-exp14-exp9dpoft_65674_v13 | 24B | ChaiML/exp14-exp9DPOFt-chaidatav1dpo6k-24B | chaiml-exp14-exp9dpoft_65674_v13 | 22500 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/exp14-exp9DPOFt-c | 2025-06-05 | single | | |
rirv938 | 1 | 680.0 | 1.0 | 1293.98 | 1353.66 | 0.55 | 0.99 | blend_solon_2025-04-03 | n/a | | rob_ab_test | 5505 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-04-03 | blended | | |
rirv938 | 1 | 681.0 | 1.0 | 1293.91 | 1353.66 | 0.58 | 0.99 | rirv938-v7-pref-plus-03-_7692_v1 | 13B | rirv938/v7_pref_plus_03_mistral_558_v2 | rirv938-v7-pref-plus-03-_7692_v1 | 22183 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/v7_pref_plus_03_ | 2024-12-22 | single | 1.79 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 682.0 | 1.0 | 1293.89 | 1353.66 | 0.54 | 0.99 | blend_fonuf_2025-06-12 | n/a | | rob_ab_test | 8201 | 61115860 | 0.53 | 0.65 | blend | | | | | | | 2025-06-11 | blended | | |
rirv938 | 1 | 683.5 | 1.0 | 1293.81 | 1353.66 | 0.57 | 0.99 | rirv938-yautja-cp312-98_44860_v1 | 24B | rirv938/yautja_cp312_98ff_b35_r1_reformat_high_quality_merged | rirv938-yautja-cp312-98_44860_v1 | 6419 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/yautja_cp312_98f | 2025-07-08 | single | 1.31 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 683.5 | 1.0 | 1293.81 | 1353.66 | 0.57 | 0.99 | chaiml-slerp-grpo-cp312_20135_v4 | 24B | ChaiML/slerp_grpo_cp312_96ff_b6_r1_merged | chaiml-slerp-grpo-cp312_20135_v4 | 20203 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerp_grpo_cp312_ | 2025-06-05 | single | | |
rirv938 | 1 | 685.5 | 1.0 | 1293.76 | 1353.66 | 0.54 | 0.99 | rirv938-groksyn-grpo-cp_55837_v2 | 24B | rirv938/groksyn_grpo_cp624_98ff_b35_r1_merged | rirv938-groksyn-grpo-cp_55837_v2 | 8382 | 61115860 | 0.51 | 0.65 | basic | | 6.0 | 1536.0 | 64.0 | MistralForCausalLM | rirv938/groksyn_grpo_cp6 | 2025-07-07 | single | 1.08 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 685.5 | 1.0 | 1293.76 | 1353.66 | 0.42 | 0.99 | rirv938-b4-98p-2ff-rirv_19085_v1 | 24B | rirv938/b4_98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp936_v3 | rirv938-b4-98p-2ff-rirv_19085_v1 | 8014 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/b4_98p_2ff_rirv9 | 2025-03-28 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 687.0 | 1.0 | 1293.67 | 1353.66 | 0.51 | 0.99 | rirv938-mistral-24b-dpo-_2511_v3 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_3750_instruct_l128_v2 | rirv938-mistral-24b-dpo-_2511_v3 | 7405 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-26 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 688.5 | 1.0 | 1293.6 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_24135_v1 | 13B | rirv938/anthropic_beta_2_40k_624_bo8_95w_v2 | rirv938-anthropic-beta-_24135_v1 | 17680 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 2.91 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 688.5 | 1.0 | 1293.6 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-beta-40k_32603_v1 | 13B | rirv938/nitral_beta_40k_312_v2 | rirv938-nitral-beta-40k_32603_v1 | 22227 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_beta_40k_ | 2024-12-27 | single | 2.93 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 690.0 | 1.0 | 1293.57 | 1353.66 | 0.5 | 0.99 | chaiml-bold-v1-rirv938-2_7710_v2 | 24B | ChaiML/bold_v1_rirv938_20250420 | chaiml-bold-v1-rirv938-2_7710_v2 | 9033 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/bold_v1_rirv938_2 | 2025-04-22 | single | 1.45 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 691.0 | 1.0 | 1293.5 | 1353.66 | 0.55 | 0.99 | blend_nejot_2025-04-03 | n/a | | rob_ab_test | 5955 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-04-03 | blended | | |
rirv938 | 1 | 692.5 | 1.0 | 1293.48 | 1353.66 | 0.45 | 0.99 | rirv938-b4-98p-2ff-rirv_55455_v2 | 24B | rirv938/b4_98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp312_v3 | rirv938-b4-98p-2ff-rirv_55455_v2 | 6480 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/b4_98p_2ff_rirv9 | 2025-03-28 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 692.5 | 1.0 | 1293.48 | 1353.66 | 0.53 | 0.99 | chaiml-gy-exp78-sft-gy-_32548_v3 | 24B | ChaiML/gy-exp78-sft-gy-datamix-v1-AR-ep2 | chaiml-gy-exp78-sft-gy-_32548_v3 | 11238 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/gy-exp78-sft-gy-d | 2025-07-08 | single | 1.33 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 694.0 | 1.0 | 1293.46 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-2_8422_v1 | 13B | rirv938/anthropic_beta_2_40k_1248_bo8_95w_v2 | rirv938-anthropic-beta-2_8422_v1 | 14254 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 3.0 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 695.0 | 1.0 | 1293.43 | 1353.66 | 0.49 | 0.99 | chaiml-mistral31-24b-s_69496_v16 | 24B | ChaiML/mistral31-24b-simpoexp1-s1-new-sft-retryv2top20lex-2e | chaiml-mistral31-24b-s_69496_v16 | 9087 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/mistral31-24b-sim | 2025-06-30 | single | 1.59 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 696.0 | 1.0 | 1293.4 | 1353.66 | 0.53 | 0.99 | function_lujeb_2025-02-27 | | | retune_with_base | 5681 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-02-27 | single | | |
rirv938 | 1 | 697.0 | 1.0 | 1293.36 | 1353.66 | 0.57 | 0.99 | rirv938-prefgrok-cp312-_76270_v1 | 24B | rirv938/prefgrok_cp312_98ff_b35_r1_reformat_merged | rirv938-prefgrok-cp312-_76270_v1 | 8086 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_cp312_9 | 2025-07-07 | single | 1.32 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 698.0 | 1.0 | 1293.34 | 1353.66 | 0.49 | 0.99 | rirv938-simp-grpo-cp624_97924_v1 | 24B | rirv938/simp_grpo_cp624_2ff_b35_r1_ava_rm_merged | rirv938-simp-grpo-cp624_97924_v1 | 6668 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp624_ | 2025-07-02 | single | 1.62 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 699.0 | 1.0 | 1293.33 | 1353.66 | 0.56 | 0.99 | rirv938-grpo-to-compare_36740_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp156_lr8_merged | rirv938-grpo-to-compare_36740_v1 | 10568 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-26 | single | 1.47 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 700.0 | 1.0 | 1293.32 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-_54778_v2 | 13B | rirv938/anthropic_beta_2_40k_2496_bo8_v2 | rirv938-anthropic-beta-_54778_v2 | 16308 | 61115860 | 0.55 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-29 | single | 2.92 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 701.0 | 1.0 | 1293.3 | 1353.66 | 0.52 | 0.99 | chaiml-llama-8b-multihe_54063_v4 | 8B | ChaiML/llama_8b_multihead_204m_preference | chaiml-llama-8b-multihe_54063_v4 | 11155 | 61115860 | 0.52 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | ChaiML/llama_8b_multihea | 2025-02-27 | single | | |
rirv938 | 1 | 702.0 | 1.0 | 1293.29 | 1353.66 | 0.57 | 0.99 | chaiml-slerp-grpo-cp312_10606_v2 | 24B | ChaiML/slerp_grpo_cp312_96ff_b4_r1_lr3_merged | chaiml-slerp-grpo-cp312_10606_v2 | 6249 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerp_grpo_cp312_ | 2025-05-30 | single | | |
rirv938 | 1 | 703.0 | 1.0 | 1293.25 | 1353.66 | 0.53 | 0.99 | blend_rotan_2025-04-23 | n/a | | rob_ab_test | 8357 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-04-23 | blended | | |
rirv938 | 1 | 704.0 | 1.0 | 1293.19 | 1353.66 | 0.56 | 0.99 | rirv938-100p-0ff-rirv93_49616_v1 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp156_v3 | rirv938-100p-0ff-rirv93_49616_v1 | 5830 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-02 | single | 0.76 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 705.0 | 1.0 | 1293.18 | 1353.66 | 0.59 | 0.99 | rirv938-96p-4ff-nischaydn_844_v1 | 24B | rirv938/96p_4ff_nischaydnk_exp14_exp9dp_94555_v6_cp2000_merged | rirv938-96p-4ff-nischaydn_844_v1 | 21492 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_nischayd | 2025-06-07 | single | | |
rirv938 | 1 | 706.0 | 1.0 | 1293.15 | 1353.66 | 0.54 | 0.99 | function_nahat_2025-02-27 | | | retune_with_base | 6362 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-02-27 | single | | |
rirv938 | 1 | 707.5 | 1.0 | 1293.1 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_74918_v1 | 13B | rirv938/anthropic_grpo_40k_cp1184_95ff_20ww_merged | rirv938-anthropic-grpo-_74918_v1 | 8792 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.65 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 707.5 | 1.0 | 1293.1 | 1353.66 | 0.0 | 0.99 | chaiml-llama-8b-multih_78780_v27 | 8B | ChaiML/llama_8b_multihead_204m_512_v3_tokens_step_398208 | chaiml-llama-8b-multih_78780_v27 | 5413 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 2048.0 | 1.0 | MultiHeadLlamaClassifier | ChaiML/llama_8b_multihea | 2025-02-13 | single | | |
rirv938 | 1 | 709.5 | 1.0 | 1293.09 | 1353.66 | 0.63 | 0.99 | rirv938-mistral-24b-rou_17322_v1 | 24B | rirv938/mistral_24b_round_2_dpo_40k_50w_pref_16w_swear_2500_v2 | rirv938-mistral-24b-rou_17322_v1 | 9889 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-07 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 709.5 | 1.0 | 1293.09 | 1353.66 | 0.53 | 0.99 | blend_seluk_2025-05-15 | n/a | | rob_ab_test | 6833 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-15 | blended | | |
rirv938 | 1 | 711.0 | 1.0 | 1292.97 | 1353.66 | 0.6 | 0.99 | rirv938-96p-4ff-nischay_68965_v2 | 24B | rirv938/96p_4ff_nischaydnk_exp14_exp9dp_94555_v6_cp1000_merged | rirv938-96p-4ff-nischay_68965_v2 | 20298 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_nischayd | 2025-06-07 | single | | |
rirv938 | 1 | 712.0 | 1.0 | 1292.9 | 1353.66 | 0.6 | 0.99 | rirv938-mistral-24b-dpo_28527_v1 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_3750_instruct_dpo_2_v2 | rirv938-mistral-24b-dpo_28527_v1 | 7979 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-02-23 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 713.0 | 1.0 | 1292.88 | 1353.66 | 0.58 | 0.99 | rirv938-lr-2-mistral-558-v2_v2 | 13B | rirv938/lr_2_mistral_558_v2 | rirv938-lr-2-mistral-558-v2_v2 | 21097 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/lr_2_mistral_558 | 2024-12-21 | single | 1.74 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 714.0 | 1.0 | 1292.86 | 1353.66 | 0.57 | 0.99 | rirv938-20k-100p-0ff-ri_56887_v1 | 24B | rirv938/20k_100p_0ff_rirv938_mistral_24b_bon_82623_v1_cp156_v3 | rirv938-20k-100p-0ff-ri_56887_v1 | 5608 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/20k_100p_0ff_rir | 2025-04-02 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 715.0 | 1.0 | 1292.82 | 1353.66 | 0.58 | 0.99 | rirv938-mistral-24b-grp_39559_v1 | 24B | rirv938/mistral_24b_grpo_40k_cp148_95ff_merged | rirv938-mistral-24b-grp_39559_v1 | 8663 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_grpo | 2025-04-28 | single | 1.44 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 716.5 | 1.0 | 1292.8 | 1353.66 | 0.46 | 0.99 | rirv938-0sw-99p-1ff-rir_79560_v1 | 24B | rirv938/0sw_99p_1ff_rirv938_mistral_24b_dpo_43074_v1_cp390_v3 | rirv938-0sw-99p-1ff-rir_79560_v1 | 6311 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_99p_1ff_rirv | 2025-03-25 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 716.5 | 1.0 | 1292.8 | 1353.66 | 0.52 | 0.99 | rirv938-snug-grpo-40k-c_63788_v1 | 13B | rirv938/snug_grpo_40k_cp1184_93ff_b_merged | rirv938-snug-grpo-40k-c_63788_v1 | 5582 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/snug_grpo_40k_cp | 2025-05-01 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 718.5 | 1.0 | 1292.79 | 1353.66 | 0.51 | 0.99 | rirv938-mistral-24b-rou_37562_v1 | 24B | rirv938/mistral_24b_round_2_b_dpo_40k_95w_pref_1250_v2 | rirv938-mistral-24b-rou_37562_v1 | 7585 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-05 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 718.5 | 1.0 | 1292.79 | 1353.66 | 0.58 | 0.99 | chaiml-slerpv5-mistral3_24540_v4 | 24B | ChaiML/slerpv5_mistral31_simpo_dpo_dpoold_s2 | chaiml-slerpv5-mistral3_24540_v4 | 5870 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerpv5_mistral31 | 2025-05-22 | single | | |
rirv938 | 1 | 720.0 | 1.0 | 1292.78 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_51278_v1 | 13B | rirv938/anthropic_grpo_40k_cp2368_95ff_beta6_2_2_merged | rirv938-anthropic-grpo-_51278_v1 | 9192 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-16 | single | 1.61 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 721.0 | 1.0 | 1292.76 | 1353.66 | 0.59 | 0.99 | rirv938-mistral-24b-dpo_61861_v1 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_2500_instruct_dpo_2_v2 | rirv938-mistral-24b-dpo_61861_v1 | 6294 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-02-23 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 722.0 | 1.0 | 1292.75 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_49016_v1 | 13B | rirv938/anthropic_grpo_40k_cp148_95ff_20ww2_merged | rirv938-anthropic-grpo-_49016_v1 | 6355 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-14 | single | 1.58 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 723.0 | 1.0 | 1292.74 | 1353.66 | 0.0 | 0.99 | chaiml-20250611-retune-u_1558_v2 | 8B | ChaiML/20250611_retune_US_7_to_13_seconds | chaiml-20250611-retune-u_1558_v2 | 8285 | 61115860 | 0.52 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | ChaiML/20250611_retune_U | 2025-06-11 | single | | |
rirv938 | 1 | 724.5 | 1.0 | 1292.73 | 1353.66 | 0.57 | 0.99 | rirv938-prefgrok-r2-cp62_5963_v1 | 24B | rirv938/prefgrok_r2_cp624_98ff_b5_merged | rirv938-prefgrok-r2-cp62_5963_v1 | 6408 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_r2_cp62 | 2025-07-08 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 724.5 | 1.0 | 1292.73 | 1353.66 | 0.54 | 0.99 | blend_pipar_2025-06-12 | n/a | | rob_ab_test | 10021 | 61115860 | 0.53 | 0.65 | blend | | | | | | | 2025-06-11 | blended | | |
rirv938 | 1 | 726.0 | 1.0 | 1292.72 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_49016_v2 | 13B | rirv938/anthropic_grpo_40k_cp148_95ff_20ww2_merged | rirv938-anthropic-grpo-_49016_v2 | 6470 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-14 | single | 1.58 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 727.0 | 1.0 | 1292.54 | 1353.66 | 0.53 | 0.99 | blend_hakuk_2025-05-01 | n/a | | rob_ab_test | 7077 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-05-01 | blended | | |
rirv938 | 1 | 728.0 | 1.0 | 1292.47 | 1353.66 | 0.58 | 0.99 | rirv938-nitral-40k-2500_91342_v2 | 13B | rirv938/nitral_40k_2500_13ff_40w_bo32_no_swearing_v2 | rirv938-nitral-40k-2500_91342_v2 | 8017 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_2500_ | 2025-02-03 | single | | |
rirv938 | 1 | 729.0 | 1.0 | 1292.4 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_22923_v1 | 13B | rirv938/anthropic_grpo_40k_cp444_95ff_20ww2_merged | rirv938-anthropic-grpo-_22923_v1 | 7398 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-14 | single | 1.64 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 730.0 | 1.0 | 1292.38 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-_13714_v1 | 13B | rirv938/anthropic_beta_2_40k_624_bo16_v2 | rirv938-anthropic-beta-_13714_v1 | 22361 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-29 | single | 3.03 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 731.5 | 1.0 | 1292.36 | 1353.66 | 0.5 | 0.99 | rirv938-100p-0ff-rirv938_2517_v1 | 24B | rirv938/100p_0ff_rirv938_mistral_24b_oai_77698_v2_cp374_merged | rirv938-100p-0ff-rirv938_2517_v1 | 5461 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/100p_0ff_rirv938 | 2025-04-18 | single | 0.66 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 731.5 | 1.0 | 1292.36 | 1353.66 | 0.56 | 0.99 | blend_hubul_2025-03-21 | n/a | | rob_ab_test | 6609 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-03-21 | blended | | |
rirv938 | 1 | 733.0 | 1.0 | 1292.34 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-2_43413_v2 | 13B | rirv938/anthropic_40k_2496_bo8_85w_b4_l1_v2 | rirv938-anthropic-40k-2_43413_v2 | 13845 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2025-01-01 | single | 1.78 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 734.0 | 1.0 | 1292.33 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-40k-2_12610_v1 | 13B | rirv938/anthropic_40k_2500_10w_bo32_v2 | rirv938-anthropic-40k-2_12610_v1 | 5348 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_25 | 2025-01-30 | single | | |
rirv938 | 1 | 735.5 | 1.0 | 1292.32 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-1_25268_v3 | 13B | rirv938/anthropic_40k_1248_bo8_85w_b4_2xlora_v2 | rirv938-anthropic-40k-1_25268_v3 | 13698 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_12 | 2025-01-01 | single | 1.74 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 735.5 | 1.0 | 1292.32 | 1353.66 | 0.48 | 0.99 | rirv938-0sw-99p-1ff-rir_36411_v1 | 24B | rirv938/0sw_99p_1ff_rirv938_mistral_24b_dpo_43074_v1_cp312_v3 | rirv938-0sw-99p-1ff-rir_36411_v1 | 7119 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_99p_1ff_rirv | 2025-03-25 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 737.0 | 1.0 | 1292.3 | 1353.66 | 0.47 | 0.99 | rirv938-0sw-98p-2ff-rir_34053_v1 | 24B | rirv938/0sw_98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp234_v2 | rirv938-0sw-98p-2ff-rir_34053_v1 | 8160 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_98p_2ff_rirv | 2025-03-26 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 738.0 | 1.0 | 1292.29 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-12_7347_v2 | 13B | rirv938/anthropic_40k_1248_bo8_85w_b4_2xlora_2xlr_v2 | rirv938-anthropic-40k-12_7347_v2 | 20193 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_12 | 2025-01-01 | single | 1.68 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 739.0 | 1.0 | 1292.28 | 1353.66 | 0.49 | 0.99 | rirv938-simp-grpo-cp156_10803_v1 | 24B | rirv938/simp_grpo_cp156_96ff_b1_r1_merged | rirv938-simp-grpo-cp156_10803_v1 | 8725 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/simp_grpo_cp156_ | 2025-06-10 | single | | |
rirv938 | 1 | 740.0 | 1.0 | 1292.26 | 1353.66 | 0.52 | 0.99 | chaiml-llama-8b-multihe_54063_v6 | 8B | ChaiML/llama_8b_multihead_204m_preference | chaiml-llama-8b-multihe_54063_v6 | 10839 | 61115860 | 0.51 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | ChaiML/llama_8b_multihea | 2025-02-27 | single | | |
rirv938 | 1 | 741.0 | 1.0 | 1292.24 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp62_45951_v1 | 24B | rirv938/slerp_grpo_cp624_96ff_b3_r1_merged | rirv938-slerp-grpo-cp62_45951_v1 | 8961 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp624 | 2025-06-09 | single | | |
rirv938 | 1 | 742.5 | 1.0 | 1292.22 | 1353.66 | 0.5 | 0.99 | rirv938-rinen-grpo-40k-_37852_v1 | 13B | rirv938/rinen_grpo_40k_cp888_95ff_run2_ww_merged | rirv938-rinen-grpo-40k-_37852_v1 | 7033 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_40k_c | 2025-05-15 | single | 1.36 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 742.5 | 1.0 | 1292.22 | 1353.66 | 0.51 | 0.99 | rirv938-0sw-96p-4ff-rir_63230_v1 | 24B | rirv938/0sw_96p_4ff_rirv938_mistral_24b_dpo_43074_v1_cp624_v3 | rirv938-0sw-96p-4ff-rir_63230_v1 | 6660 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_96p_4ff_rirv | 2025-03-25 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 744.0 | 1.0 | 1292.21 | 1353.66 | 0.53 | 0.99 | chaiml-gy-exp78-sft-gy-_36416_v2 | 24B | ChaiML/gy-exp78-sft-gy-datamix-v1-AR-ep6 | chaiml-gy-exp78-sft-gy-_36416_v2 | 11099 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/gy-exp78-sft-gy-d | 2025-07-08 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 745.0 | 1.0 | 1292.2 | 1353.66 | 0.51 | 0.99 | rirv938-mistral-24b-dpo_40702_v1 | 24B | rirv938/mistral_24b_dpo_kl_10k_beta4_1560_v3 | rirv938-mistral-24b-dpo_40702_v1 | 6987 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-24 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 746.0 | 1.0 | 1292.15 | 1353.66 | 0.0 | 0.99 | chaiml-llama-8b-multih_78780_v26 | 8B | ChaiML/llama_8b_multihead_204m_512_v3_tokens_step_398208 | chaiml-llama-8b-multih_78780_v26 | 7595 | 61115860 | 0.53 | 0.65 | basic | | 1.0 | 2048.0 | 1.0 | MultiHeadLlamaClassifier | ChaiML/llama_8b_multihea | 2025-02-12 | single | | |
rirv938 | 1 | 747.0 | 1.0 | 1292.13 | 1353.66 | 0.55 | 0.99 | rirv938-dpo-to-compare-_68956_v1 | 24B | rirv938/dpo_to_compare_to_grpo_10k_cp186_b2_merged | rirv938-dpo-to-compare-_68956_v1 | 8981 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/dpo_to_compare_t | 2025-04-26 | single | 1.44 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 748.5 | 1.0 | 1292.09 | 1353.66 | 0.59 | 0.99 | function_fulef_2025-03-05 | | | retune_with_base | 7840 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-03-05 | single | | |
rirv938 | 1 | 748.5 | 1.0 | 1292.09 | 1353.66 | 0.56 | 0.99 | chaiml-nemo-anthropic-_38239_v27 | 13B | ChaiML/nemo_anthropic_addict_lexical_1120_run2 | chaiml-nemo-anthropic-_38239_v27 | 7798 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/nemo_anthropic_ad | 2025-05-19 | single | | |
rirv938 | 1 | 750.5 | 1.0 | 1292.05 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_12256_v1 | 13B | rirv938/anthropic_grpo_40k_cp592_95ff_beta6_2_merged | rirv938-anthropic-grpo-_12256_v1 | 9542 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.42 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 750.5 | 1.0 | 1292.05 | 1353.66 | 0.54 | 0.99 | function_lemam_2025-06-25 | | | dpo_data_collection | 6418 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-06-25 | single | | |
rirv938 | 1 | 752.0 | 1.0 | 1292.04 | 1353.66 | 0.53 | 0.99 | rirv938-anthropic-grpo-_86434_v1 | 13B | rirv938/anthropic_grpo_40k_cp248_98ff_g8b3_merged | rirv938-anthropic-grpo-_86434_v1 | 7589 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-17 | single | 1.6 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 753.0 | 1.0 | 1292.01 | 1353.66 | 0.58 | 0.99 | rirv938-nitral-40k-2500_66631_v1 | 13B | rirv938/nitral_40k_2500_13ff_15w_bo32_old_rm_fixed_v2_v2 | rirv938-nitral-40k-2500_66631_v1 | 6286 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_2500_ | 2025-01-31 | single | | |
rirv938 | 1 | 754.5 | 1.0 | 1291.97 | 1353.66 | 0.7 | 0.99 | rirv938-20250411-reward_71496_v1 | 8B | rirv938/20250411_reward_safety_10_removed | rirv938-20250411-reward_71496_v1 | 6736 | 61115860 | 0.51 | 0.65 | basic | | 1.0 | 512.0 | 1.0 | LlamaForSequenceClassification | rirv938/20250411_reward_ | 2025-04-11 | single | | |
rirv938 | 1 | 754.5 | 1.0 | 1291.97 | 1353.66 | 0.44 | 0.99 | rirv938-0sw-98p-2ff-rir_90051_v1 | 24B | rirv938/0sw_98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp390_v2 | rirv938-0sw-98p-2ff-rir_90051_v1 | 9873 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_98p_2ff_rirv | 2025-03-26 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 756.0 | 1.0 | 1291.95 | 1353.66 | 0.53 | 0.99 | rirv938-groksyn-r2-cp62_61633_v1 | 24B | rirv938/groksyn_r2_cp624_98ff_b4_merged | rirv938-groksyn-r2-cp62_61633_v1 | 5688 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/groksyn_r2_cp624 | 2025-07-08 | single | 1.33 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 757.0 | 1.0 | 1291.94 | 1353.66 | 0.55 | 0.99 | blend_gokus_2025-03-21 | n/a | | rob_ab_test | 6359 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-03-21 | blended | | |
rirv938 | 1 | 758.5 | 1.0 | 1291.89 | 1353.66 | 0.57 | 0.99 | rirv938-prefgrok-cp312-_47258_v2 | 24B | rirv938/prefgrok_cp312_98ff_b35_r1_reformat_high_quality_merged | rirv938-prefgrok-cp312-_47258_v2 | 6897 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_cp312_9 | 2025-07-07 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 758.5 | 1.0 | 1291.89 | 1353.66 | 0.54 | 0.99 | blend_simun_2025-07-09 | n/a | | rob_ab_test | 7596 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-07-09 | blended | | |
rirv938 | 1 | 760.0 | 1.0 | 1291.86 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-2_8422_v2 | 13B | rirv938/anthropic_beta_2_40k_1248_bo8_95w_v2 | rirv938-anthropic-beta-2_8422_v2 | 13611 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 3.04 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 761.0 | 1.0 | 1291.81 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-_64925_v3 | 13B | rirv938/anthropic_beta_2_40k_2496_bo16_v2 | rirv938-anthropic-beta-_64925_v3 | 26863 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-29 | single | 2.9 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 762.0 | 1.0 | 1291.7 | 1353.66 | 0.53 | 0.99 | blend_bideb_2025-05-15 | n/a | | rob_ab_test | 7518 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-05-15 | blended | | |
rirv938 | 1 | 763.0 | 1.0 | 1291.6 | 1353.66 | 0.52 | 0.99 | rirv938-0sw-94p-6ff-rir_73377_v1 | 24B | rirv938/0sw_94p_6ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp390_v2 | rirv938-0sw-94p-6ff-rir_73377_v1 | 8998 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_94p_6ff_rirv | 2025-03-26 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 764.0 | 1.0 | 1291.58 | 1353.66 | 0.56 | 0.99 | chaiml-slerp-grpo-cp312_10606_v4 | 24B | ChaiML/slerp_grpo_cp312_96ff_b4_r1_lr3_merged | chaiml-slerp-grpo-cp312_10606_v4 | 20306 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerp_grpo_cp312_ | 2025-06-05 | single | | |
rirv938 | 1 | 765.0 | 1.0 | 1291.56 | 1353.66 | 0.57 | 0.99 | rirv938-slerp-grpo-cp54_35754_v2 | 24B | rirv938/slerp_grpo_cp546_96ff_b2_r1_20k_merged | rirv938-slerp-grpo-cp54_35754_v2 | 9672 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp546 | 2025-06-10 | single | | |
rirv938 | 1 | 766.0 | 1.0 | 1291.55 | 1353.66 | 0.58 | 0.99 | rirv938-96p-4ff-nischay_71333_v2 | 24B | rirv938/96p_4ff_nischaydnk_exp14_exp9dp_94555_v6_cp500_merged | rirv938-96p-4ff-nischay_71333_v2 | 20341 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_nischayd | 2025-06-07 | single | | |
rirv938 | 1 | 767.0 | 1.0 | 1291.53 | 1353.66 | 0.43 | 0.99 | rirv938-mistral-24b-dpo_99850_v1 | 24B | rirv938/mistral_24b_dpo_kl_10k_beta1_936_v3 | rirv938-mistral-24b-dpo_99850_v1 | 9064 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-25 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 768.0 | 1.0 | 1291.48 | 1353.66 | 0.53 | 0.99 | blend_budob_2025-05-31 | n/a | | rob_ab_test | 5664 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-31 | blended | | |
rirv938 | 1 | 769.0 | 1.0 | 1291.45 | 1353.66 | 0.52 | 0.99 | blend_jisab_2025-07-09 | n/a | | rob_ab_test | 7286 | 61115860 | 0.49 | 0.65 | blend | | | | | | | 2025-07-09 | blended | | |
rirv938 | 1 | 770.0 | 1.0 | 1291.41 | 1353.66 | 0.53 | 0.99 | function_sodeb_2025-02-27 | | | retune_with_base | 5782 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-02-27 | single | | |
rirv938 | 1 | 771.0 | 1.0 | 1291.37 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_24135_v2 | 13B | rirv938/anthropic_beta_2_40k_624_bo8_95w_v2 | rirv938-anthropic-beta-_24135_v2 | 11983 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 2.98 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 772.0 | 1.0 | 1291.28 | 1353.66 | 0.53 | 0.99 | function_demaf_2025-05-22 | | | dpo_data_collection | 8279 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-05-22 | single | | |
rirv938 | 1 | 773.0 | 1.0 | 1291.19 | 1353.66 | 0.5 | 0.99 | rirv938-mistral-24b-dpo_29487_v7 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_1250_instruct_dpo_2_v2 | rirv938-mistral-24b-dpo_29487_v7 | 7155 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-26 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 774.0 | 1.0 | 1291.16 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-2_43413_v1 | 13B | rirv938/anthropic_40k_2496_bo8_85w_b4_l1_v2 | rirv938-anthropic-40k-2_43413_v1 | 11377 | 61115860 | 0.52 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2024-12-31 | single | 1.76 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 775.0 | 1.0 | 1291.14 | 1353.66 | 0.59 | 0.99 | rirv938-96p-4ff-nischay_71333_v1 | 24B | rirv938/96p_4ff_nischaydnk_exp14_exp9dp_94555_v6_cp500_merged | rirv938-96p-4ff-nischay_71333_v1 | 8293 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_nischayd | 2025-06-07 | single | | |
rirv938 | 1 | 776.0 | 1.0 | 1291.1 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_76361_v1 | 13B | rirv938/anthropic_grpo_40k_cp120_98ff_g2b15_merged | rirv938-anthropic-grpo-_76361_v1 | 8318 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-18 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 777.0 | 1.0 | 1291.06 | 1353.66 | 0.59 | 0.99 | rirv938-96p-4ff-nischay_86528_v2 | 24B | rirv938/96p_4ff_nischaydnk_exp14_exp9dp_94555_v6_cp1500_merged | rirv938-96p-4ff-nischay_86528_v2 | 20294 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_nischayd | 2025-06-07 | single | | |
rirv938 | 1 | 778.0 | 1.0 | 1291.03 | 1353.66 | 0.54 | 0.99 | rirv938-anthropic-grpo-_19396_v1 | 13B | rirv938/anthropic_grpo_40k_cp78_95ff_baseline_merged | rirv938-anthropic-grpo-_19396_v1 | 8024 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.66 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 779.0 | 1.0 | 1291.0 | 1353.66 | 0.53 | 0.99 | blend_fenek_2025-07-09 | n/a | | rob_ab_test | 6682 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-07-09 | blended | | |
rirv938 | 1 | 780.0 | 1.0 | 1290.93 | 1353.66 | 0.54 | 0.99 | chaiml-mistral32-sftexp1_2523_v6 | 24B | ChaiML/mistral32-sftexp1-s1-groksyn30jun-full-4e-top750 | chaiml-mistral32-sftexp1_2523_v6 | 5816 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/mistral32-sftexp1 | 2025-07-07 | single | 1.35 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 781.0 | 1.0 | 1290.89 | 1353.66 | 0.45 | 0.99 | rirv938-grpo-20250711-c_25242_v1 | 24B | rirv938/grpo_20250711_cp312_sid_mistral_24b_dpo_40k_2_merged | rirv938-grpo-20250711-c_25242_v1 | 7607 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_20250711_cp | 2025-07-14 | single | 1.36 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 782.0 | 1.0 | 1290.87 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-2_68187_v1 | 13B | rirv938/anthropic_40k_2500_swear_10_v2 | rirv938-anthropic-40k-2_68187_v1 | 6786 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_25 | 2025-01-21 | single | | |
rirv938 | 1 | 783.5 | 1.0 | 1290.8 | 1353.66 | 0.65 | 0.99 | function_nitim_2025-04-10 | | | dpo_data_collection | 7459 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-04-10 | single | | |
rirv938 | 1 | 783.5 | 1.0 | 1290.8 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-_68706_v1 | 13B | rirv938/anthropic_beta_2_40k_1248_bo16_v2 | rirv938-anthropic-beta-_68706_v1 | 19253 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-29 | single | 2.89 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 785.0 | 1.0 | 1290.78 | 1353.66 | 0.5 | 0.99 | rirv938-mistral-24b-dpo_29487_v6 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_1250_instruct_dpo_2_v2 | rirv938-mistral-24b-dpo_29487_v6 | 6961 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-26 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 786.0 | 1.0 | 1290.77 | 1353.66 | 0.52 | 0.99 | rirv938-0sw-94p-6ff-rir_45663_v1 | 24B | rirv938/0sw_94p_6ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp78_v2 | rirv938-0sw-94p-6ff-rir_45663_v1 | 10216 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_94p_6ff_rirv | 2025-03-26 | single | 0.76 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 787.0 | 1.0 | 1290.76 | 1353.66 | 0.6 | 0.99 | function_kogek_2025-03-06 | | | retune_with_base | 7704 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-03-06 | single | | |
rirv938 | 1 | 788.0 | 1.0 | 1290.74 | 1353.66 | 0.56 | 0.99 | rirv938-grpo-to-compare_30616_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp624_g16_merged | rirv938-grpo-to-compare_30616_v1 | 9021 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-25 | single | 1.42 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 789.0 | 1.0 | 1290.71 | 1353.66 | 0.53 | 0.99 | rirv938-rinen-grpo-40k-c_7257_v1 | 13B | rirv938/rinen_grpo_40k_cp444_95ff_run2_ww_merged | rirv938-rinen-grpo-40k-c_7257_v1 | 8532 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/rinen_grpo_40k_c | 2025-05-15 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 790.5 | 1.0 | 1290.66 | 1353.66 | 0.56 | 0.99 | chaiml-camp-half-blood-_29383_v3 | 24B | ChaiML/Camp-Half-blood-Rp250614101345_preference_dpo | chaiml-camp-half-blood-_29383_v3 | 7655 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/Camp-Half-blood-R | 2025-07-07 | single | 1.35 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 790.5 | 1.0 | 1290.66 | 1353.66 | 0.6 | 0.99 | blend_fohef_2025-01-08 | n/a | | rob_ab_test | 12013 | 61115860 | 0.54 | 0.65 | blend | | | | | | | 2025-01-08 | blended | | |
rirv938 | 1 | 792.0 | 1.0 | 1290.62 | 1353.66 | 0.56 | 0.99 | rirv938-94p-6ff-rirv938_99477_v1 | 24B | rirv938/94p_6ff_rirv938_1000_sim_100p_0_17599_v1_cp530_merged | rirv938-94p-6ff-rirv938_99477_v1 | 8235 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/94p_6ff_rirv938_ | 2025-04-21 | single | 1.46 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 793.5 | 1.0 | 1290.52 | 1353.66 | 0.52 | 0.99 | rirv938-snug-grpo-40k-cp_3986_v1 | 13B | rirv938/snug_grpo_40k_cp592_93ff_b_merged | rirv938-snug-grpo-40k-cp_3986_v1 | 5451 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/snug_grpo_40k_cp | 2025-05-01 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 793.5 | 1.0 | 1290.52 | 1353.66 | 0.6 | 0.99 | rirv938-nitral-beta-40k_51642_v1 | 13B | rirv938/nitral_beta_40k_12486_v2 | rirv938-nitral-beta-40k_51642_v1 | 16111 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_beta_40k_ | 2024-12-27 | single | 2.83 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 795.0 | 1.0 | 1290.49 | 1353.66 | 0.53 | 0.99 | function_kifem_2025-05-22 | | | dpo_data_collection | 8545 | 61115860 | 0.49 | 0.65 | function | | | | | | | 2025-05-22 | single | | |
rirv938 | 1 | 796.0 | 1.0 | 1290.44 | 1353.66 | 0.0 | 0.99 | function_fuset_2025-01-31 | | | retune_with_base | 5809 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-01-30 | single | | |
rirv938 | 1 | 797.0 | 1.0 | 1290.41 | 1353.66 | 0.52 | 0.99 | rirv938-mistral-24b-dpo_50042_v1 | 24B | rirv938/mistral_24b_dpo_kl_10k_beta4_1248_v3 | rirv938-mistral-24b-dpo_50042_v1 | 7114 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-24 | single | 0.76 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 798.0 | 1.0 | 1290.38 | 1353.66 | 0.51 | 0.99 | function_puror_2025-03-14 | | | dpo_data_collection | 7438 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-03-14 | single | | |
rirv938 | 1 | 799.0 | 1.0 | 1290.37 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_21322_v1 | 13B | rirv938/anthropic_grpo_40k_cp1184_95ff_6ww_merged | rirv938-anthropic-grpo-_21322_v1 | 8504 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-13 | single | 1.68 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 800.5 | 1.0 | 1290.34 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-beta-40k_59903_v2 | 13B | rirv938/nitral_beta_40k_624_v2 | rirv938-nitral-beta-40k_59903_v2 | 19706 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_beta_40k_ | 2024-12-27 | single | 2.92 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 800.5 | 1.0 | 1290.34 | 1353.66 | 0.54 | 0.99 | blend_pigab_2025-05-31 | n/a | | rob_ab_test | 5673 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-05-31 | blended | | |
rirv938 | 1 | 802.0 | 1.0 | 1290.31 | 1353.66 | 0.59 | 0.99 | chaiml-slerpv5-mistral_24540_v14 | 24B | ChaiML/slerpv5_mistral31_simpo_dpo_dpoold_s2 | chaiml-slerpv5-mistral_24540_v14 | 16645 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerpv5_mistral31 | 2025-06-05 | single | | |
rirv938 | 1 | 804.0 | 1.0 | 1290.29 | 1353.66 | 0.57 | 0.99 | chaiml-mistral31-24b-sf_19349_v4 | 24B | ChaiML/mistral31-24b-sftmorelora-retryv2-top20k | chaiml-mistral31-24b-sf_19349_v4 | 6336 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/mistral31-24b-sft | 2025-07-07 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 804.0 | 1.0 | 1290.29 | 1353.66 | 0.52 | 0.99 | blend_lomel_2025-07-09 | n/a | | rob_ab_test | 7158 | 61115860 | 0.49 | 0.65 | blend | | | | | | | 2025-07-09 | blended | | |
rirv938 | 1 | 804.0 | 1.0 | 1290.29 | 1353.66 | 0.55 | 0.99 | blend_fikas_2025-04-23 | n/a | | rob_ab_test | 8940 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-04-23 | blended | | |
rirv938 | 1 | 806.5 | 1.0 | 1290.28 | 1353.66 | 0.6 | 0.99 | rirv938-nitral-18k-558-v2_v1 | 13B | rirv938/nitral_18k_558_v2 | rirv938-nitral-18k-558-v2_v1 | 15614 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_18k_558_v | 2024-12-27 | single | 2.95 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 806.5 | 1.0 | 1290.28 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-40k-12_7347_v1 | 13B | rirv938/anthropic_40k_1248_bo8_85w_b4_2xlora_2xlr_v2 | rirv938-anthropic-40k-12_7347_v1 | 16080 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_12 | 2025-01-01 | single | 1.77 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 808.0 | 1.0 | 1290.2 | 1353.66 | 0.53 | 0.99 | blend_sobim_2025-05-01 | n/a | | rob_ab_test | 7523 | 61115860 | 0.49 | 0.65 | blend | | | | | | | 2025-05-01 | blended | | |
rirv938 | 1 | 809.0 | 1.0 | 1290.19 | 1353.66 | 0.53 | 0.99 | function_kakal_2025-05-22 | | | dpo_data_collection | 6322 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-05-21 | single | | |
rirv938 | 1 | 810.0 | 1.0 | 1290.04 | 1353.66 | 0.58 | 0.99 | rirv938-mistral-filtered_1275_v1 | 13B | rirv938/mistral_filtered_1116_v2 | rirv938-mistral-filtered_1275_v1 | 16611 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/mistral_filtered | 2024-12-21 | single | 1.73 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 811.0 | 1.0 | 1290.0 | 1353.66 | 0.54 | 0.99 | blend_debut_2025-05-01 | n/a | | rob_ab_test | 6819 | 61115860 | 0.49 | 0.65 | blend | | | | | | | 2025-05-01 | blended | | |
rirv938 | 1 | 812.0 | 1.0 | 1289.98 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp12_50590_v1 | 24B | rirv938/slerp_grpo_cp1248_96ff_b3_r1_merged | rirv938-slerp-grpo-cp12_50590_v1 | 8530 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp124 | 2025-06-09 | single | | |
rirv938 | 1 | 813.0 | 1.0 | 1289.97 | 1353.66 | 0.54 | 0.99 | function_metal_2025-05-28 | | | dpo_data_collection | 9467 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-05-28 | single | | |
rirv938 | 1 | 814.0 | 1.0 | 1289.95 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_48962_v1 | 13B | rirv938/anthropic_grpo_40k_cp624_95ff_beta4_merged | rirv938-anthropic-grpo-_48962_v1 | 5998 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 815.0 | 1.0 | 1289.94 | 1353.66 | 0.53 | 0.99 | blend_jalib_2025-05-31 | n/a | | rob_ab_test | 5758 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-05-31 | blended | | |
rirv938 | 1 | 816.0 | 1.0 | 1289.84 | 1353.66 | 0.58 | 0.99 | rirv938-prefgrok-cp624-_37030_v2 | 24B | rirv938/prefgrok_cp624_98ff_b35_r1_reformat_high_quality_merged | rirv938-prefgrok-cp624-_37030_v2 | 5692 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/prefgrok_cp624_9 | 2025-07-07 | single | 1.4 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 817.5 | 1.0 | 1289.83 | 1353.66 | 0.51 | 0.99 | function_mimur_2025-03-26 | | | dpo_data_collection | 10191 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-03-26 | single | | |
rirv938 | 1 | 817.5 | 1.0 | 1289.83 | 1353.66 | 0.54 | 0.99 | function_fules_2025-06-25 | | | dpo_data_collection | 6387 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-06-25 | single | | |
rirv938 | 1 | 819.0 | 1.0 | 1289.82 | 1353.66 | 0.49 | 0.99 | chaiml-mistral31-24b-s_69496_v17 | 24B | ChaiML/mistral31-24b-simpoexp1-s1-new-sft-retryv2top20lex-2e | chaiml-mistral31-24b-s_69496_v17 | 8034 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/mistral31-24b-sim | 2025-06-30 | single | 1.6 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 820.0 | 1.0 | 1289.75 | 1353.66 | 0.55 | 0.99 | rirv938-grpo-to-compare-_4371_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp156_lr4_merged | rirv938-grpo-to-compare-_4371_v1 | 10899 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-25 | single | 1.4 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 821.0 | 1.0 | 1289.68 | 1353.66 | 0.56 | 0.99 | chaiml-llama-8b-multih_78780_v34 | 8B | ChaiML/llama_8b_multihead_204m_512_v3_tokens_step_398208 | chaiml-llama-8b-multih_78780_v34 | 6236 | 61115860 | 0.52 | 0.65 | basic | | 1.0 | 2048.0 | 1.0 | MultiHeadLlamaClassifier | ChaiML/llama_8b_multihea | 2025-02-14 | single | | |
rirv938 | 1 | 822.0 | 1.0 | 1289.67 | 1353.66 | 0.53 | 0.99 | rirv938-groksyn-grpo-cp_67088_v1 | 24B | rirv938/groksyn_grpo_cp312_98ff_b35_r1_merged | rirv938-groksyn-grpo-cp_67088_v1 | 6005 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/groksyn_grpo_cp3 | 2025-07-03 | single | 1.63 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 823.0 | 1.0 | 1289.63 | 1353.66 | 0.49 | 0.99 | chaiml-mistral31-24b-s_69496_v15 | 24B | ChaiML/mistral31-24b-simpoexp1-s1-new-sft-retryv2top20lex-2e | chaiml-mistral31-24b-s_69496_v15 | 6340 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/mistral31-24b-sim | 2025-06-26 | single | 1.63 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 824.0 | 1.0 | 1289.6 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_70195_v2 | 13B | rirv938/anthropic_grpo_40k_cp1184_95ff_beta6_2_merged | rirv938-anthropic-grpo-_70195_v2 | 9374 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.6 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 825.0 | 1.0 | 1289.51 | 1353.66 | 0.5 | 0.99 | function_lefan_2025-03-14 | | | dpo_data_collection | 8646 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-03-14 | single | | |
rirv938 | 1 | 826.0 | 1.0 | 1289.5 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-_10235_v1 | 13B | rirv938/anthropic_beta_2_40k_1872_bo16_v2 | rirv938-anthropic-beta-_10235_v1 | 17999 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-29 | single | 2.98 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 827.0 | 1.0 | 1289.42 | 1353.66 | 0.6 | 0.99 | rirv938-nitral-40k-624-v2_v1 | 13B | rirv938/nitral_40k_624_v2 | rirv938-nitral-40k-624-v2_v1 | 15256 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_624_v | 2024-12-27 | single | 2.91 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 828.5 | 1.0 | 1289.41 | 1353.66 | 0.56 | 0.99 | rirv938-slerp-grpo-cp156_6356_v1 | 24B | rirv938/slerp_grpo_cp156_96ff_b3_r1_20k_merged | rirv938-slerp-grpo-cp156_6356_v1 | 8085 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/slerp_grpo_cp156 | 2025-06-10 | single | | |
rirv938 | 1 | 828.5 | 1.0 | 1289.41 | 1353.66 | 0.55 | 0.99 | function_tobos_2025-03-25 | | | dpo_data_collection | 7901 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2025-03-25 | single | | |
rirv938 | 1 | 830.5 | 1.0 | 1289.4 | 1353.66 | 0.5 | 0.99 | rirv938-mistral-24b-dpo_45953_v1 | 24B | rirv938/mistral_24b_dpo_kl_40k_beta4_6250_v3 | rirv938-mistral-24b-dpo_45953_v1 | 6230 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-24 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 830.5 | 1.0 | 1289.4 | 1353.66 | 0.54 | 0.99 | chaiml-mistral32-sftexp1_2523_v4 | 24B | ChaiML/mistral32-sftexp1-s1-groksyn30jun-full-4e-top750 | chaiml-mistral32-sftexp1_2523_v4 | 9163 | 61115860 | 0.5 | 0.65 | basic | | 6.0 | 1536.0 | 64.0 | MistralForCausalLM | ChaiML/mistral32-sftexp1 | 2025-07-07 | single | 1.09 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 832.0 | 1.0 | 1289.3 | 1353.66 | 0.53 | 0.99 | nischaydnk-exp14-exp9d_94555_v11 | 24B | NischayDnk/exp14-exp9DPOft-Chaidatav1dpo6k-Mistral24B | nischaydnk-exp14-exp9d_94555_v11 | 20403 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | NischayDnk/exp14-exp9DPO | 2025-06-07 | single | | |
rirv938 | 1 | 833.0 | 1.0 | 1289.23 | 1353.66 | 0.55 | 0.99 | blend_gojet_2025-04-14 | n/a | | rob_ab_test | 5618 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-04-14 | blended | | |
rirv938 | 1 | 834.0 | 1.0 | 1289.2 | 1353.66 | 0.57 | 0.99 | chaiml-anthropic-grpo-40_3002_v1 | 13B | ChaiML/anthropic_grpo_40k_cp234_95ff_beta4_merged | chaiml-anthropic-grpo-40_3002_v1 | 7588 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/anthropic_grpo_40 | 2025-05-15 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 835.0 | 1.0 | 1289.15 | 1353.66 | 0.57 | 0.99 | chaiml-mistral31-24b-sf_19349_v5 | 24B | ChaiML/mistral31-24b-sftmorelora-retryv2-top20k | chaiml-mistral31-24b-sf_19349_v5 | 6913 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/mistral31-24b-sft | 2025-07-07 | single | 1.32 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 836.0 | 1.0 | 1289.13 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-2_6346_v1 | 13B | rirv938/anthropic_beta_2_40k_2496_bo4_v2 | rirv938-anthropic-beta-2_6346_v1 | 28804 | 61115860 | 0.54 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-29 | single | 2.84 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 837.0 | 1.0 | 1289.09 | 1353.66 | 0.55 | 0.99 | rirv938-dpo-to-compare-_51776_v1 | 24B | rirv938/dpo_to_compare_to_grpo_10k_cp248_merged | rirv938-dpo-to-compare-_51776_v1 | 6679 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/dpo_to_compare_t | 2025-04-25 | single | 1.45 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 838.0 | 1.0 | 1289.04 | 1353.66 | 0.58 | 0.99 | rirv938-lr-2-mistral-558-v2_v1 | 13B | rirv938/lr_2_mistral_558_v2 | rirv938-lr-2-mistral-558-v2_v1 | 20106 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/lr_2_mistral_558 | 2024-12-21 | single | 1.77 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 839.0 | 1.0 | 1289.03 | 1353.66 | 0.57 | 0.99 | chaiml-slerpv5-mistral3_24540_v9 | 24B | ChaiML/slerpv5_mistral31_simpo_dpo_dpoold_s2 | chaiml-slerpv5-mistral3_24540_v9 | 5745 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerpv5_mistral31 | 2025-05-31 | single | | |
rirv938 | 1 | 840.0 | 1.0 | 1289.02 | 1353.66 | 0.0 | 0.99 | function_basum_2025-04-10 | | | dpo_data_collection | 5971 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-04-10 | single | | |
rirv938 | 1 | 841.0 | 1.0 | 1289.0 | 1353.66 | 0.53 | 0.99 | blend_suhif_2025-06-25 | n/a | | rob_ab_test | 6243 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-06-25 | blended | | |
rirv938 | 1 | 842.0 | 1.0 | 1288.92 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_58960_v1 | 13B | rirv938/anthropic_grpo_40k_cp234_95ff_beta4_merged | rirv938-anthropic-grpo-_58960_v1 | 6268 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 843.0 | 1.0 | 1288.87 | 1353.66 | 0.54 | 0.99 | function_hahat_2025-06-25 | | | dpo_data_collection | 11513 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-06-25 | single | | |
rirv938 | 1 | 844.0 | 1.0 | 1288.86 | 1353.66 | 0.58 | 0.99 | rirv938-v7-pref-plus-03-_9004_v1 | 13B | rirv938/v7_pref_plus_03_mistral_1116_v2 | rirv938-v7-pref-plus-03-_9004_v1 | 25044 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/v7_pref_plus_03_ | 2024-12-22 | single | 1.82 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 845.0 | 1.0 | 1288.85 | 1353.66 | 0.52 | 0.99 | rirv938-0sw-94p-6ff-rir_70552_v1 | 24B | rirv938/0sw_94p_6ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp234_v2 | rirv938-0sw-94p-6ff-rir_70552_v1 | 9628 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_94p_6ff_rirv | 2025-03-26 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 846.5 | 1.0 | 1288.82 | 1353.66 | 0.58 | 0.99 | rirv938-nitral-40k-2500_59046_v1 | 13B | rirv938/nitral_40k_2500_13ff_10w_bo32_old_rm_fixed_v2_v2 | rirv938-nitral-40k-2500_59046_v1 | 6236 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_2500_ | 2025-01-31 | single | | |
rirv938 | 1 | 846.5 | 1.0 | 1288.82 | 1353.66 | 0.47 | 0.99 | rirv938-mistral-24b-dpo_45557_v1 | 24B | rirv938/mistral_24b_dpo_kl_10k_beta2_1248_v3 | rirv938-mistral-24b-dpo_45557_v1 | 8338 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-25 | single | 0.76 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 848.0 | 1.0 | 1288.77 | 1353.66 | 0.58 | 0.99 | rirv938-anthropic-40k-2_75038_v3 | 13B | rirv938/anthropic_40k_2500_15w_swearing_no_safety_v2 | rirv938-anthropic-40k-2_75038_v3 | 6355 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_25 | 2025-01-29 | single | | |
rirv938 | 1 | 849.0 | 1.0 | 1288.74 | 1353.66 | 0.54 | 0.99 | function_ramit_2025-06-25 | | | dpo_data_collection | 6474 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-06-25 | single | | |
rirv938 | 1 | 850.0 | 1.0 | 1288.69 | 1353.66 | 0.56 | 0.99 | blend_podit_2025-02-24 | n/a | | rob_ab_test | 6183 | 61115860 | 0.53 | 0.65 | blend | | | | | | | 2025-02-24 | blended | | |
rirv938 | 1 | 851.0 | 1.0 | 1288.68 | 1353.66 | 0.51 | 0.99 | rirv938-mistral-24b-dpo_95031_v1 | 24B | rirv938/mistral_24b_dpo_kl_10k_beta1_312_v3 | rirv938-mistral-24b-dpo_95031_v1 | 8905 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-25 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 852.0 | 1.0 | 1288.65 | 1353.66 | 0.55 | 0.99 | blend_sigif_2025-03-21 | n/a | | rob_ab_test | 7104 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-03-21 | blended | | |
rirv938 | 1 | 853.0 | 1.0 | 1288.63 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_25164_v1 | 13B | rirv938/anthropic_grpo_40k_cp1776_95ff_beta6_2_2_merged | rirv938-anthropic-grpo-_25164_v1 | 10102 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-16 | single | 1.62 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 854.0 | 1.0 | 1288.58 | 1353.66 | 0.0 | 0.99 | function_ritab_2025-01-30 | | | retune_with_base | 5472 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-01-30 | single | | |
rirv938 | 1 | 855.0 | 1.0 | 1288.54 | 1353.66 | 0.47 | 0.99 | chaiml-mistral-24b-dpo_43220_v10 | 24B | ChaiML/mistral_24b_dpo_40k_95w_pref_1250_instruct_dpo_2_merged | chaiml-mistral-24b-dpo_43220_v10 | 9283 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/mistral_24b_dpo_4 | 2025-07-11 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 856.5 | 1.0 | 1288.51 | 1353.66 | 0.6 | 0.99 | rirv938-nitral-40k-1248-v2_v1 | 13B | rirv938/nitral_40k_1248_v2 | rirv938-nitral-40k-1248-v2_v1 | 17030 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_1248_ | 2024-12-27 | single | 2.91 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 856.5 | 1.0 | 1288.51 | 1353.66 | 0.58 | 0.99 | rirv938-mistral-24b-dpo_29487_v2 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_1250_instruct_dpo_2_v2 | rirv938-mistral-24b-dpo_29487_v2 | 9017 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-05 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 858.0 | 1.0 | 1288.49 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-_63113_v1 | 13B | rirv938/anthropic_beta_2_40k_1872_bo8_v2 | rirv938-anthropic-beta-_63113_v1 | 30297 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-29 | single | 2.91 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 859.0 | 1.0 | 1288.48 | 1353.66 | 0.53 | 0.99 | blend_defil_2025-07-09 | n/a | | rob_ab_test | 7171 | 61115860 | 0.49 | 0.65 | blend | | | | | | | 2025-07-09 | blended | | |
rirv938 | 1 | 860.5 | 1.0 | 1288.46 | 1353.66 | 0.52 | 0.99 | rirv938-0sw-96p-4ff-rir_91910_v1 | 24B | rirv938/0sw_96p_4ff_rirv938_mistral_24b_dpo_43074_v1_cp468_v3 | rirv938-0sw-96p-4ff-rir_91910_v1 | 6657 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_96p_4ff_rirv | 2025-03-25 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 860.5 | 1.0 | 1288.46 | 1353.66 | 0.55 | 0.99 | rinen0721-dpo-0130-cp3000_v15 | 13B | rinen0721/dpo-0130-cp3000 | rinen0721-dpo-0130-cp3000_v15 | 5708 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rinen0721/dpo-0130-cp300 | 2025-04-28 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 862.0 | 1.0 | 1288.45 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-40k-1_16761_v1 | 13B | rirv938/anthropic_40k_1248_bo8_85w_b4_2xlora_lr4_v2 | rirv938-anthropic-40k-1_16761_v1 | 19077 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_12 | 2025-01-01 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 863.0 | 1.0 | 1288.39 | 1353.66 | 0.58 | 0.99 | function_bedul_2024-12-26 | | | retune_with_base | 21787 | 61115860 | 0.54 | 0.65 | function | | | | | | | 2024-12-26 | single | | |
rirv938 | 1 | 864.0 | 1.0 | 1288.36 | 1353.66 | 0.57 | 0.99 | rirv938-anthropic-grpo-_64392_v1 | 13B | rirv938/anthropic_grpo_40k_cp624_95ff_beta6_merged | rirv938-anthropic-grpo-_64392_v1 | 5825 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.62 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 865.0 | 1.0 | 1288.33 | 1353.66 | 0.53 | 0.99 | chaiml-snugstable-grpo-4_7330_v1 | 13B | ChaiML/snugstable_grpo_40k_cp1184_93ff | chaiml-snugstable-grpo-4_7330_v1 | 8935 | 61115860 | 0.48 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/snugstable_grpo_4 | 2025-05-01 | single | 1.36 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 866.0 | 1.0 | 1288.28 | 1353.66 | 0.58 | 0.99 | function_sileb_2025-02-24 | | | retune_with_base | 5608 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-02-24 | single | | |
rirv938 | 1 | 867.0 | 1.0 | 1288.27 | 1353.66 | 0.46 | 0.99 | chaiml-mistral-24b-dpo-_43220_v5 | 24B | ChaiML/mistral_24b_dpo_40k_95w_pref_1250_instruct_dpo_2_merged | chaiml-mistral-24b-dpo-_43220_v5 | 5787 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/mistral_24b_dpo_4 | 2025-04-16 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 868.0 | 1.0 | 1288.25 | 1353.66 | 0.58 | 0.99 | rirv938-nitral-40k-2500_76258_v1 | 13B | rirv938/nitral_40k_2500_13ff_10w_bo32_old_rm_v2 | rirv938-nitral-40k-2500_76258_v1 | 7752 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_2500_ | 2025-01-31 | single | | |
rirv938 | 1 | 869.0 | 1.0 | 1288.23 | 1353.66 | 0.56 | 0.99 | rirv938-harry-potter-rp_65094_v2 | 24B | rirv938/harry_potter_rp_grpo_cp624_98ff_b35_r1_merged | rirv938-harry-potter-rp_65094_v2 | 6902 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/harry_potter_rp_ | 2025-07-07 | single | 1.32 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 870.0 | 1.0 | 1288.21 | 1353.66 | 0.59 | 0.99 | rirv938-96p-4ff-nischaydn_844_v2 | 24B | rirv938/96p_4ff_nischaydnk_exp14_exp9dp_94555_v6_cp2000_merged | rirv938-96p-4ff-nischaydn_844_v2 | 20421 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_nischayd | 2025-06-07 | single | | |
rirv938 | 1 | 871.0 | 1.0 | 1288.2 | 1353.66 | 0.54 | 0.99 | blend_potek_2025-03-08 | n/a | | rob_ab_test | 10001 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-03-08 | blended | | |
rirv938 | 1 | 872.0 | 1.0 | 1288.18 | 1353.66 | 0.55 | 0.99 | rirv938-nitral-40k-2500_98229_v1 | 13B | rirv938/nitral_40k_2500_0w_bo32_new_rm_v2 | rirv938-nitral-40k-2500_98229_v1 | 5380 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_2500_ | 2025-01-30 | single | | |
rirv938 | 1 | 873.0 | 1.0 | 1288.16 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-40k-2_75038_v1 | 13B | rirv938/anthropic_40k_2500_15w_swearing_no_safety_v2 | rirv938-anthropic-40k-2_75038_v1 | 7792 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_25 | 2025-01-28 | single | | |
rirv938 | 1 | 874.0 | 1.0 | 1288.07 | 1353.66 | 0.59 | 0.99 | rirv938-mistral-24b-rou_41210_v1 | 24B | rirv938/mistral_24b_round_2_dpo_40k_70w_pref_16w_swear_2500_v2 | rirv938-mistral-24b-rou_41210_v1 | 10289 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_roun | 2025-03-07 | single | 0.76 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 875.0 | 1.0 | 1288.06 | 1353.66 | 0.54 | 0.99 | rirv938-96p-4ff-rirv938_59567_v1 | 24B | rirv938/96p_4ff_rirv938_1000_sim_100p_0_17599_v1_cp530_merged | rirv938-96p-4ff-rirv938_59567_v1 | 6368 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/96p_4ff_rirv938_ | 2025-04-21 | single | 1.49 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 876.5 | 1.0 | 1288.05 | 1353.66 | 0.48 | 0.99 | rirv938-mistral-24b-dpo_39021_v1 | 24B | rirv938/mistral_24b_dpo_kl_10k_beta2_936_v3 | rirv938-mistral-24b-dpo_39021_v1 | 7552 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-25 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 876.5 | 1.0 | 1288.05 | 1353.66 | 0.53 | 0.99 | blend_famot_2025-07-09 | n/a | | rob_ab_test | 6868 | 61115860 | 0.49 | 0.65 | blend | | | | | | | 2025-07-09 | blended | | |
rirv938 | 1 | 878.0 | 1.0 | 1288.03 | 1353.66 | 0.54 | 0.99 | rirv938-mistral-24b-dpo_56149_v1 | 24B | rirv938/mistral_24b_dpo_kl_2500_beta4_390_v3 | rirv938-mistral-24b-dpo_56149_v1 | 6091 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-24 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 879.0 | 1.0 | 1288.02 | 1353.66 | 0.44 | 0.99 | rirv938-mistral-24b-dpo_67163_v1 | 24B | rirv938/mistral_24b_dpo_kl_10k_beta1_1248_v3 | rirv938-mistral-24b-dpo_67163_v1 | 10290 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-25 | single | 0.8 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 880.0 | 1.0 | 1288.0 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-18k-279-v2_v1 | 13B | rirv938/nitral_18k_279_v2 | rirv938-nitral-18k-279-v2_v1 | 17608 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_18k_279_v | 2024-12-27 | single | 2.92 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 881.0 | 1.0 | 1287.95 | 1353.66 | 0.56 | 0.99 | rirv938-grpo-to-compare_32686_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp156_lr5_merged | rirv938-grpo-to-compare_32686_v1 | 7445 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-25 | single | 1.47 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 882.5 | 1.0 | 1287.91 | 1353.66 | 0.58 | 0.99 | rirv938-nitral-40k-1875-_3275_v1 | 13B | rirv938/nitral_40k_1875_13ff_15w_bo32_old_rm_v2 | rirv938-nitral-40k-1875-_3275_v1 | 5916 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_1875_ | 2025-01-31 | single | | |
rirv938 | 1 | 882.5 | 1.0 | 1287.91 | 1353.66 | 0.52 | 0.99 | rirv938-0sw-94p-6ff-rir_46054_v1 | 24B | rirv938/0sw_94p_6ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp312_v2 | rirv938-0sw-94p-6ff-rir_46054_v1 | 8881 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_94p_6ff_rirv | 2025-03-26 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 884.0 | 1.0 | 1287.88 | 1353.66 | 0.51 | 0.99 | chaiml-mistral31-24b-si_69496_v6 | 24B | ChaiML/mistral31-24b-simpoexp1-s1-new-sft-retryv2top20lex-2e | chaiml-mistral31-24b-si_69496_v6 | 7885 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/mistral31-24b-sim | 2025-06-10 | single | | |
rirv938 | 1 | 885.0 | 1.0 | 1287.85 | 1353.66 | 0.59 | 0.99 | function_norur_2024-12-31 | | | retune_with_base | 9049 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2024-12-31 | single | | |
rirv938 | 1 | 886.0 | 1.0 | 1287.82 | 1353.66 | 0.52 | 0.99 | rirv938-mistral-24b-dpo_87088_v1 | 24B | rirv938/mistral_24b_dpo_kl_40k_beta4_3750_v3 | rirv938-mistral-24b-dpo_87088_v1 | 6277 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-24 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 887.0 | 1.0 | 1287.81 | 1353.66 | 0.57 | 0.99 | rirv938-mistral-24b-dpo_43074_v1 | 24B | rirv938/mistral_24b_dpo_kl_2500_beta4_234_v3 | rirv938-mistral-24b-dpo_43074_v1 | 5934 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-24 | single | 0.79 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 888.0 | 1.0 | 1287.78 | 1353.66 | 0.54 | 0.99 | function_fobos_2025-06-25 | | | dpo_data_collection | 11809 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-06-25 | single | | |
rirv938 | 1 | 889.0 | 1.0 | 1287.77 | 1353.66 | 0.56 | 0.99 | blend_lehil_2025-02-24 | n/a | | rob_ab_test | 5558 | 61115860 | 0.56 | 0.65 | blend | | | | | | | 2025-02-24 | blended | | |
rirv938 | 1 | 890.0 | 1.0 | 1287.73 | 1353.66 | 0.54 | 0.99 | blend_dobam_2025-04-23 | n/a | | rob_ab_test | 9147 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-04-23 | blended | | |
rirv938 | 1 | 891.0 | 1.0 | 1287.71 | 1353.66 | 0.54 | 0.99 | blend_sotuf_2025-03-08 | n/a | | rob_ab_test | 10142 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-03-08 | blended | | |
rirv938 | 1 | 892.0 | 1.0 | 1287.68 | 1353.66 | 0.54 | 0.99 | blend_jidif_2025-07-09 | n/a | | rob_ab_test | 7534 | 61115860 | 0.49 | 0.65 | blend | | | | | | | 2025-07-09 | blended | | |
rirv938 | 1 | 893.0 | 1.0 | 1287.55 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_22923_v2 | 13B | rirv938/anthropic_grpo_40k_cp444_95ff_20ww2_merged | rirv938-anthropic-grpo-_22923_v2 | 7114 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.6 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 894.0 | 1.0 | 1287.53 | 1353.66 | 0.54 | 0.99 | function_kegus_2025-05-22 | | | dpo_data_collection | 6423 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-05-21 | single | | |
rirv938 | 1 | 895.0 | 1.0 | 1287.52 | 1353.66 | 0.53 | 0.99 | blend_deset_2025-06-12 | n/a | | rob_ab_test | 8487 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-06-11 | blended | | |
rirv938 | 1 | 896.0 | 1.0 | 1287.5 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-beta-_80283_v1 | 13B | rirv938/anthropic_beta_2_40k_1248_bo8_100w_b4_v2 | rirv938-anthropic-beta-_80283_v1 | 12269 | 61115860 | 0.51 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-30 | single | 1.76 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 897.0 | 1.0 | 1287.47 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-beta-4-4_77721_v1 | 13B | rirv938/nitral_beta_4_40k_1248_v2 | rirv938-nitral-beta-4-4_77721_v1 | 19977 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_beta_4_40 | 2024-12-27 | single | 3.06 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 898.0 | 1.0 | 1287.46 | 1353.66 | 0.57 | 0.99 | chaiml-slerp-grpo-cp312_20135_v2 | 24B | ChaiML/slerp_grpo_cp312_96ff_b6_r1_merged | chaiml-slerp-grpo-cp312_20135_v2 | 6148 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerp_grpo_cp312_ | 2025-05-30 | single | | |
rirv938 | 1 | 899.0 | 1.0 | 1287.44 | 1353.66 | 0.55 | 0.99 | nitral-ai-captain-bmo-12b_v46 | 13B | Nitral-AI/Captain_BMO-12B | nitral-ai-captain-bmo-12b_v46 | 9215 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | Nitral-AI/Captain_BMO-12 | 2025-04-30 | single | 1.58 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 900.0 | 1.0 | 1287.43 | 1353.66 | 0.48 | 0.99 | rirv938-grpo-20250711-c_20147_v2 | 24B | rirv938/grpo_20250711_cp624_sid_mistral_24b_dpo_40k__merged | rirv938-grpo-20250711-c_20147_v2 | 9882 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_20250711_cp | 2025-07-11 | single | 1.34 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 901.0 | 1.0 | 1287.42 | 1353.66 | 0.54 | 0.99 | function_momil_2025-06-25 | | | dpo_data_collection | 5523 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-06-24 | single | | |
rirv938 | 1 | 903.0 | 1.0 | 1287.41 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-_99529_v2 | 13B | rirv938/anthropic_beta_2_40k_1872_bo4_v2 | rirv938-anthropic-beta-_99529_v2 | 25395 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-29 | single | 2.94 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 903.0 | 1.0 | 1287.41 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-40k-1_25268_v1 | 13B | rirv938/anthropic_40k_1248_bo8_85w_b4_2xlora_v2 | rirv938-anthropic-40k-1_25268_v1 | 11936 | 61115860 | 0.52 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_12 | 2025-01-01 | single | 1.77 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 903.0 | 1.0 | 1287.41 | 1353.66 | 0.5 | 0.99 | chaiml-bold-v1-rirv938-2_7710_v1 | 24B | ChaiML/bold_v1_rirv938_20250420 | chaiml-bold-v1-rirv938-2_7710_v1 | 9064 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/bold_v1_rirv938_2 | 2025-04-22 | single | 1.43 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 905.0 | 1.0 | 1287.39 | 1353.66 | 0.51 | 0.99 | rirv938-anthropic-grpo-_26753_v1 | 13B | rirv938/anthropic_grpo_40k_cp124_98ff_g4b15_merged | rirv938-anthropic-grpo-_26753_v1 | 7933 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-18 | single | 1.56 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 906.0 | 1.0 | 1287.29 | 1353.66 | 0.53 | 0.99 | blend_tader_2025-06-25 | n/a | | rob_ab_test | 5764 | 61115860 | 0.52 | 0.65 | blend | | | | | | | 2025-06-24 | blended | | |
rirv938 | 1 | 907.0 | 1.0 | 1287.24 | 1353.66 | 0.64 | 0.99 | rirv938-98p-2ff-rirv938_78334_v1 | 13B | rirv938/98p_2ff_rirv938_mistral_12b_oai_47210_v1_cp872_merged | rirv938-98p-2ff-rirv938_78334_v1 | 6278 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/98p_2ff_rirv938_ | 2025-04-10 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 908.5 | 1.0 | 1287.14 | 1353.66 | 0.57 | 0.99 | rirv938-1000-sim-100p-0_17599_v2 | 24B | rirv938/1000_sim_100p_0ff_rirv938_mistral_24b_lex__1090_v2_cp374_merged | rirv938-1000-sim-100p-0_17599_v2 | 7289 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/1000_sim_100p_0f | 2025-04-20 | single | 0.64 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 908.5 | 1.0 | 1287.14 | 1353.66 | 0.56 | 0.99 | rirv938-grpo-to-compare_45958_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp310_merged | rirv938-grpo-to-compare_45958_v1 | 6513 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-25 | single | 1.43 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 910.0 | 1.0 | 1287.1 | 1353.66 | 0.45 | 0.99 | chaiml-mistral-24b-dpo_43220_v11 | 24B | ChaiML/mistral_24b_dpo_40k_95w_pref_1250_instruct_dpo_2_merged | chaiml-mistral-24b-dpo_43220_v11 | 9118 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/mistral_24b_dpo_4 | 2025-07-14 | single | 1.33 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 912.0 | 1.0 | 1287.09 | 1353.66 | 0.58 | 0.99 | rirv938-v-3-mistral-558-v2_v1 | 13B | rirv938/v_3_mistral_558_v2 | rirv938-v-3-mistral-558-v2_v1 | 18626 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/v_3_mistral_558_ | 2024-12-21 | single | 1.78 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 912.0 | 1.0 | 1287.09 | 1353.66 | 0.56 | 0.99 | rirv938-grpo-to-compare_65873_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp156_lr3_merged | rirv938-grpo-to-compare_65873_v1 | 11810 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-25 | single | 1.48 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 912.0 | 1.0 | 1287.09 | 1353.66 | 0.49 | 0.99 | rirv938-0sw-99p-1ff-rirv_2746_v1 | 24B | rirv938/0sw_99p_1ff_rirv938_mistral_24b_dpo_43074_v1_cp234_v3 | rirv938-0sw-99p-1ff-rirv_2746_v1 | 6834 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_99p_1ff_rirv | 2025-03-25 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 914.0 | 1.0 | 1287.08 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-40k-2_75038_v2 | 13B | rirv938/anthropic_40k_2500_15w_swearing_no_safety_v2 | rirv938-anthropic-40k-2_75038_v2 | 8018 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_25 | 2025-01-28 | single | | |
rirv938 | 1 | 915.0 | 1.0 | 1287.05 | 1353.66 | 0.58 | 0.99 | chaiml-slerpv5-mistral_24540_v13 | 24B | ChaiML/slerpv5_mistral31_simpo_dpo_dpoold_s2 | chaiml-slerpv5-mistral_24540_v13 | 20583 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerpv5_mistral31 | 2025-06-05 | single | | |
rirv938 | 1 | 916.5 | 1.0 | 1287.02 | 1353.66 | 0.56 | 0.99 | rirv938-1000-sim-100p-0_45214_v2 | 24B | rirv938/1000_sim_100p_0ff_rirv938_mistral_24b_lex__1090_v2_cp748_merged | rirv938-1000-sim-100p-0_45214_v2 | 7053 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/1000_sim_100p_0f | 2025-04-20 | single | 0.62 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 916.5 | 1.0 | 1287.02 | 1353.66 | 0.59 | 0.99 | function_rufor_2024-12-31 | | | retune_with_base | 11696 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2024-12-31 | single | | |
rirv938 | 1 | 918.0 | 1.0 | 1287.0 | 1353.66 | 0.55 | 0.99 | blend_rudur_2025-03-21 | n/a | | rob_ab_test | 7062 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-03-21 | blended | | |
rirv938 | 1 | 919.0 | 1.0 | 1286.91 | 1353.66 | 0.47 | 0.99 | function_defom_2025-03-14 | | | dpo_data_collection | 7229 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-03-14 | single | | |
rirv938 | 1 | 920.0 | 1.0 | 1286.87 | 1353.66 | 0.51 | 0.99 | rirv938-0sw-96p-4ff-rir_20571_v1 | 24B | rirv938/0sw_96p_4ff_rirv938_mistral_24b_dpo_43074_v1_cp780_v3 | rirv938-0sw-96p-4ff-rir_20571_v1 | 6590 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_96p_4ff_rirv | 2025-03-25 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 921.0 | 1.0 | 1286.86 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_74020_v1 | 13B | rirv938/anthropic_grpo_40k_cp78_95ff_beta6_merged | rirv938-anthropic-grpo-_74020_v1 | 8159 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 922.5 | 1.0 | 1286.85 | 1353.66 | 0.56 | 0.99 | chaiml-camp-half-blood-_29383_v4 | 24B | ChaiML/Camp-Half-blood-Rp250614101345_preference_dpo | chaiml-camp-half-blood-_29383_v4 | 7590 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/Camp-Half-blood-R | 2025-07-07 | single | 1.36 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 922.5 | 1.0 | 1286.85 | 1353.66 | 0.55 | 0.99 | chaiml-nemo-anthropic-_38239_v25 | 13B | ChaiML/nemo_anthropic_addict_lexical_1120_run2 | chaiml-nemo-anthropic-_38239_v25 | 5975 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/nemo_anthropic_ad | 2025-05-13 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 924.0 | 1.0 | 1286.83 | 1353.66 | 0.0 | 0.99 | function_honuk_2025-06-25 | | | dpo_data_collection | 1792 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-06-25 | single | | |
rirv938 | 1 | 925.0 | 1.0 | 1286.79 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-beta-4-40_6225_v1 | 13B | rirv938/nitral_beta_4_40k_312_v2 | rirv938-nitral-beta-4-40_6225_v1 | 11521 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_beta_4_40 | 2024-12-27 | single | 2.94 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 926.0 | 1.0 | 1286.76 | 1353.66 | 0.52 | 0.99 | function_dadeb_2025-02-27 | | | retune_with_base | 5734 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-02-27 | single | | |
rirv938 | 1 | 927.5 | 1.0 | 1286.73 | 1353.66 | 0.53 | 0.99 | function_gugar_2025-06-25 | | | dpo_data_collection | 6035 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-06-25 | single | | |
rirv938 | 1 | 927.5 | 1.0 | 1286.73 | 1353.66 | 0.53 | 0.99 | blend_sufis_2025-06-25 | n/a | | rob_ab_test | 5765 | 61115860 | 0.52 | 0.65 | blend | | | | | | | 2025-06-24 | blended | | |
rirv938 | 1 | 929.0 | 1.0 | 1286.71 | 1353.66 | 0.6 | 0.99 | blend_potol_2025-01-06 | n/a | | rob_ab_test | 9032 | 61115860 | 0.52 | 0.65 | blend | | | | | | | 2025-01-06 | blended | | |
rirv938 | 1 | 930.0 | 1.0 | 1286.7 | 1353.66 | 0.54 | 0.99 | function_binot_2025-05-28 | | | dpo_data_collection | 8296 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-05-28 | single | | |
rirv938 | 1 | 931.0 | 1.0 | 1286.65 | 1353.66 | 0.52 | 0.99 | blend_tepuk_2025-06-12 | n/a | | rob_ab_test | 9785 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-06-11 | blended | | |
rirv938 | 1 | 932.0 | 1.0 | 1286.57 | 1353.66 | 0.57 | 0.99 | rirv938-grpo-to-compare_75170_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp310_lr2_merged | rirv938-grpo-to-compare_75170_v1 | 6931 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-25 | single | 1.46 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 933.0 | 1.0 | 1286.55 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-40k-2_62187_v1 | 13B | rirv938/anthropic_40k_2500_13w_bo32_v2 | rirv938-anthropic-40k-2_62187_v1 | 5874 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_25 | 2025-01-30 | single | | |
rirv938 | 1 | 934.0 | 1.0 | 1286.4 | 1353.66 | 0.56 | 0.99 | rirv938-mistral-12b-dpo-_9564_v1 | 13B | rirv938/mistral_12b_dpo_40k_2374_64_output_tokens_v2 | rirv938-mistral-12b-dpo-_9564_v1 | 6081 | 61115860 | 0.58 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.54 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 935.5 | 1.0 | 1286.39 | 1353.66 | 0.54 | 0.99 | blend_rujik_2025-06-25 | n/a | | rob_ab_test | 6502 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-06-25 | blended | | |
rirv938 | 1 | 935.5 | 1.0 | 1286.39 | 1353.66 | 0.55 | 0.99 | function_hohub_2025-01-29 | | | retune_with_base | 7140 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-01-29 | single | | |
rirv938 | 1 | 937.0 | 1.0 | 1286.37 | 1353.66 | 0.57 | 0.99 | chaiml-slerpv5-mistral_24540_v12 | 24B | ChaiML/slerpv5_mistral31_simpo_dpo_dpoold_s2 | chaiml-slerpv5-mistral_24540_v12 | 21358 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerpv5_mistral31 | 2025-06-05 | single | | |
rirv938 | 1 | 938.0 | 1.0 | 1286.36 | 1353.66 | 0.54 | 0.99 | blend_fogeb_2025-06-25 | n/a | | rob_ab_test | 6155 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-06-25 | blended | | |
rirv938 | 1 | 939.0 | 1.0 | 1286.34 | 1353.66 | 0.48 | 0.99 | rirv938-0sw-98p-2ff-rir_61371_v1 | 24B | rirv938/0sw_98p_2ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp156_v2 | rirv938-0sw-98p-2ff-rir_61371_v1 | 9441 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_98p_2ff_rirv | 2025-03-26 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 940.0 | 1.0 | 1286.18 | 1353.66 | 0.55 | 0.99 | function_lekar_2025-05-22 | | | dpo_data_collection | 6406 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-05-22 | single | | |
rirv938 | 1 | 941.0 | 1.0 | 1286.17 | 1353.66 | 0.55 | 0.99 | blend_tehar_2025-04-14 | n/a | | rob_ab_test | 5486 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-04-14 | blended | | |
rirv938 | 1 | 942.0 | 1.0 | 1286.08 | 1353.66 | 0.54 | 0.99 | blend_pirun_2025-06-25 | n/a | | rob_ab_test | 6084 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-06-25 | blended | | |
rirv938 | 1 | 943.0 | 1.0 | 1286.07 | 1353.66 | 0.55 | 0.99 | rirv938-mistral-12b-dpo_28324_v1 | 13B | rirv938/mistral_12b_dpo_40k_3561_64_output_tokens_v2 | rirv938-mistral-12b-dpo_28324_v1 | 6129 | 61115860 | 0.54 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_12b_dpo_ | 2025-02-24 | single | 1.58 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 944.0 | 1.0 | 1285.98 | 1353.66 | 0.52 | 0.99 | rirv938-anthropic-grpo-_57458_v1 | 13B | rirv938/anthropic_grpo_40k_cp62_98ff_g4b15_merged | rirv938-anthropic-grpo-_57458_v1 | 7990 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-18 | single | 1.63 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 945.0 | 1.0 | 1285.91 | 1353.66 | 0.58 | 0.99 | rirv938-anthropic-40k-25_7275_v1 | 13B | rirv938/anthropic_40k_2500_15w_old_new_data_v2 | rirv938-anthropic-40k-25_7275_v1 | 8411 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_25 | 2025-01-29 | single | | |
rirv938 | 1 | 946.5 | 1.0 | 1285.89 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-40k-1_60332_v1 | 13B | rirv938/anthropic_40k_1248_bo8_85w_b4_l1_v2 | rirv938-anthropic-40k-1_60332_v1 | 11145 | 61115860 | 0.52 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_12 | 2024-12-31 | single | 1.74 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 946.5 | 1.0 | 1285.89 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-20k-1_54023_v1 | 13B | rirv938/anthropic_20k_1248_bo8_80w_dpo5_v2 | rirv938-anthropic-20k-1_54023_v1 | 18791 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_20k_12 | 2025-01-02 | single | 1.67 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 948.0 | 1.0 | 1285.88 | 1353.66 | 0.56 | 0.99 | blend_lipib_2025-03-21 | n/a | | rob_ab_test | 6903 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-03-21 | blended | | |
rirv938 | 1 | 949.0 | 1.0 | 1285.83 | 1353.66 | 0.58 | 0.99 | nitral-ai-captain-bmo-12b_v27 | 13B | Nitral-AI/Captain_BMO-12B | nitral-ai-captain-bmo-12b_v27 | 5550 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | Nitral-AI/Captain_BMO-12 | 2025-01-30 | single | | |
rirv938 | 1 | 950.0 | 1.0 | 1285.82 | 1353.66 | 0.55 | 0.99 | blend_hobim_2025-04-23 | n/a | | rob_ab_test | 9511 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-04-23 | blended | | |
rirv938 | 1 | 951.5 | 1.0 | 1285.81 | 1353.66 | 0.6 | 0.99 | rirv938-nitral-40k-312-v2_v1 | 13B | rirv938/nitral_40k_312_v2 | rirv938-nitral-40k-312-v2_v1 | 25032 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_312_v | 2024-12-27 | single | 2.91 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 951.5 | 1.0 | 1285.81 | 1353.66 | 0.56 | 0.99 | chaiml-nemo-anthropic-_38239_v21 | 13B | ChaiML/nemo_anthropic_addict_lexical_1120_run2 | chaiml-nemo-anthropic-_38239_v21 | 7211 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/nemo_anthropic_ad | 2025-04-28 | single | 1.31 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 953.0 | 1.0 | 1285.78 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-40k-1_92306_v1 | 13B | rirv938/anthropic_40k_1248_bo8_85w_b4_l2_v2 | rirv938-anthropic-40k-1_92306_v1 | 11015 | 61115860 | 0.51 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_12 | 2024-12-31 | single | 1.81 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 954.0 | 1.0 | 1285.75 | 1353.66 | 0.56 | 0.99 | rirv938-tune-mistral-gr_89879_v1 | 24B | rirv938/tune_mistral_grpo_cp62_92ff_v4_merged | rirv938-tune-mistral-gr_89879_v1 | 7426 | 61115860 | 0.48 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-04-29 | single | 1.75 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 955.0 | 1.0 | 1285.73 | 1353.66 | 0.59 | 0.99 | blend_mekit_2025-01-16 | n/a | | rob_ab_test | 7320 | 61115860 | 0.52 | 0.65 | blend | | | | | | | 2025-01-16 | blended | | |
rirv938 | 1 | 956.5 | 1.0 | 1285.68 | 1353.66 | 0.56 | 0.99 | rirv938-grpo-to-compare_51856_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp312_lr3_merged | rirv938-grpo-to-compare_51856_v1 | 11418 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-25 | single | 1.43 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 956.5 | 1.0 | 1285.68 | 1353.66 | 0.57 | 0.99 | chaiml-slerpv5-mistral_24540_v17 | 24B | ChaiML/slerpv5_mistral31_simpo_dpo_dpoold_s2 | chaiml-slerpv5-mistral_24540_v17 | 9495 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerpv5_mistral31 | 2025-06-09 | single | | |
rirv938 | 1 | 958.0 | 1.0 | 1285.66 | 1353.66 | 0.61 | 0.99 | function_tehok_2025-03-07 | | | retune_with_base | 9871 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-03-07 | single | | |
rirv938 | 1 | 959.5 | 1.0 | 1285.52 | 1353.66 | 0.53 | 0.99 | rirv938-mistral-24b-dpo_92099_v1 | 24B | rirv938/mistral_24b_dpo_kl_10k_beta2_312_v3 | rirv938-mistral-24b-dpo_92099_v1 | 8286 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-25 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 959.5 | 1.0 | 1285.52 | 1353.66 | 0.57 | 0.99 | blend_robal_2025-02-25 | n/a | | rob_ab_test | 6035 | 61115860 | 0.54 | 0.65 | blend | | | | | | | 2025-02-25 | blended | | |
rirv938 | 1 | 961.0 | 1.0 | 1285.49 | 1353.66 | 0.55 | 0.99 | blend_satib_2025-03-21 | n/a | | rob_ab_test | 6333 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-03-21 | blended | | |
rirv938 | 1 | 962.5 | 1.0 | 1285.48 | 1353.66 | 0.53 | 0.99 | blend_kibes_2025-07-09 | n/a | | rob_ab_test | 7002 | 61115860 | 0.49 | 0.65 | blend | | | | | | | 2025-07-09 | blended | | |
rirv938 | 1 | 962.5 | 1.0 | 1285.48 | 1353.66 | 0.55 | 0.99 | function_hukor_2025-06-25 | | | dpo_data_collection | 6537 | 61115860 | 0.5 | 0.65 | function | | | | | | | 2025-06-25 | single | | |
rirv938 | 1 | 964.0 | 1.0 | 1285.47 | 1353.66 | 0.56 | 0.99 | rirv938-tune-mistral-gr_63526_v1 | 24B | rirv938/tune_mistral_grpo_cp296_92ff_v3_run3_merged | rirv938-tune-mistral-gr_63526_v1 | 6313 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/tune_mistral_grp | 2025-04-30 | single | 1.73 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 965.0 | 1.0 | 1285.41 | 1353.66 | 0.58 | 0.99 | rirv938-nitral-40k-2500_33037_v1 | 13B | rirv938/nitral_40k_2500_13ff_15w_bo32_old_rm_v2 | rirv938-nitral-40k-2500_33037_v1 | 7719 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_2500_ | 2025-01-31 | single | | |
rirv938 | 1 | 966.0 | 1.0 | 1285.35 | 1353.66 | 0.6 | 0.99 | rirv938-anthropic-beta-_39265_v1 | 13B | rirv938/anthropic_beta_2_40k_1248_bo8_v2 | rirv938-anthropic-beta-_39265_v1 | 15125 | 61115860 | 0.52 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_beta_2 | 2024-12-29 | single | 2.94 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 967.0 | 1.0 | 1285.33 | 1353.66 | 0.53 | 0.99 | blend_dodaf_2025-06-12 | n/a | | rob_ab_test | 7775 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-06-11 | blended | | |
rirv938 | 1 | 968.0 | 1.0 | 1285.32 | 1353.66 | 0.54 | 0.99 | rirv938-mistral-12b-bon_20382_v1 | 13B | rirv938/mistral_12b_bon_1400_346_v2 | rirv938-mistral-12b-bon_20382_v1 | 5727 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/mistral_12b_bon_ | 2025-02-19 | single | 1.3 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 969.0 | 1.0 | 1285.31 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-4_5638_v1 | 13B | rirv938/anthropic_grpo_40k_cp78_95ff_beta4_merged | rirv938-anthropic-grpo-4_5638_v1 | 8040 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.64 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 970.0 | 1.0 | 1285.29 | 1353.66 | 0.59 | 0.99 | chaiml-slerpv5-mistral_24540_v16 | 24B | ChaiML/slerpv5_mistral31_simpo_dpo_dpoold_s2 | chaiml-slerpv5-mistral_24540_v16 | 20223 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | ChaiML/slerpv5_mistral31 | 2025-06-07 | single | | |
rirv938 | 1 | 971.0 | 1.0 | 1285.26 | 1353.66 | 0.57 | 0.99 | chaiml-anthropic-grpo-4_68396_v1 | 13B | ChaiML/anthropic_grpo_40k_cp624_95ff_beta6_merged | chaiml-anthropic-grpo-4_68396_v1 | 7051 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/anthropic_grpo_40 | 2025-05-15 | single | 1.62 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 972.0 | 1.0 | 1285.25 | 1353.66 | 0.53 | 0.99 | blend_gejib_2025-07-09 | n/a | | rob_ab_test | 6665 | 61115860 | 0.49 | 0.65 | blend | | | | | | | 2025-07-09 | blended | | |
rirv938 | 1 | 973.0 | 1.0 | 1285.24 | 1353.66 | 0.54 | 0.99 | blend_betul_2025-06-25 | n/a | | rob_ab_test | 6444 | 61115860 | 0.51 | 0.65 | blend | | | | | | | 2025-06-25 | blended | | |
rirv938 | 1 | 974.0 | 1.0 | 1285.2 | 1353.66 | 0.54 | 0.99 | rirv938-groksyn-grpo-cp_55837_v1 | 24B | rirv938/groksyn_grpo_cp624_98ff_b35_r1_merged | rirv938-groksyn-grpo-cp_55837_v1 | 6020 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/groksyn_grpo_cp6 | 2025-07-03 | single | 1.57 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 975.0 | 1.0 | 1285.16 | 1353.66 | 0.53 | 0.99 | nischaydnk-exp14-exp9d_94555_v10 | 24B | NischayDnk/exp14-exp9DPOft-Chaidatav1dpo6k-Mistral24B | nischaydnk-exp14-exp9d_94555_v10 | 11250 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | NischayDnk/exp14-exp9DPO | 2025-06-07 | single | | |
rirv938 | 1 | 976.0 | 1.0 | 1285.12 | 1353.66 | 0.59 | 0.99 | rirv938-mistral-24b-dpo_29487_v4 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_1250_instruct_dpo_2_v2 | rirv938-mistral-24b-dpo_29487_v4 | 13175 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-03-06 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 977.0 | 1.0 | 1285.11 | 1353.66 | 0.6 | 0.99 | blend_deful_2025-01-16 | n/a | | rob_ab_test | 9191 | 61115860 | 0.52 | 0.65 | blend | | | | | | | 2025-01-16 | blended | | |
rirv938 | 1 | 978.0 | 1.0 | 1285.08 | 1353.66 | 0.56 | 0.99 | rirv938-anthropic-grpo-_72536_v1 | 13B | rirv938/anthropic_grpo_40k_cp234_95ff_beta6_merged | rirv938-anthropic-grpo-_72536_v1 | 6250 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-15 | single | 1.59 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 979.0 | 1.0 | 1285.05 | 1353.66 | 0.58 | 0.99 | rirv938-nitral-40k-1875_16875_v1 | 13B | rirv938/nitral_40k_1875_13ff_10w_bo32_old_rm_v2 | rirv938-nitral-40k-1875_16875_v1 | 5789 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/nitral_40k_1875_ | 2025-01-31 | single | | |
rirv938 | 1 | 980.0 | 1.0 | 1285.04 | 1353.66 | 0.54 | 0.99 | blend_jibis_2025-07-09 | n/a | | rob_ab_test | 7599 | 61115860 | 0.49 | 0.65 | blend | | | | | | | 2025-07-09 | blended | | |
rirv938 | 1 | 981.0 | 1.0 | 1285.03 | 1353.66 | 0.54 | 0.99 | function_pabut_2025-06-25 | | | dpo_data_collection | 7175 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-06-24 | single | | |
rirv938 | 1 | 982.0 | 1.0 | 1285.02 | 1353.66 | 0.52 | 0.99 | rirv938-0sw-94p-6ff-rirv_6635_v1 | 24B | rirv938/0sw_94p_6ff_rirv938_0sw_99p_1ff_rir_73127_v1_cp156_v2 | rirv938-0sw-94p-6ff-rirv_6635_v1 | 9604 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/0sw_94p_6ff_rirv | 2025-03-26 | single | 0.77 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 983.0 | 1.0 | 1284.99 | 1353.66 | 0.45 | 0.99 | rirv938-10sw-100p-0ff-c_87664_v1 | 13B | rirv938/10sw_100p_0ff_chaiml_snugstable1_5_1_59274_v21_merge | rirv938-10sw-100p-0ff-c_87664_v1 | 8818 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/10sw_100p_0ff_ch | 2025-03-18 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 984.0 | 1.0 | 1284.98 | 1353.66 | 0.61 | 0.99 | rirv938-mistral-24b-dpo-_2511_v1 | 24B | rirv938/mistral_24b_dpo_40k_95w_pref_3750_instruct_l128_v2 | rirv938-mistral-24b-dpo-_2511_v1 | 8564 | 61115860 | 0.51 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/mistral_24b_dpo_ | 2025-02-23 | single | 0.78 | {'NVIDIA RTX A6000': 1} |
rirv938 | 1 | 985.5 | 1.0 | 1284.93 | 1353.66 | 0.54 | 0.99 | function_tujom_2025-06-25 | | | dpo_data_collection | 6539 | 61115860 | 0.51 | 0.65 | function | | | | | | | 2025-06-24 | single | | |
rirv938 | 1 | 985.5 | 1.0 | 1284.93 | 1353.66 | 0.57 | 0.99 | rirv938-harry-potter-rp_79878_v1 | 24B | rirv938/harry_potter_rp_grpo_cp312_98ff_b35_r1_merged | rirv938-harry-potter-rp_79878_v1 | 10033 | 61115860 | 0.53 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/harry_potter_rp_ | 2025-07-03 | single | 1.58 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 987.0 | 1.0 | 1284.92 | 1353.66 | 0.55 | 0.99 | chaiml-llama-8b-multih_78780_v32 | 8B | ChaiML/llama_8b_multihead_204m_512_v3_tokens_step_398208 | chaiml-llama-8b-multih_78780_v32 | 5278 | 61115860 | 0.51 | 0.65 | basic | | 1.0 | 1024.0 | 1.0 | MultiHeadLlamaClassifier | ChaiML/llama_8b_multihea | 2025-02-14 | single | | |
rirv938 | 1 | 988.5 | 1.0 | 1284.91 | 1353.66 | 0.53 | 0.99 | blend_hisit_2025-05-31 | n/a | | rob_ab_test | 6512 | 61115860 | 0.5 | 0.65 | blend | | | | | | | 2025-05-31 | blended | | |
rirv938 | 1 | 988.5 | 1.0 | 1284.91 | 1353.66 | 0.56 | 0.99 | blend_tuhin_2025-02-25 | n/a | | rob_ab_test | 5884 | 61115860 | 0.54 | 0.65 | blend | | | | | | | 2025-02-25 | blended | | |
rirv938 | 1 | 990.0 | 1.0 | 1284.9 | 1353.66 | 0.55 | 0.99 | rirv938-anthropic-grpo-_55195_v1 | 13B | rirv938/anthropic_grpo_40k_cp30_98ff_g2b15_merged | rirv938-anthropic-grpo-_55195_v1 | 7980 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_grpo_4 | 2025-05-18 | single | 1.59 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 991.0 | 1.0 | 1284.87 | 1353.66 | 0.59 | 0.99 | rirv938-nitral-beta-4-4_86147_v1 | 13B | rirv938/nitral_beta_4_40k_936_v2 | rirv938-nitral-beta-4-4_86147_v1 | 20559 | 61115860 | 0.52 | 0.65 | basic | | 4.0 | 512.0 | 64.0 | MistralForCausalLM | rirv938/nitral_beta_4_40 | 2024-12-27 | single | 2.88 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 992.0 | 1.0 | 1284.83 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-40k-1_93389_v1 | 13B | rirv938/anthropic_40k_1250_15w_old_data_v2 | rirv938-anthropic-40k-1_93389_v1 | 9613 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_12 | 2025-01-28 | single | | |
rirv938 | 1 | 993.5 | 1.0 | 1284.82 | 1353.66 | 0.58 | 0.99 | function_moruk_2025-01-16 | | | retune_with_base | 7652 | 61115860 | 0.52 | 0.65 | function | | | | | | | 2025-01-16 | single | | |
rirv938 | 1 | 993.5 | 1.0 | 1284.82 | 1353.66 | 0.49 | 0.99 | chaiml-anthropic-40k-24_11629_v5 | 13B | ChaiML/anthropic_40k_2496_bo8_85w_b4_l1_merged | chaiml-anthropic-40k-24_11629_v5 | 6622 | 61115860 | 0.49 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | ChaiML/anthropic_40k_249 | 2025-04-28 | single | 1.6 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 995.0 | 1.0 | 1284.81 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-40k-2_65477_v1 | 13B | rirv938/anthropic_40k_2500_15w_old_data_v2 | rirv938-anthropic-40k-2_65477_v1 | 7465 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_25 | 2025-01-28 | single | | |
rirv938 | 1 | 996.0 | 1.0 | 1284.8 | 1353.66 | 0.6 | 0.99 | rirv938-v10-pref-plus-03_7169_v1 | 13B | rirv938/v10_pref_plus_03_mistral_558_v2 | rirv938-v10-pref-plus-03_7169_v1 | 28597 | 61115860 | 0.53 | 0.65 | basic | | 4.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/v10_pref_plus_03 | 2024-12-23 | single | 1.75 | {'NVIDIA RTX A5000': 1} |
rirv938 | 1 | 997.0 | 1.0 | 1284.78 | 1353.66 | 0.58 | 0.99 | function_mabil_2025-02-24 | | | retune_with_base | 5915 | 61115860 | 0.53 | 0.65 | function | | | | | | | 2025-02-24 | single | | |
rirv938 | 1 | 998.0 | 1.0 | 1284.76 | 1353.66 | 0.57 | 0.99 | rirv938-grpo-to-compare-_3561_v1 | 24B | rirv938/grpo_to_compare_to_dpo_10k_cp312_g16_merged | rirv938-grpo-to-compare-_3561_v1 | 7719 | 61115860 | 0.5 | 0.65 | basic | | 8.0 | 1024.0 | 64.0 | MistralForCausalLM | rirv938/grpo_to_compare_ | 2025-04-25 | single | 1.41 | {'NVIDIA A100-SXM4-80GB': 1} |
rirv938 | 1 | 999.0 | 1.0 | 1284.71 | 1353.66 | 0.59 | 0.99 | rirv938-anthropic-40k-2_43413_v7 | 13B | rirv938/anthropic_40k_2496_bo8_85w_b4_l1_v2 | rirv938-anthropic-40k-2_43413_v7 | 6604 | 61115860 | 0.52 | 0.65 | basic | | 8.0 | 768.0 | 64.0 | MistralForCausalLM | rirv938/anthropic_40k_24 | 2025-01-29 | single | | |
rirv938 | 1 | 1000.5 | 1.0 | 1284.67 | 1353.66 | 0.53 | 0.99 | chaiml-llama-8b-multihe_54063_v9 | 8B | ChaiML/llama_8b_multihead_204m_preference | chaiml-llama-8b-multihe_54063_v9 | 10628 | 61115860 | 0.49 | 0.65 | basic | | 1.0 | 256.0 | 1.0 | LlamaForSequenceClassification | ChaiML/llama_8b_multihea | 2025-03-31 | single | | |