zhenzhe | 1 | 1.0 | 1.0 | 1275.59 | 1275.59 | 0.42 | 0.68 | white-bird-4-dpo_v2 | 13B | white-bird/4_dpo | white-bird-4-dpo_v2 | 8506 | 376660 | 0.5 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/4_dpo | 2025-03-02 | single | 1.39 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 2.0 | 1.0 | 1273.14 | 1275.59 | 0.43 | 0.68 | white-bird-5-dpo-50step_v3 | 13B | white-bird/5_dpo_50step | white-bird-5-dpo-50step_v3 | 10563 | 376660 | 0.49 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/5_dpo_50step | 2025-03-02 | single | 1.34 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 3.0 | 1.0 | 1272.7 | 1275.59 | 0.45 | 0.68 | white-bird-1-dpo_v1 | 13B | white-bird/1_dpo | white-bird-1-dpo_v1 | 10942 | 376660 | 0.49 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_dpo | 2025-03-01 | single | 1.37 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 4.0 | 1.0 | 1270.96 | 1275.59 | 0.44 | 0.68 | white-bird-7-dpo_v3 | 13B | white-bird/7_dpo | white-bird-7-dpo_v3 | 8750 | 376660 | 0.49 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/7_dpo | 2025-03-02 | single | 1.37 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 5.0 | 1.0 | 1268.84 | 1275.59 | 0.44 | 0.68 | white-bird-7-dpo_v1 | 13B | white-bird/7_dpo | white-bird-7-dpo_v1 | 8744 | 376660 | 0.49 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/7_dpo | 2025-03-02 | single | 1.37 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 6.0 | 1.0 | 1267.12 | 1275.59 | 0.43 | 0.68 | white-bird-5-dpo-150step_v1 | 13B | white-bird/5_dpo_150step | white-bird-5-dpo-150step_v1 | 14623 | 376660 | 0.48 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/5_dpo_150step | 2025-03-02 | single | 1.36 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 7.0 | 1.0 | 1267.08 | 1275.59 | 0.41 | 0.68 | white-bird-4-dpo_v1 | 13B | white-bird/4_dpo | white-bird-4-dpo_v1 | 8056 | 376660 | 0.48 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/4_dpo | 2025-03-02 | single | 1.4 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 8.0 | 1.0 | 1266.61 | 1275.59 | 0.44 | 0.68 | white-bird-7-dpo-step100_v1 | 13B | white-bird/7_dpo_step100 | white-bird-7-dpo-step100_v1 | 8140 | 376660 | 0.48 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/7_dpo_step100 | 2025-03-02 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 9.0 | 1.0 | 1266.47 | 1275.59 | 0.44 | 0.68 | white-bird-7-dpo_v2 | 13B | white-bird/7_dpo | white-bird-7-dpo_v2 | 13218 | 376660 | 0.48 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/7_dpo | 2025-03-02 | single | 1.36 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 10.0 | 1.0 | 1264.35 | 1275.59 | 0.46 | 0.68 | white-bird-5-dpo-50step_v1 | 13B | white-bird/5_dpo_50step | white-bird-5-dpo-50step_v1 | 8959 | 376660 | 0.48 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/5_dpo_50step | 2025-03-02 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 11.0 | 1.0 | 1262.95 | 1275.59 | 0.41 | 0.68 | white-bird-4-dpo_v3 | 13B | white-bird/4_dpo | white-bird-4-dpo_v3 | 13242 | 376660 | 0.48 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/4_dpo | 2025-03-02 | single | 1.37 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 12.0 | 1.0 | 1262.36 | 1275.59 | 0.45 | 0.68 | white-bird-1-dpo_v2 | 13B | white-bird/1_dpo | white-bird-1-dpo_v2 | 13082 | 376660 | 0.47 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_dpo | 2025-03-01 | single | 1.39 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 13.0 | 1.0 | 1262.25 | 1275.59 | 0.44 | 0.68 | white-bird-5-dpo-50step_v2 | 13B | white-bird/5_dpo_50step | white-bird-5-dpo-50step_v2 | 9175 | 376660 | 0.47 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/5_dpo_50step | 2025-03-02 | single | 1.26 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 14.0 | 1.0 | 1260.88 | 1275.59 | 0.47 | 0.68 | white-bird-7-dpo-step100_v2 | 13B | white-bird/7_dpo_step100 | white-bird-7-dpo-step100_v2 | 7766 | 376660 | 0.48 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/7_dpo_step100 | 2025-03-02 | single | 1.36 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 15.0 | 1.0 | 1259.57 | 1275.59 | 0.47 | 0.68 | white-bird-7-dpo-step100_v3 | 13B | white-bird/7_dpo_step100 | white-bird-7-dpo-step100_v3 | 7496 | 376660 | 0.48 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/7_dpo_step100 | 2025-03-02 | single | 1.34 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 16.0 | 1.0 | 1256.9 | 1275.59 | 0.47 | 0.68 | white-bird-2-dpo_v1 | 13B | white-bird/2_dpo | white-bird-2-dpo_v1 | 10378 | 376660 | 0.47 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/2_dpo | 2025-03-02 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 17.0 | 1.0 | 1256.87 | 1275.59 | 0.47 | 0.68 | white-bird-2-dpo_v2 | 13B | white-bird/2_dpo | white-bird-2-dpo_v2 | 8814 | 376660 | 0.47 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/2_dpo | 2025-03-02 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 18.0 | 1.0 | 1241.7 | 1275.59 | 0.6 | 0.68 | mistralai-mistral-nem_93303_v449 | 13B | mistralai/Mistral-Nemo-Instruct-2407 | bird_test | 10478 | 376660 | 0.45 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | mistralai/Mistral-Nemo-I | 2025-02-28 | single | 1.3 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 19.0 | 1.0 | 1239.63 | 1275.59 | 0.6 | 0.68 | white-bird-1-kto_v2 | 13B | white-bird/1_kto | white-bird-1-kto_v2 | 13649 | 376660 | 0.45 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_kto | 2025-03-02 | single | 1.3 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 20.0 | 1.0 | 1237.33 | 1275.59 | 0.6 | 0.68 | white-bird-1-kto_v1 | 13B | white-bird/1_kto | white-bird-1-kto_v1 | 9770 | 376660 | 0.45 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_kto | 2025-03-02 | single | 1.36 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 21.0 | 1.0 | 1234.11 | 1275.59 | 0.6 | 0.68 | mistralai-mistral-nem_93303_v448 | 13B | mistralai/Mistral-Nemo-Instruct-2407 | bird_nostop | 11536 | 376660 | 0.44 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | mistralai/Mistral-Nemo-I | 2025-02-28 | single | 1.35 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 22.0 | 1.0 | 1230.86 | 1275.59 | 0.63 | 0.68 | white-bird-1-sft-label1-200_v1 | 13B | white-bird/1_sft_label1_200 | white-bird-1-sft-label1-200_v1 | 10865 | 376660 | 0.44 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1_ | 2025-03-01 | single | 1.34 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 23.0 | 1.0 | 1229.74 | 1275.59 | 0.61 | 0.68 | white-bird-1-distill_v1 | 13B | white-bird/1_distill | white-bird-1-distill_v1 | 11848 | 376660 | 0.44 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_distill | 2025-03-01 | single | 1.29 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 24.0 | 1.0 | 1229.44 | 1275.59 | 0.63 | 0.68 | white-bird-1-sft-label1-400_v1 | 13B | white-bird/1_sft_label1_400 | white-bird-1-sft-label1-400_v1 | 8302 | 376660 | 0.44 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1_ | 2025-03-01 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 25.0 | 1.0 | 1225.21 | 1275.59 | 0.63 | 0.68 | white-bird-1-sft-label1-400_v2 | 13B | white-bird/1_sft_label1_400 | white-bird-1-sft-label1-400_v2 | 15091 | 376660 | 0.42 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1_ | 2025-03-01 | single | 1.39 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 26.0 | 1.0 | 1224.78 | 1275.59 | 0.63 | 0.68 | white-bird-1-sft-label1-708_v1 | 13B | white-bird/1_sft_label1_708 | white-bird-1-sft-label1-708_v1 | 13356 | 376660 | 0.43 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1_ | 2025-03-01 | single | 1.31 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 27.0 | 1.0 | 1224.68 | 1275.59 | 0.63 | 0.68 | white-bird-1-sft-label1_v2 | 13B | white-bird/1_sft_label1 | white-bird-1-sft-label1_v2 | 13161 | 376660 | 0.43 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1 | 2025-03-01 | single | 1.33 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 28.0 | 1.0 | 1224.05 | 1275.59 | 0.64 | 0.68 | white-bird-1-sft-label1-200_v3 | 13B | white-bird/1_sft_label1_200 | white-bird-1-sft-label1-200_v2 | 7409 | 376660 | 0.43 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1_ | 2025-03-01 | single | 1.34 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 29.0 | 1.0 | 1223.64 | 1275.59 | 0.61 | 0.68 | white-bird-1-sft-unpack_v1 | 13B | white-bird/1_sft_unpack | white-bird-1-sft-unpack_v1 | 10749 | 376660 | 0.43 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_unpack | 2025-03-01 | single | 1.36 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 30.0 | 1.0 | 1223.2 | 1275.59 | 0.63 | 0.68 | white-bird-1-sft-label1-400_v3 | 13B | white-bird/1_sft_label1_400 | white-bird-1-sft-label1-400_v3 | 9284 | 376660 | 0.43 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1_ | 2025-03-01 | single | 1.35 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 31.0 | 1.0 | 1221.89 | 1275.59 | 0.62 | 0.68 | white-bird-1-sft-label1_24791_v1 | 13B | white-bird/1_sft_label1_lora300 | white-bird-1-sft-label1_24791_v1 | 10868 | 376660 | 0.45 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1_ | 2025-03-01 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 32.0 | 1.0 | 1221.84 | 1275.59 | 0.63 | 0.68 | white-bird-1-sft-label1-lora_v2 | 13B | white-bird/1_sft_label1_lora | white-bird-1-sft-label1-lora_v2 | 9738 | 376660 | 0.43 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1_ | 2025-03-01 | single | 1.34 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 33.0 | 1.0 | 1221.67 | 1275.59 | 0.64 | 0.68 | white-bird-1-sft-label1-200_v2 | 13B | white-bird/1_sft_label1_200 | white-bird-1-sft-label1-200_v2 | 7026 | 376660 | 0.43 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1_ | 2025-03-01 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 34.0 | 1.0 | 1219.83 | 1275.59 | 0.63 | 0.68 | white-bird-1-sft-label4-diff_v1 | 13B | white-bird/1_sft_label4_diff | white-bird-1-sft-label4-diff_v1 | 9650 | 376660 | 0.42 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label4_ | 2025-03-01 | single | 1.32 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 35.0 | 1.0 | 1217.35 | 1275.59 | 0.63 | 0.68 | white-bird-1-sft-label1_v1 | 13B | white-bird/1_sft_label1 | white-bird-1-sft-label1_v1 | 11953 | 376660 | 0.41 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1 | 2025-03-01 | single | 1.34 | {'NVIDIA RTX A5000': 1} |
zhenzhe | 1 | 36.0 | 1.0 | 1125.3 | 1275.59 | 0.68 | 0.68 | white-bird-1-sft-label1-lora_v1 | 13B | white-bird/1_sft_label1_lora | white-bird-1-sft-label1-lora_v1 | 11473 | 376660 | 0.3 | 0.5 | basic | | 8 | 1024 | 64 | MistralForCausalLM | white-bird/1_sft_label1_ | 2025-03-01 | single | 1.34 | {'NVIDIA RTX A5000': 1} |