---
# Metadata record for a single model submission.
#
# NOTE(review): the nested values below (generation_params, formatter,
# reward_formatter) were originally written as Python dict reprs on one
# line. They have been converted to block-style YAML. Strings containing
# backslash escapes are double-quoted so that "\n" loads as a newline
# (single-quoted YAML scalars keep the backslash literally) -- confirm
# that newline is what the consumer expects.

# --- Identity -------------------------------------------------------------
submission_id: hastagaras-l3-cukai-8b-dpo_v1
developer_uid: Hastagaras
status: inactive
model_repo: Hastagaras/L3-Cukai-8B-DPO
reward_repo: ChaiML/reward_gpt2_medium_preference_24m_e2

# --- Generation settings --------------------------------------------------
generation_params:
  temperature: 0.85
  top_p: 1.0
  min_p: 0.0
  top_k: 40
  presence_penalty: 0.0
  frequency_penalty: 1.05
  stopping_words:
    - "\n"
    - '###'
    - '</s>'
    - '<|eot_id|>'
  max_input_tokens: 512
  best_of: 16
  max_output_tokens: 64

# --- Prompt templates for the language model -------------------------------
# Placeholders in braces ({bot_name}, {user_name}, {memory}, {prompt},
# {message}) are kept verbatim; they are quoted so YAML does not read the
# braces as a flow mapping.
formatter:
  memory_template: "Write {bot_name}'s next reply in a fictional roleplay chat between {user_name} and {bot_name}.\n\n{memory}"
  prompt_template: "\n\n### Response:\n{bot_name}: {prompt}<|end_of_text|>"
  bot_template: "\n\n### Response:\n{bot_name}: {message}<|end_of_text|>"
  user_template: "\n\n### Instruction:\n{user_name}: {message}"
  response_template: "\n\n### Response:\n{bot_name}:"
  truncate_by_message: false

# --- Prompt templates for the reward model ---------------------------------
reward_formatter:
  memory_template: "{bot_name}'s Persona: {memory}\n####\n"
  prompt_template: "{bot_name}: {prompt}\n"
  bot_template: "{bot_name}: {message}\n"
  user_template: "{user_name}: {message}\n"
  response_template: '{bot_name}:'
  truncate_by_message: false

# --- Submission bookkeeping ------------------------------------------------
# Quoted so loaders keep the timestamp as a string instead of implicitly
# converting it to a datetime object.
timestamp: '2024-04-25T17:29:27+00:00'
model_name: hastagaras-l3-cukai-8b-dpo_v1
model_eval_status: success
model_group: Hastagaras/L3-Cukai-8B-D

# --- Feedback and battle results -------------------------------------------
double_thumbs_up: 0
thumbs_up: 0
thumbs_down: 0
num_battles: 7167
num_wins: 4153
celo_rating: 1206.35
entertaining: 6.92
stay_in_character: 8.69
user_preference: 7.4
safety_score: 0.84
propriety_score: 0.0
# Python `None` in the original; written as YAML null so it does not load
# as the string "None".
propriety_total_count: null

# --- Model description -----------------------------------------------------
submission_type: basic
model_architecture: LlamaForCausalLM
model_num_parameters: 8030261248.0
# The next three keys repeat values that also appear under generation_params.
best_of: 16
max_input_tokens: 512
max_output_tokens: 64
display_name: hastagaras-l3-cukai-8b-dpo_v1
double_thumbs_up_ratio: null
feedback_count: 0
ineligible_reason: null
language_model: Hastagaras/L3-Cukai-8B-DPO
model_score: 7.669999999999999
model_size: 8B
reward_model: ChaiML/reward_gpt2_medium_preference_24m_e2
single_thumbs_up_ratio: null
thumbs_down_ratio: null
thumbs_up_ratio: null
# Quoted so loaders keep the date as a string instead of a date object.
us_pacific_date: '2024-04-25'
win_ratio: 0.5794614203990512

# NOTE(review): the original file ended with the bare line "Resubmit model".
# It is not a key/value pair and makes the document unparseable as YAML; it
# looks like captured UI text. Preserved here as a comment -- confirm it can
# be dropped.
# Resubmit model