submission_id: rica40325-feedback-and-dpo_v1
developer_uid: rica40325
alignment_samples: 11447
alignment_score: 0.9017426032470925
best_of: 1
celo_rating: 1145.38
display_name: rica40325-feedback-and-dpo_v1
formatter: {'memory_template': "{bot_name}'s Persona: {memory}\n####\n", 'prompt_template': '{prompt}\n<START>\n', 'bot_template': '{bot_name}: {message}\n', 'user_template': '{user_name}: {message}\n', 'response_template': '{bot_name}:', 'truncate_by_message': False}
generation_params: {'temperature': 1.0, 'top_p': 1.0, 'min_p': 0.0, 'top_k': 40, 'presence_penalty': 0.0, 'frequency_penalty': 0.0, 'stopping_words': ['\n'], 'max_input_tokens': 512, 'best_of': 1, 'max_output_tokens': 64}
is_internal_developer: False
language_model: rica40325/feedback-and-dpo
max_input_tokens: 512
max_output_tokens: 64
model_architecture: LlamaForCausalLM
model_group: rica40325/feedback-and-d
model_name: rica40325-feedback-and-dpo_v1
model_num_parameters: 8030261248.0
model_repo: rica40325/feedback-and-dpo
model_size: 8B
num_battles: 11447
num_wins: 4285
propriety_score: 0.7393075356415478
propriety_total_count: 982.0
ranking_group: single
status: inactive
submission_type: basic
timestamp: 2024-09-01T07:57:36+00:00
us_pacific_date: 2024-09-01
win_ratio: 0.37433388660784483
Download Preference Data
Resubmit model