submission_id: function_fitos_2024-08-30
developer_uid: chai_backend_admin
alignment_samples: 12727
alignment_score: -1.098599392556389
celo_rating: 1222.57
display_name: elo_alignment_amd_calibrated
formatter: {'memory_template': "{bot_name}'s Persona: {memory}\n####\n", 'prompt_template': '{prompt}\n<START>\n', 'bot_template': '{bot_name}: {message}\n', 'user_template': '{user_name}: {message}\n', 'response_template': '{bot_name}:', 'truncate_by_message': False}
generation_params: {'temperature': 0.95, 'top_p': 1.0, 'min_p': 0.08, 'top_k': 40, 'presence_penalty': 0.0, 'frequency_penalty': 0.0, 'stopping_words': ['\n', '<|eot_id|>'], 'max_input_tokens': 512, 'best_of': 16, 'max_output_tokens': 64}
is_internal_developer: True
model_group:
model_name: elo_alignment_amd_calibrated
num_battles: 12727
num_wins: 6119
propriety_score: 0.7357830271216098
propriety_total_count: 1143.0
ranking_group: single
status: inactive
submission_type: function
timestamp: 2024-08-30T20:45:15+00:00
us_pacific_date: 2024-08-30
win_ratio: 0.48078887404730103
Download Preference Data
Resubmit model
Running pipeline stage StressChecker
Received healthy response to inference request in 2.659714460372925s
Received healthy response to inference request in 2.2468748092651367s
Received healthy response to inference request in 1.8163492679595947s
Received healthy response to inference request in 1.2137198448181152s
Received healthy response to inference request in 2.0833752155303955s
5 requests
0 failed requests
5th percentile: 1.3342457294464112
10th percentile: 1.4547716140747071
20th percentile: 1.6958233833312988
30th percentile: 1.8697544574737548
40th percentile: 1.9765648365020752
50th percentile: 2.0833752155303955
60th percentile: 2.148775053024292
70th percentile: 2.2141748905181884
80th percentile: 2.3294427394866943
90th percentile: 2.4945785999298096
95th percentile: 2.577146530151367
99th percentile: 2.6432008743286133
mean time: 2.0040067195892335
Pipeline stage StressChecker completed in 10.68s
function_fitos_2024-08-30 status is now deployed due to DeploymentManager action
function_fitos_2024-08-30 status is now inactive due to auto deactivation removed underperforming models

Usage Metrics

Latency Metrics