submission_id: function_sejub_2024-08-30
developer_uid: chai_backend_admin
alignment_samples: 3725
alignment_score: -0.7842482510062065
celo_rating: 1231.89
display_name: elo_alignment_amd_calibrated
formatter: {'memory_template': "{bot_name}'s Persona: {memory}\n####\n", 'prompt_template': '{prompt}\n<START>\n', 'bot_template': '{bot_name}: {message}\n', 'user_template': '{user_name}: {message}\n', 'response_template': '{bot_name}:', 'truncate_by_message': False}
generation_params: {'temperature': 0.95, 'top_p': 1.0, 'min_p': 0.08, 'top_k': 40, 'presence_penalty': 0.0, 'frequency_penalty': 0.0, 'stopping_words': ['\n', '<|eot_id|>'], 'max_input_tokens': 512, 'best_of': 16, 'max_output_tokens': 64}
is_internal_developer: True
model_group:
model_name: elo_alignment_amd_calibrated
num_battles: 3725
num_wins: 1844
propriety_score: 0.773972602739726
propriety_total_count: 292.0
ranking_group: single
status: inactive
submission_type: function
timestamp: 2024-08-30T20:09:05+00:00
us_pacific_date: 2024-08-30
win_ratio: 0.4950335570469799
Download Preference Data
Resubmit model
Running pipeline stage StressChecker
Received healthy response to inference request in 1.9191522598266602s
Received healthy response to inference request in 1.4042565822601318s
Received healthy response to inference request in 1.7390649318695068s
Received healthy response to inference request in 2.010519504547119s
Received healthy response to inference request in 1.4969465732574463s
5 requests
0 failed requests
5th percentile: 1.4227945804595947
10th percentile: 1.4413325786590576
20th percentile: 1.4784085750579834
30th percentile: 1.5453702449798583
40th percentile: 1.6422175884246826
50th percentile: 1.7390649318695068
60th percentile: 1.8110998630523683
70th percentile: 1.8831347942352294
80th percentile: 1.937425708770752
90th percentile: 1.9739726066589356
95th percentile: 1.9922460556030273
99th percentile: 2.0068648147583006
mean time: 1.7139879703521728
Pipeline stage StressChecker completed in 9.90s
function_sejub_2024-08-30 status is now deployed due to DeploymentManager action
function_sejub_2024-08-30 status is now inactive due to admin request

Usage Metrics

Latency Metrics