submission_id: function_lotar_2024-08-26
developer_uid: chai_backend_admin
alignment_samples: 2861
alignment_score: -1.2042395609665768
celo_rating: 1252.37
display_name: elo_alignment_coreweave_baseline
formatter: {'memory_template': "{bot_name}'s Persona: {memory}\n####\n", 'prompt_template': '{prompt}\n<START>\n', 'bot_template': '{bot_name}: {message}\n', 'user_template': '{user_name}: {message}\n', 'response_template': '{bot_name}:', 'truncate_by_message': False}
generation_params: {'temperature': 0.95, 'top_p': 1.0, 'min_p': 0.08, 'top_k': 40, 'presence_penalty': 0.0, 'frequency_penalty': 0.0, 'stopping_words': ['\n', '<|eot_id|>'], 'max_input_tokens': 512, 'best_of': 16, 'max_output_tokens': 64}
is_internal_developer: True
model_group:
model_name: elo_alignment_coreweave_baseline
num_battles: 2861
num_wins: 1489
propriety_score: 0.7615062761506276
propriety_total_count: 239.0
ranking_group: single
status: inactive
submission_type: function
timestamp: 2024-08-26T23:45:51+00:00
us_pacific_date: 2024-08-26
win_ratio: 0.5204473960153793
Download Preference Data
Resubmit model
Running pipeline stage StressChecker
Received healthy response to inference request in 3.0358500480651855s
Received healthy response to inference request in 4.7055487632751465s
Received healthy response to inference request in 3.5998239517211914s
Received healthy response to inference request in 5.5129663944244385s
Received healthy response to inference request in 2.987600564956665s
5 requests
0 failed requests
5th percentile: 2.997250461578369
10th percentile: 3.006900358200073
20th percentile: 3.0262001514434815
30th percentile: 3.1486448287963866
40th percentile: 3.3742343902587892
50th percentile: 3.5998239517211914
60th percentile: 4.042113876342773
70th percentile: 4.484403800964356
80th percentile: 4.867032289505005
90th percentile: 5.189999341964722
95th percentile: 5.35148286819458
99th percentile: 5.480669689178467
mean time: 3.9683579444885253
Pipeline stage StressChecker completed in 20.59s
function_lotar_2024-08-26 status is now deployed due to DeploymentManager action
function_lotar_2024-08-26 status is now inactive due to admin request

Usage Metrics

Latency Metrics