submission_id: zonemercy-lexical-nemo-_1518_v29
developer_uid: chai_backend_admin
best_of: 4
celo_rating: 1246.87
display_name: zonemercy-lexical-nemo-_1518_v29
family_friendly_score: 0.5698
family_friendly_standard_error: 0.007001827761377739
formatter: {'memory_template': "{bot_name}'s Persona: {memory}\n####\n", 'prompt_template': '{prompt}\n<START>\n', 'bot_template': '{bot_name}: {message}\n', 'user_template': '{user_name}: {message}\n', 'response_template': '{bot_name}:', 'truncate_by_message': False}
generation_params: {'temperature': 0.9, 'top_p': 1.0, 'min_p': 0.05, 'top_k': 80, 'presence_penalty': 0.0, 'frequency_penalty': 0.0, 'stopping_words': ['\n', '</s>', '###', 'Bot:', 'User:', 'You:', '<|im_end|>'], 'max_input_tokens': 1024, 'best_of': 4, 'max_output_tokens': 64}
gpu_counts: {'NVIDIA RTX A5000': 1}
is_internal_developer: True
language_model: zonemercy/Lexical-Nemo-v4-1k1e5
latencies: [{'batch_size': 1, 'throughput': 0.6323023174711848, 'latency_mean': 1.5814444065093993, 'latency_p50': 1.5912071466445923, 'latency_p90': 1.7214602947235107}, {'batch_size': 3, 'throughput': 1.2599087218434057, 'latency_mean': 2.369664821624756, 'latency_p50': 2.3558225631713867, 'latency_p90': 2.640217518806457}, {'batch_size': 5, 'throughput': 1.5733497382980175, 'latency_mean': 3.165028305053711, 'latency_p50': 3.165925621986389, 'latency_p90': 3.5572864294052122}, {'batch_size': 6, 'throughput': 1.6890897142858523, 'latency_mean': 3.5318483412265778, 'latency_p50': 3.503597855567932, 'latency_p90': 4.006222939491272}, {'batch_size': 8, 'throughput': 1.8352528399343426, 'latency_mean': 4.321796709299088, 'latency_p50': 4.336133241653442, 'latency_p90': 4.873060321807861}, {'batch_size': 10, 'throughput': 1.9127450091975435, 'latency_mean': 5.196655564308166, 'latency_p50': 5.186009645462036, 'latency_p90': 5.903792881965638}]
max_input_tokens: 1024
max_output_tokens: 64
model_architecture: MistralForCausalLM
model_group: zonemercy/Lexical-Nemo-v
model_name: zonemercy-lexical-nemo-_1518_v29
model_num_parameters: 12772070400.0
model_repo: zonemercy/Lexical-Nemo-v4-1k1e5
model_size: 13B
num_battles: 16013
num_wins: 8317
ranking_group: single
status: inactive
submission_type: basic
throughput_3p7s: 1.74
timestamp: 2024-11-11T18:07:27+00:00
us_pacific_date: 2024-11-11
win_ratio: 0.5193904952226316
Resubmit model
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline %s
run pipeline stage %s
Running pipeline stage MKMLizer
Starting job with name zonemercy-lexical-nemo-1518-v29-mkmlizer
Waiting for job on zonemercy-lexical-nemo-1518-v29-mkmlizer to finish
zonemercy-lexical-nemo-1518-v29-mkmlizer: ╔═════════════════════════════════════════════════════════════════════╗
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ _____ __ __ ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ / _/ /_ ___ __/ / ___ ___ / / ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ / _/ / // / |/|/ / _ \/ -_) -_) / ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ /_//_/\_, /|__,__/_//_/\__/\__/_/ ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ /___/ ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ Version: 0.11.33 ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ Copyright 2023 MK ONE TECHNOLOGIES Inc. ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ https://mk1.ai ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ The license key for the current software has been verified as ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ belonging to: ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ Chai Research Corp. ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ Account ID: 7997a29f-0ceb-4cc7-9adf-840c57b4ae6f ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ Expiration: 2025-01-15 23:59:59 ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ║ ║
zonemercy-lexical-nemo-1518-v29-mkmlizer: ╚═════════════════════════════════════════════════════════════════════╝
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
zonemercy-lexical-nemo-1518-v29-mkmlizer: Downloaded to shared memory in 310.232s
zonemercy-lexical-nemo-1518-v29-mkmlizer: quantizing model to /dev/shm/model_cache, profile:s0, folder:/tmp/tmpmog6n7kc, device:0
zonemercy-lexical-nemo-1518-v29-mkmlizer: Saving flywheel model at /dev/shm/model_cache
zonemercy-lexical-nemo-1518-v29-mkmlizer: quantized model in 49.752s
zonemercy-lexical-nemo-1518-v29-mkmlizer: Processed model zonemercy/Lexical-Nemo-v4-1k1e5 in 359.984s
zonemercy-lexical-nemo-1518-v29-mkmlizer: creating bucket guanaco-mkml-models
zonemercy-lexical-nemo-1518-v29-mkmlizer: Bucket 's3://guanaco-mkml-models/' created
zonemercy-lexical-nemo-1518-v29-mkmlizer: uploading /dev/shm/model_cache to s3://guanaco-mkml-models/zonemercy-lexical-nemo-1518-v29
zonemercy-lexical-nemo-1518-v29-mkmlizer: cp /dev/shm/model_cache/config.json s3://guanaco-mkml-models/zonemercy-lexical-nemo-1518-v29/config.json
zonemercy-lexical-nemo-1518-v29-mkmlizer: cp /dev/shm/model_cache/special_tokens_map.json s3://guanaco-mkml-models/zonemercy-lexical-nemo-1518-v29/special_tokens_map.json
zonemercy-lexical-nemo-1518-v29-mkmlizer: cp /dev/shm/model_cache/tokenizer_config.json s3://guanaco-mkml-models/zonemercy-lexical-nemo-1518-v29/tokenizer_config.json
zonemercy-lexical-nemo-1518-v29-mkmlizer: cp /dev/shm/model_cache/tokenizer.json s3://guanaco-mkml-models/zonemercy-lexical-nemo-1518-v29/tokenizer.json
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
zonemercy-lexical-nemo-1518-v29-mkmlizer: cp /dev/shm/model_cache/flywheel_model.0.safetensors s3://guanaco-mkml-models/zonemercy-lexical-nemo-1518-v29/flywheel_model.0.safetensors
zonemercy-lexical-nemo-1518-v29-mkmlizer: Loading 0: 0%| | 0/363 [00:00<?, ?it/s] Loading 0: 1%| | 4/363 [00:00<00:16, 22.30it/s] Loading 0: 2%|▏ | 7/363 [00:00<00:20, 17.33it/s] Loading 0: 3%|▎ | 10/363 [00:00<00:20, 17.17it/s] Loading 0: 4%|▎ | 13/363 [00:00<00:21, 16.66it/s] Loading 0: 4%|▍ | 15/363 [00:00<00:23, 14.89it/s] Loading 0: 5%|▌ | 19/363 [00:01<00:19, 17.44it/s] Loading 0: 6%|▌ | 22/363 [00:01<00:18, 18.44it/s] Loading 0: 7%|▋ | 24/363 [00:01<00:23, 14.23it/s] Loading 0: 7%|▋ | 26/363 [00:01<00:28, 12.00it/s] Loading 0: 8%|▊ | 30/363 [00:01<00:20, 15.92it/s] Loading 0: 9%|▉ | 32/363 [00:02<00:26, 12.58it/s] Loading 0: 10%|█ | 37/363 [00:02<00:19, 17.14it/s] Loading 0: 11%|█ | 39/363 [00:02<00:18, 17.51it/s] Loading 0: 11%|█▏ | 41/363 [00:02<00:23, 13.76it/s] Loading 0: 13%|█▎ | 46/363 [00:02<00:17, 18.24it/s] Loading 0: 13%|█▎ | 49/363 [00:03<00:17, 17.89it/s] Loading 0: 14%|█▍ | 51/363 [00:03<00:19, 16.37it/s] Loading 0: 15%|█▌ | 55/363 [00:03<00:16, 18.73it/s] Loading 0: 16%|█▌ | 57/363 [00:03<00:16, 18.75it/s] Loading 0: 17%|█▋ | 60/363 [00:03<00:15, 19.14it/s] Loading 0: 17%|█▋ | 62/363 [00:03<00:21, 14.29it/s] Loading 0: 18%|█▊ | 64/363 [00:04<00:25, 11.70it/s] Loading 0: 19%|█▉ | 69/363 [00:04<00:18, 16.31it/s] Loading 0: 20%|█▉ | 71/363 [00:04<00:17, 16.87it/s] Loading 0: 20%|██ | 73/363 [00:04<00:19, 14.94it/s] Loading 0: 21%|██ | 76/363 [00:04<00:18, 15.31it/s] Loading 0: 21%|██▏ | 78/363 [00:04<00:19, 14.39it/s] Loading 0: 23%|██▎ | 82/363 [00:05<00:16, 17.44it/s] Loading 0: 23%|██▎ | 84/363 [00:05<00:15, 17.66it/s] Loading 0: 24%|██▎ | 86/363 [00:05<00:20, 13.53it/s] Loading 0: 25%|██▌ | 91/363 [00:05<00:15, 18.11it/s] Loading 0: 26%|██▌ | 94/363 [00:05<00:15, 17.32it/s] Loading 0: 26%|██▋ | 96/363 [00:05<00:17, 15.68it/s] Loading 0: 28%|██▊ | 100/363 [00:06<00:14, 18.36it/s] Loading 0: 28%|██▊ | 102/363 [00:06<00:18, 14.21it/s] Loading 0: 29%|██▊ | 104/363 [00:06<00:22, 11.63it/s] Loading 0: 30%|███ | 109/363 [00:06<00:15, 16.01it/s] Loading 0: 31%|███ | 111/363 [00:06<00:15, 16.57it/s] Loading 0: 31%|███ | 113/363 [00:07<00:19, 13.02it/s] Loading 0: 33%|███▎ | 118/363 [00:07<00:14, 17.24it/s] Loading 0: 33%|███▎ | 121/363 [00:07<00:14, 17.00it/s] Loading 0: 34%|███▍ | 123/363 [00:07<00:15, 15.32it/s] Loading 0: 35%|███▍ | 127/363 [00:07<00:13, 17.75it/s] Loading 0: 36%|███▌ | 129/363 [00:08<00:13, 17.96it/s] Loading 0: 36%|███▌ | 131/363 [00:08<00:16, 13.78it/s] Loading 0: 37%|███▋ | 136/363 [00:08<00:12, 18.53it/s] Loading 0: 38%|███▊ | 139/363 [00:08<00:10, 20.66it/s] Loading 0: 39%|███▉ | 142/363 [00:08<00:13, 16.63it/s] Loading 0: 40%|███▉ | 144/363 [00:08<00:14, 15.24it/s] Loading 0: 41%|████ | 149/363 [00:09<00:12, 17.83it/s] Loading 0: 42%|████▏ | 154/363 [00:09<00:09, 22.86it/s] Loading 0: 44%|████▎ | 158/363 [00:09<00:09, 21.27it/s] Loading 0: 45%|████▍ | 163/363 [00:09<00:07, 25.71it/s] Loading 0: 46%|████▌ | 166/363 [00:09<00:07, 26.56it/s] Loading 0: 47%|████▋ | 169/363 [00:09<00:07, 24.97it/s] Loading 0: 47%|████▋ | 172/363 [00:10<00:07, 25.38it/s] Loading 0: 48%|████▊ | 176/363 [00:10<00:08, 22.05it/s] Loading 0: 50%|████▉ | 181/363 [00:10<00:06, 26.33it/s] Loading 0: 51%|█████ | 184/363 [00:10<00:09, 18.65it/s] Loading 0: 52%|█████▏ | 187/363 [00:10<00:09, 18.99it/s] Loading 0: 52%|█████▏ | 190/363 [00:10<00:08, 20.49it/s] Loading 0: 53%|█████▎ | 194/363 [00:11<00:08, 19.64it/s] Loading 0: 55%|█████▍ | 199/363 [00:11<00:06, 24.42it/s] Loading 0: 56%|█████▌ | 202/363 [00:11<00:06, 25.45it/s] Loading 0: 56%|█████▋ | 205/363 [00:11<00:06, 24.50it/s] Loading 0: 57%|█████▋ | 208/363 [00:11<00:06, 24.97it/s] Loading 0: 58%|█████▊ | 212/363 [00:11<00:07, 21.41it/s] Loading 0: 60%|█████▉ | 217/363 [00:11<00:05, 25.40it/s] Loading 0: 61%|██████ | 222/363 [00:12<00:05, 25.37it/s] Loading 0: 62%|██████▏ | 225/363 [00:12<00:09, 15.31it/s] Loading 0: 63%|██████▎ | 229/363 [00:12<00:07, 18.74it/s] Loading 0: 64%|██████▍ | 232/363 [00:12<00:06, 18.87it/s] Loading 0: 65%|██████▍ | 235/363 [00:13<00:06, 20.29it/s] Loading 0: 66%|██████▌ | 239/363 [00:13<00:06, 19.24it/s] Loading 0: 67%|██████▋ | 244/363 [00:13<00:05, 23.57it/s] Loading 0: 68%|██████▊ | 247/363 [00:13<00:04, 24.72it/s] Loading 0: 69%|██████▉ | 250/363 [00:13<00:04, 23.44it/s] Loading 0: 70%|██████▉ | 253/363 [00:13<00:04, 23.54it/s] Loading 0: 71%|███████ | 256/363 [00:13<00:04, 24.89it/s] Loading 0: 71%|███████▏ | 259/363 [00:14<00:04, 23.80it/s] Loading 0: 72%|███████▏ | 262/363 [00:14<00:04, 24.14it/s] Loading 0: 73%|███████▎ | 265/363 [00:14<00:06, 16.08it/s] Loading 0: 74%|███████▍ | 268/363 [00:14<00:05, 17.29it/s] Loading 0: 75%|███████▍ | 271/363 [00:14<00:04, 18.79it/s] Loading 0: 75%|███████▌ | 274/363 [00:14<00:04, 20.96it/s] Loading 0: 76%|███████▋ | 277/363 [00:14<00:04, 21.06it/s] Loading 0: 77%|███████▋ | 280/363 [00:15<00:03, 21.97it/s] Loading 0: 78%|███████▊ | 283/363 [00:15<00:03, 23.33it/s] Loading 0: 79%|███████▉ | 286/363 [00:15<00:03, 22.62it/s] Loading 0: 80%|███████▉ | 289/363 [00:15<00:03, 23.19it/s] Loading 0: 81%|████████ | 293/363 [00:15<00:03, 21.09it/s] Loading 0: 82%|████████▏ | 298/363 [00:15<00:02, 26.69it/s] Loading 0: 83%|████████▎ | 303/363 [00:15<00:02, 27.95it/s] Loading 0: 84%|████████▍ | 306/363 [00:16<00:03, 17.87it/s] Loading 0: 86%|████████▌ | 311/363 [00:16<00:02, 19.80it/s] Loading 0: 88%|████████▊ | 318/363 [00:16<00:01, 26.10it/s] Loading 0: 89%|████████▊ | 322/363 [00:16<00:01, 25.62it/s] Loading 0: 90%|████████▉ | 325/363 [00:16<00:01, 25.14it/s] Loading 0: 90%|█████████ | 328/363 [00:17<00:01, 25.33it/s] Loading 0: 91%|█████████ | 331/363 [00:17<00:01, 24.33it/s] Loading 0: 92%|█████████▏| 334/363 [00:17<00:01, 25.55it/s] Loading 0: 93%|█████████▎| 337/363 [00:17<00:00, 26.51it/s] Loading 0: 94%|█████████▎| 340/363 [00:17<00:00, 24.00it/s] Loading 0: 94%|█████████▍| 343/363 [00:17<00:00, 24.80it/s] Loading 0: 95%|█████████▌| 346/363 [00:25<00:13, 1.29it/s] Loading 0: 96%|█████████▌| 348/363 [00:25<00:09, 1.60it/s] Loading 0: 97%|█████████▋| 353/363 [00:25<00:03, 2.73it/s] Loading 0: 98%|█████████▊| 356/363 [00:25<00:01, 3.60it/s] Loading 0: 99%|█████████▉| 359/363 [00:26<00:00, 4.70it/s] Loading 0: 100%|█████████▉| 362/363 [00:26<00:00, 6.17it/s]
Job zonemercy-lexical-nemo-1518-v29-mkmlizer completed after 390.5s with status: succeeded
Stopping job with name zonemercy-lexical-nemo-1518-v29-mkmlizer
Pipeline stage MKMLizer completed in 391.02s
run pipeline stage %s
Running pipeline stage MKMLTemplater
Pipeline stage MKMLTemplater completed in 0.17s
run pipeline stage %s
Running pipeline stage MKMLDeployer
Creating inference service zonemercy-lexical-nemo-1518-v29
Waiting for inference service zonemercy-lexical-nemo-1518-v29 to be ready
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Inference service zonemercy-lexical-nemo-1518-v29 ready after 190.71319842338562s
Pipeline stage MKMLDeployer completed in 191.28s
run pipeline stage %s
Running pipeline stage StressChecker
Received healthy response to inference request in 2.061600685119629s
Received healthy response to inference request in 1.573612928390503s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Received healthy response to inference request in 1.4395091533660889s
Received healthy response to inference request in 1.506108045578003s
Received healthy response to inference request in 1.50819730758667s
5 requests
0 failed requests
5th percentile: 1.4528289318084717
10th percentile: 1.4661487102508546
20th percentile: 1.49278826713562
30th percentile: 1.5065258979797362
40th percentile: 1.507361602783203
50th percentile: 1.50819730758667
60th percentile: 1.5343635559082032
70th percentile: 1.5605298042297364
80th percentile: 1.6712104797363283
90th percentile: 1.8664055824279786
95th percentile: 1.9640031337738035
99th percentile: 2.042081174850464
mean time: 1.6178056240081786
Pipeline stage StressChecker completed in 9.63s
run pipeline stage %s
Running pipeline stage OfflineFamilyFriendlyTriggerPipeline
run_pipeline:run_in_cloud %s
starting trigger_guanaco_pipeline args=%s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
triggered trigger_guanaco_pipeline args=%s
Pipeline stage OfflineFamilyFriendlyTriggerPipeline completed in 5.65s
run pipeline stage %s
Running pipeline stage TriggerMKMLProfilingPipeline
run_pipeline:run_in_cloud %s
starting trigger_guanaco_pipeline args=%s
triggered trigger_guanaco_pipeline args=%s
Pipeline stage TriggerMKMLProfilingPipeline completed in 2.16s
Shutdown handler de-registered
zonemercy-lexical-nemo-_1518_v29 status is now deployed due to DeploymentManager action
Shutdown handler registered
run pipeline %s
run pipeline stage %s
Running pipeline stage OfflineFamilyFriendlyScorer
Evaluating %s Family Friendly Score with %s threads
Pipeline stage OfflineFamilyFriendlyScorer completed in 2590.03s
Shutdown handler de-registered
zonemercy-lexical-nemo-_1518_v29 status is now inactive due to auto deactivation removed underperforming models