submission_id: mistralai-mixtral-8x7b_3473_v133
developer_uid: azuruce
alignment_samples: 11689
alignment_score: 0.05341537525215034
best_of: 4
celo_rating: 1196.64
display_name: mixtral-8x7_3473_v130
formatter: {'memory_template': '<s>[INST] This is an entertaining conversation. You are {bot_name} who has the persona: {memory}.\nEngage in a chat with {user_name} while staying in character. Try to flirt with {user_name}. Engage in *roleplay* actions. Describe the scene dramatically. \n', 'prompt_template': '{prompt}\n', 'bot_template': '{bot_name}: {message}</s>', 'user_template': '[INST] {user_name}: {message} [/INST]', 'response_template': '{bot_name}:', 'truncate_by_message': False}
generation_params: {'temperature': 0.9, 'top_p': 1.0, 'min_p': 0.0, 'top_k': 50, 'presence_penalty': 0.5, 'frequency_penalty': 0.5, 'stopping_words': ['\n', '</s>', '<|user|>', '###'], 'max_input_tokens': 512, 'best_of': 4, 'max_output_tokens': 64}
gpu_counts: {'NVIDIA A100-SXM4-80GB': 1}
is_internal_developer: True
language_model: mistralai/Mixtral-8x7B-Instruct-v0.1
latencies: [{'batch_size': 1, 'throughput': 0.47181477055952387, 'latency_mean': 2.119407205581665, 'latency_p50': 2.0871907472610474, 'latency_p90': 2.4152173519134523}, {'batch_size': 5, 'throughput': 1.3978100763071002, 'latency_mean': 3.5456458735466003, 'latency_p50': 3.546334743499756, 'latency_p90': 3.951930046081543}, {'batch_size': 10, 'throughput': 2.4230524937793834, 'latency_mean': 4.075820286273956, 'latency_p50': 4.048440098762512, 'latency_p90': 4.570410919189453}, {'batch_size': 15, 'throughput': 3.175168042994806, 'latency_mean': 4.590426172018051, 'latency_p50': 4.560545206069946, 'latency_p90': 5.2239577054977415}, {'batch_size': 20, 'throughput': 3.730100507939458, 'latency_mean': 5.220640211105347, 'latency_p50': 5.196094036102295, 'latency_p90': 5.989784622192383}]
max_input_tokens: 512
max_output_tokens: 64
model_architecture: MixtralForCausalLM
model_group: mistralai/Mixtral-8x7B-I
model_name: mixtral-8x7_3473_v130
model_num_parameters: 46702792704.0
model_repo: mistralai/Mixtral-8x7B-Instruct-v0.1
model_size: 47B
num_battles: 11689
num_wins: 5182
propriety_score: 0.7680872150644202
propriety_total_count: 1009.0
ranking_group: single
status: inactive
submission_type: basic
throughput_3p7s: 1.74
timestamp: 2024-09-04T21:28:29+00:00
us_pacific_date: 2024-09-04
win_ratio: 0.4433227821028317
Download Preference Data
Resubmit model
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline %s
run pipeline stage %s
Running pipeline stage MKMLizer
Starting job with name mistralai-mixtral-8x7b-3473-v133-mkmlizer
Waiting for job on mistralai-mixtral-8x7b-3473-v133-mkmlizer to finish
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ╔═════════════════════════════════════════════════════════════════════╗
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ _____ __ __ ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ / _/ /_ ___ __/ / ___ ___ / / ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ / _/ / // / |/|/ / _ \/ -_) -_) / ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ /_//_/\_, /|__,__/_//_/\__/\__/_/ ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ /___/ ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ Version: 0.10.1 ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ Copyright 2023 MK ONE TECHNOLOGIES Inc. ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ https://mk1.ai ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ The license key for the current software has been verified as ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ belonging to: ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ Chai Research Corp. ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ Account ID: 7997a29f-0ceb-4cc7-9adf-840c57b4ae6f ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ Expiration: 2024-10-15 23:59:59 ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ║ ║
mistralai-mixtral-8x7b-3473-v133-mkmlizer: ╚═════════════════════════════════════════════════════════════════════╝
mistralai-mixtral-8x7b-3473-v133-mkmlizer: Downloaded to shared memory in 330.263s
mistralai-mixtral-8x7b-3473-v133-mkmlizer: quantizing model to /dev/shm/model_cache, profile:s0, folder:/tmp/tmp3p0swjad, device:0
mistralai-mixtral-8x7b-3473-v133-mkmlizer: Saving flywheel model at /dev/shm/model_cache
mistralai-mixtral-8x7b-3473-v133-mkmlizer: creating bucket guanaco-mkml-models
mistralai-mixtral-8x7b-3473-v133-mkmlizer: Bucket 's3://guanaco-mkml-models/' created
mistralai-mixtral-8x7b-3473-v133-mkmlizer: uploading /dev/shm/model_cache to s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v133
mistralai-mixtral-8x7b-3473-v133-mkmlizer: cp /dev/shm/model_cache/config.json s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v133/config.json
mistralai-mixtral-8x7b-3473-v133-mkmlizer: cp /dev/shm/model_cache/tokenizer_config.json s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v133/tokenizer_config.json
mistralai-mixtral-8x7b-3473-v133-mkmlizer: cp /dev/shm/model_cache/special_tokens_map.json s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v133/special_tokens_map.json
mistralai-mixtral-8x7b-3473-v133-mkmlizer: cp /dev/shm/model_cache/tokenizer.model s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v133/tokenizer.model
mistralai-mixtral-8x7b-3473-v133-mkmlizer: cp /dev/shm/model_cache/tokenizer.json s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v133/tokenizer.json
mistralai-mixtral-8x7b-3473-v133-mkmlizer: cp /dev/shm/model_cache/flywheel_model.3.safetensors s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v133/flywheel_model.3.safetensors
mistralai-mixtral-8x7b-3473-v133-mkmlizer: cp /dev/shm/model_cache/flywheel_model.0.safetensors s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v133/flywheel_model.0.safetensors
mistralai-mixtral-8x7b-3473-v133-mkmlizer: cp /dev/shm/model_cache/flywheel_model.1.safetensors s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v133/flywheel_model.1.safetensors
mistralai-mixtral-8x7b-3473-v133-mkmlizer: cp /dev/shm/model_cache/flywheel_model.2.safetensors s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v133/flywheel_model.2.safetensors
mistralai-mixtral-8x7b-3473-v133-mkmlizer: Loading 0: 0%| | 0/995 [00:00<?, ?it/s] Loading 0: 0%| | 4/995 [00:00<00:29, 33.04it/s] Loading 0: 1%| | 8/995 [00:00<00:31, 31.78it/s] Loading 0: 1%| | 12/995 [00:00<00:31, 31.30it/s] Loading 0: 2%|▏ | 16/995 [00:00<00:38, 25.59it/s] Loading 0: 2%|▏ | 19/995 [00:00<00:38, 25.66it/s] Loading 0: 2%|▏ | 22/995 [00:00<00:37, 26.24it/s] Loading 0: 3%|▎ | 25/995 [00:00<00:37, 25.61it/s] Loading 0: 3%|▎ | 33/995 [00:01<00:23, 40.09it/s] Loading 0: 4%|▍ | 38/995 [00:01<00:28, 33.41it/s] Loading 0: 4%|▍ | 42/995 [00:01<00:29, 32.21it/s] Loading 0: 5%|▍ | 46/995 [00:01<00:30, 31.24it/s] Loading 0: 5%|▌ | 52/995 [00:01<00:38, 24.79it/s] Loading 0: 6%|▌ | 55/995 [00:01<00:38, 24.62it/s] Loading 0: 6%|▌ | 58/995 [00:02<00:37, 25.12it/s] Loading 0: 6%|▌ | 61/995 [00:02<00:37, 25.01it/s] Loading 0: 7%|▋ | 66/995 [00:02<00:31, 29.87it/s] Loading 0: 7%|▋ | 70/995 [00:02<00:32, 28.73it/s] Loading 0: 7%|▋ | 74/995 [00:02<00:32, 28.55it/s] Loading 0: 8%|▊ | 77/995 [00:02<00:32, 28.00it/s] Loading 0: 8%|▊ | 80/995 [00:02<00:32, 27.79it/s] Loading 0: 8%|▊ | 83/995 [00:02<00:33, 27.02it/s] Loading 0: 9%|▊ | 86/995 [00:03<00:33, 26.98it/s] Loading 0: 9%|▉ | 94/995 [00:03<00:25, 35.70it/s] Loading 0: 10%|▉ | 98/995 [00:03<00:26, 34.11it/s] Loading 0: 10%|█ | 102/995 [00:03<00:25, 34.57it/s] Loading 0: 11%|█ | 107/995 [00:03<00:31, 28.05it/s] Loading 0: 11%|█ | 110/995 [00:03<00:32, 27.59it/s] Loading 0: 11%|█▏ | 113/995 [00:03<00:32, 27.53it/s] Loading 0: 12%|█▏ | 116/995 [00:04<00:32, 26.69it/s] Loading 0: 12%|█▏ | 119/995 [00:04<00:33, 26.23it/s] Loading 0: 12%|█▏ | 122/995 [00:04<00:33, 25.71it/s] Loading 0: 13%|█▎ | 126/995 [00:04<00:30, 28.75it/s] Loading 0: 13%|█▎ | 129/995 [00:04<00:34, 25.28it/s] Loading 0: 13%|█▎ | 132/995 [00:04<00:34, 25.11it/s] Loading 0: 14%|█▎ | 135/995 [00:04<00:34, 25.05it/s] Loading 0: 14%|█▍ | 138/995 [00:04<00:34, 24.86it/s] Loading 0: 14%|█▍ | 141/995 [00:05<00:33, 25.22it/s] Loading 0: 14%|█▍ | 144/995 [00:05<00:33, 25.22it/s] Loading 0: 15%|█▍ | 147/995 [00:05<00:33, 25.05it/s] Loading 0: 15%|█▌ | 151/995 [00:05<00:29, 28.95it/s] Loading 0: 16%|█▌ | 161/995 [00:05<00:19, 42.84it/s] Loading 0: 17%|█▋ | 166/995 [00:05<00:28, 28.98it/s] Loading 0: 17%|█▋ | 170/995 [00:06<00:31, 26.34it/s] Loading 0: 17%|█▋ | 173/995 [00:06<00:31, 26.42it/s] Loading 0: 18%|█▊ | 176/995 [00:06<00:31, 25.85it/s] Loading 0: 18%|█▊ | 179/995 [00:06<00:31, 25.92it/s] Loading 0: 18%|█▊ | 182/995 [00:06<00:31, 26.00it/s] Loading 0: 19%|█▊ | 185/995 [00:06<00:31, 25.71it/s] Loading 0: 19%|█▉ | 190/995 [00:06<00:26, 30.62it/s] Loading 0: 19%|█▉ | 194/995 [00:06<00:26, 30.27it/s] Loading 0: 20%|█▉ | 198/995 [00:06<00:26, 30.56it/s] Loading 0: 20%|██ | 202/995 [00:07<00:30, 26.39it/s] Loading 0: 21%|██ | 209/995 [00:07<00:22, 35.50it/s] Loading 0: 21%|██▏ | 213/995 [00:07<00:35, 22.11it/s] Loading 0: 22%|██▏ | 217/995 [00:07<00:31, 24.51it/s] Loading 0: 22%|██▏ | 221/995 [00:07<00:28, 26.80it/s] Loading 0: 23%|██▎ | 225/995 [00:08<00:27, 27.87it/s] Loading 0: 23%|██▎ | 229/995 [00:08<00:26, 29.11it/s] Loading 0: 23%|██▎ | 233/995 [00:08<00:28, 26.30it/s] Loading 0: 24%|██▎ | 236/995 [00:08<00:29, 26.01it/s] Loading 0: 24%|██▍ | 239/995 [00:08<00:29, 25.88it/s] Loading 0: 24%|██▍ | 242/995 [00:08<00:29, 25.53it/s] Loading 0: 25%|██▌ | 251/995 [00:08<00:18, 40.29it/s] Loading 0: 26%|██▌ | 256/995 [00:09<00:21, 33.63it/s] Loading 0: 26%|██▌ | 260/995 [00:09<00:21, 34.41it/s] Loading 0: 27%|██▋ | 265/995 [00:09<00:25, 28.81it/s] Loading 0: 27%|██▋ | 270/995 [00:09<00:22, 32.78it/s] Loading 0: 28%|██▊ | 274/995 [00:09<00:23, 30.33it/s] Loading 0: 28%|██▊ | 278/995 [00:09<00:24, 29.65it/s] Loading 0: 28%|██▊ | 282/995 [00:09<00:23, 29.91it/s] Loading 0: 28%|██▊ | 282/995 [00:20<00:23, 29.91it/s] Loading 0: 28%|██▊ | 283/995 [00:24<15:51, 1.34s/it] Loading 0: 29%|██▊ | 285/995 [00:24<12:42, 1.07s/it] Loading 0: 29%|██▉ | 288/995 [00:24<08:56, 1.32it/s] Loading 0: 29%|██▉ | 291/995 [00:24<06:23, 1.84it/s] Loading 0: 30%|██▉ | 294/995 [00:24<04:34, 2.55it/s] Loading 0: 30%|██▉ | 297/995 [00:24<03:19, 3.51it/s] Loading 0: 30%|███ | 300/995 [00:25<02:26, 4.75it/s] Loading 0: 30%|███ | 303/995 [00:25<01:49, 6.31it/s] Loading 0: 31%|███ | 306/995 [00:25<01:23, 8.22it/s] Loading 0: 31%|███ | 309/995 [00:25<01:06, 10.34it/s] Loading 0: 31%|███▏ | 312/995 [00:25<00:53, 12.68it/s] Loading 0: 32%|███▏ | 320/995 [00:25<00:37, 18.12it/s] Loading 0: 32%|███▏ | 323/995 [00:25<00:34, 19.59it/s] Loading 0: 33%|███▎ | 326/995 [00:26<00:31, 21.01it/s] Loading 0: 33%|███▎ | 329/995 [00:26<00:29, 22.41it/s] Loading 0: 33%|███▎ | 332/995 [00:26<00:28, 22.92it/s] Loading 0: 34%|███▎ | 335/995 [00:26<00:27, 23.92it/s] Loading 0: 34%|███▍ | 338/995 [00:26<00:27, 23.98it/s] Loading 0: 34%|███▍ | 343/995 [00:26<00:22, 29.23it/s] Loading 0: 35%|███▍ | 347/995 [00:26<00:21, 29.68it/s] Loading 0: 35%|███▌ | 351/995 [00:26<00:24, 26.39it/s] Loading 0: 36%|███▌ | 354/995 [00:27<00:24, 26.21it/s] Loading 0: 36%|███▌ | 357/995 [00:27<00:23, 26.61it/s] Loading 0: 36%|███▌ | 360/995 [00:27<00:23, 26.50it/s] Loading 0: 37%|███▋ | 367/995 [00:27<00:17, 36.43it/s] Loading 0: 37%|███▋ | 371/995 [00:27<00:27, 22.42it/s] Loading 0: 38%|███▊ | 376/995 [00:27<00:23, 26.80it/s] Loading 0: 38%|███▊ | 380/995 [00:27<00:22, 27.16it/s] Loading 0: 39%|███▊ | 384/995 [00:28<00:21, 27.93it/s] Loading 0: 39%|███▉ | 388/995 [00:28<00:24, 24.38it/s] Loading 0: 39%|███▉ | 391/995 [00:28<00:24, 24.42it/s] Loading 0: 40%|███▉ | 394/995 [00:28<00:24, 24.76it/s] Loading 0: 40%|███▉ | 397/995 [00:28<00:23, 25.25it/s] Loading 0: 41%|████ | 406/995 [00:28<00:14, 40.40it/s] Loading 0: 41%|████▏ | 411/995 [00:28<00:17, 33.87it/s] Loading 0: 42%|████▏ | 415/995 [00:29<00:17, 33.16it/s] Loading 0: 42%|████▏ | 419/995 [00:29<00:16, 34.11it/s] Loading 0: 43%|████▎ | 423/995 [00:29<00:22, 25.70it/s] Loading 0: 43%|████▎ | 427/995 [00:29<00:23, 23.79it/s] Loading 0: 43%|████▎ | 430/995 [00:29<00:23, 24.44it/s] Loading 0: 44%|████▎ | 433/995 [00:29<00:22, 25.18it/s] Loading 0: 44%|████▍ | 438/995 [00:30<00:18, 29.55it/s] Loading 0: 44%|████▍ | 442/995 [00:30<00:20, 26.51it/s] Loading 0: 45%|████▍ | 445/995 [00:30<00:21, 26.16it/s] Loading 0: 45%|████▌ | 448/995 [00:30<00:20, 26.47it/s] Loading 0: 45%|████▌ | 451/995 [00:30<00:20, 26.22it/s] Loading 0: 46%|████▌ | 454/995 [00:30<00:21, 25.54it/s] Loading 0: 46%|████▌ | 457/995 [00:30<00:20, 25.92it/s] Loading 0: 47%|████▋ | 464/995 [00:30<00:14, 37.16it/s] Loading 0: 47%|████▋ | 468/995 [00:30<00:14, 37.38it/s] Loading 0: 47%|████▋ | 472/995 [00:31<00:17, 30.02it/s] Loading 0: 48%|████▊ | 478/995 [00:31<00:18, 27.50it/s] Loading 0: 48%|████▊ | 482/995 [00:31<00:18, 27.83it/s] Loading 0: 49%|████▊ | 485/995 [00:31<00:18, 27.66it/s] Loading 0: 49%|████▉ | 488/995 [00:31<00:18, 27.65it/s] Loading 0: 49%|████▉ | 491/995 [00:31<00:18, 27.05it/s] Loading 0: 50%|████▉ | 494/995 [00:32<00:19, 26.27it/s] Loading 0: 50%|█████ | 498/995 [00:32<00:16, 29.67it/s] Loading 0: 50%|█████ | 502/995 [00:32<00:16, 29.35it/s] Loading 0: 51%|█████ | 506/995 [00:32<00:19, 25.65it/s] Loading 0: 51%|█████ | 509/995 [00:32<00:19, 25.34it/s] Loading 0: 51%|█████▏ | 512/995 [00:32<00:19, 25.39it/s] Loading 0: 52%|█████▏ | 515/995 [00:32<00:18, 25.66it/s] Loading 0: 52%|█████▏ | 518/995 [00:32<00:18, 25.42it/s] Loading 0: 53%|█████▎ | 525/995 [00:33<00:12, 36.16it/s] Loading 0: 53%|█████▎ | 529/995 [00:33<00:17, 26.22it/s] Loading 0: 54%|█████▎ | 533/995 [00:33<00:17, 26.85it/s] Loading 0: 54%|█████▍ | 537/995 [00:33<00:18, 24.75it/s] Loading 0: 54%|█████▍ | 540/995 [00:33<00:18, 24.81it/s] Loading 0: 55%|█████▍ | 543/995 [00:33<00:18, 24.49it/s] Loading 0: 55%|█████▍ | 546/995 [00:34<00:17, 24.95it/s] Loading 0: 55%|█████▌ | 549/995 [00:34<00:18, 24.55it/s] Loading 0: 55%|█████▌ | 552/995 [00:34<00:17, 24.75it/s] Loading 0: 56%|█████▋ | 561/995 [00:34<00:10, 40.47it/s] Loading 0: 57%|█████▋ | 566/995 [00:49<06:34, 1.09it/s] Loading 0: 57%|█████▋ | 569/995 [00:49<05:14, 1.36it/s] Loading 0: 58%|█████▊ | 573/995 [00:49<03:47, 1.85it/s] Loading 0: 58%|█████▊ | 577/995 [00:49<02:44, 2.55it/s] Loading 0: 58%|█████▊ | 581/995 [00:49<02:03, 3.36it/s] Loading 0: 59%|█████▊ | 584/995 [00:50<01:37, 4.22it/s] Loading 0: 59%|█████▉ | 587/995 [00:50<01:15, 5.38it/s] Loading 0: 59%|█████▉ | 591/995 [00:50<00:54, 7.46it/s] Loading 0: 60%|█████▉ | 595/995 [00:50<00:40, 9.84it/s] Loading 0: 60%|██████ | 599/995 [00:50<00:34, 11.59it/s] Loading 0: 61%|██████ | 602/995 [00:50<00:29, 13.47it/s] Loading 0: 61%|██████ | 605/995 [00:50<00:25, 15.22it/s] Loading 0: 61%|██████ | 608/995 [00:50<00:22, 17.20it/s] Loading 0: 61%|██████▏ | 611/995 [00:51<00:20, 19.02it/s] Loading 0: 62%|██████▏ | 614/995 [00:51<00:18, 20.86it/s] Loading 0: 63%|██████▎ | 622/995 [00:51<00:11, 33.34it/s] Loading 0: 63%|██████▎ | 627/995 [00:51<00:12, 29.21it/s] Loading 0: 63%|██████▎ | 631/995 [00:51<00:12, 29.99it/s] Loading 0: 64%|██████▍ | 636/995 [00:51<00:14, 24.19it/s] Loading 0: 64%|██████▍ | 639/995 [00:51<00:14, 24.22it/s] Loading 0: 65%|██████▍ | 642/995 [00:52<00:14, 24.08it/s] Loading 0: 65%|██████▍ | 645/995 [00:52<00:14, 24.61it/s] Loading 0: 65%|██████▌ | 648/995 [00:52<00:13, 25.11it/s] Loading 0: 66%|██████▌ | 653/995 [00:52<00:11, 30.27it/s] Loading 0: 66%|██████▌ | 657/995 [00:52<00:11, 29.86it/s] Loading 0: 66%|██████▋ | 661/995 [00:52<00:12, 25.89it/s] Loading 0: 67%|██████▋ | 664/995 [00:52<00:12, 25.97it/s] Loading 0: 67%|██████▋ | 667/995 [00:53<00:12, 25.43it/s] Loading 0: 67%|██████▋ | 670/995 [00:53<00:12, 25.27it/s] Loading 0: 68%|██████▊ | 673/995 [00:53<00:12, 25.15it/s] Loading 0: 68%|██████▊ | 676/995 [00:53<00:12, 25.44it/s] Loading 0: 69%|██████▉ | 685/995 [00:53<00:07, 41.24it/s] Loading 0: 69%|██████▉ | 691/995 [00:53<00:10, 30.11it/s] Loading 0: 70%|██████▉ | 695/995 [00:53<00:10, 29.41it/s] Loading 0: 70%|███████ | 699/995 [00:54<00:10, 29.33it/s] Loading 0: 71%|███████ | 703/995 [00:54<00:11, 26.46it/s] Loading 0: 71%|███████ | 706/995 [00:54<00:11, 25.22it/s] Loading 0: 71%|███████▏ | 709/995 [00:54<00:11, 25.73it/s] Loading 0: 72%|███████▏ | 712/995 [00:54<00:10, 25.82it/s] Loading 0: 72%|███████▏ | 717/995 [00:54<00:09, 30.37it/s] Loading 0: 72%|███████▏ | 721/995 [00:54<00:09, 29.32it/s] Loading 0: 73%|███████▎ | 725/995 [00:55<00:09, 29.89it/s] Loading 0: 73%|███████▎ | 729/995 [00:55<00:10, 26.36it/s] Loading 0: 74%|███████▎ | 732/995 [00:55<00:09, 26.53it/s] Loading 0: 74%|███████▍ | 739/995 [00:55<00:09, 26.35it/s] Loading 0: 75%|███████▍ | 742/995 [00:55<00:09, 26.07it/s] Loading 0: 75%|███████▍ | 746/995 [00:55<00:08, 28.92it/s] Loading 0: 75%|███████▌ | 750/995 [00:55<00:08, 29.41it/s] Loading 0: 76%|███████▌ | 754/995 [00:56<00:09, 25.94it/s] Loading 0: 76%|███████▌ | 757/995 [00:56<00:09, 25.89it/s] Loading 0: 76%|███████▋ | 760/995 [00:56<00:08, 26.29it/s] Loading 0: 77%|███████▋ | 763/995 [00:56<00:09, 25.70it/s] Loading 0: 77%|███████▋ | 766/995 [00:56<00:08, 25.65it/s] Loading 0: 77%|███████▋ | 769/995 [00:56<00:08, 25.63it/s] Loading 0: 78%|███████▊ | 778/995 [00:56<00:05, 41.48it/s] Loading 0: 79%|███████▊ | 783/995 [00:57<00:06, 32.88it/s] Loading 0: 79%|███████▉ | 787/995 [00:57<00:06, 32.56it/s] Loading 0: 80%|███████▉ | 793/995 [00:57<00:05, 35.01it/s] Loading 0: 80%|████████ | 797/995 [00:57<00:08, 24.52it/s] Loading 0: 80%|████████ | 800/995 [00:57<00:07, 24.88it/s] Loading 0: 81%|████████ | 803/995 [00:57<00:07, 24.75it/s] Loading 0: 81%|████████ | 808/995 [00:58<00:06, 28.84it/s] Loading 0: 82%|████████▏ | 812/995 [00:58<00:06, 28.83it/s] Loading 0: 82%|████████▏ | 816/995 [00:58<00:07, 25.41it/s] Loading 0: 82%|████████▏ | 819/995 [00:58<00:06, 25.75it/s] Loading 0: 83%|████████▎ | 822/995 [00:58<00:06, 26.09it/s] Loading 0: 83%|████████▎ | 825/995 [00:58<00:06, 26.26it/s] Loading 0: 83%|████████▎ | 828/995 [00:58<00:06, 26.30it/s] Loading 0: 84%|████████▎ | 831/995 [00:58<00:06, 26.42it/s] Loading 0: 84%|████████▍ | 840/995 [00:59<00:03, 42.28it/s] Loading 0: 85%|████████▍ | 842/995 [01:13<00:03, 42.28it/s] Loading 0: 85%|████████▍ | 843/995 [01:13<02:35, 1.02s/it] Loading 0: 85%|████████▌ | 848/995 [01:13<01:41, 1.44it/s] Loading 0: 86%|████████▌ | 853/995 [01:14<01:11, 2.00it/s] Loading 0: 86%|████████▌ | 857/995 [01:14<00:51, 2.67it/s] Loading 0: 87%|████████▋ | 861/995 [01:14<00:38, 3.51it/s] Loading 0: 87%|████████▋ | 864/995 [01:14<00:29, 4.37it/s] Loading 0: 87%|████████▋ | 867/995 [01:14<00:23, 5.49it/s] Loading 0: 88%|████████▊ | 872/995 [01:14<00:15, 8.12it/s] Loading 0: 88%|████████▊ | 876/995 [01:14<00:11, 10.37it/s] Loading 0: 88%|████████▊ | 880/995 [01:15<00:08, 12.90it/s] Loading 0: 89%|████████▉ | 884/995 [01:15<00:07, 14.54it/s] Loading 0: 89%|████████▉ | 887/995 [01:15<00:06, 16.33it/s] Loading 0: 89%|████████▉ | 890/995 [01:15<00:05, 17.61it/s] Loading 0: 90%|█████████ | 896/995 [01:15<00:03, 24.98it/s] Loading 0: 90%|█████████ | 900/995 [01:15<00:04, 20.95it/s] Loading 0: 91%|█████████ | 903/995 [01:16<00:04, 22.06it/s] Loading 0: 91%|█████████ | 906/995 [01:16<00:03, 22.64it/s] Loading 0: 91%|█████████▏| 909/995 [01:16<00:03, 22.91it/s] Loading 0: 92%|█████████▏| 912/995 [01:16<00:03, 23.17it/s] Loading 0: 92%|█████████▏| 915/995 [01:16<00:03, 24.17it/s] Loading 0: 92%|█████████▏| 918/995 [01:16<00:03, 24.99it/s] Loading 0: 93%|█████████▎| 921/995 [01:16<00:02, 24.85it/s] Loading 0: 93%|█████████▎| 924/995 [01:16<00:02, 25.21it/s] Loading 0: 94%|█████████▍| 933/995 [01:16<00:01, 41.23it/s] Loading 0: 94%|█████████▍| 938/995 [01:17<00:01, 32.92it/s] Loading 0: 95%|█████████▍| 942/995 [01:17<00:01, 32.24it/s] Loading 0: 95%|█████████▌| 946/995 [01:17<00:01, 27.72it/s] Loading 0: 96%|█████████▌| 952/995 [01:19<00:05, 8.54it/s] Loading 0: 96%|█████████▌| 955/995 [01:19<00:04, 9.95it/s] Loading 0: 96%|█████████▋| 958/995 [01:19<00:03, 11.61it/s] Loading 0: 97%|█████████▋| 961/995 [01:19<00:02, 13.39it/s] Loading 0: 97%|█████████▋| 966/995 [01:19<00:01, 18.06it/s] Loading 0: 97%|█████████▋| 970/995 [01:19<00:01, 20.55it/s] Loading 0: 98%|█████████▊| 974/995 [01:19<00:00, 22.86it/s] Loading 0: 98%|█████████▊| 978/995 [01:19<00:00, 22.15it/s] Loading 0: 99%|█████████▊| 981/995 [01:20<00:00, 23.05it/s] Loading 0: 99%|█████████▉| 984/995 [01:20<00:00, 23.38it/s] Loading 0: 99%|█████████▉| 987/995 [01:20<00:00, 24.03it/s]
Job mistralai-mixtral-8x7b-3473-v133-mkmlizer completed after 458.1s with status: succeeded
Stopping job with name mistralai-mixtral-8x7b-3473-v133-mkmlizer
Pipeline stage MKMLizer completed in 459.11s
run pipeline stage %s
Running pipeline stage MKMLTemplater
Pipeline stage MKMLTemplater completed in 0.08s
run pipeline stage %s
Running pipeline stage MKMLDeployer
Creating inference service mistralai-mixtral-8x7b-3473-v133
Waiting for inference service mistralai-mixtral-8x7b-3473-v133 to be ready
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Inference service mistralai-mixtral-8x7b-3473-v133 ready after 150.87287211418152s
Pipeline stage MKMLDeployer completed in 151.26s
run pipeline stage %s
Running pipeline stage StressChecker
Received healthy response to inference request in 3.064758777618408s
Received healthy response to inference request in 1.5640225410461426s
Received healthy response to inference request in 1.9802556037902832s
Received healthy response to inference request in 2.0549333095550537s
Received healthy response to inference request in 1.9201595783233643s
5 requests
0 failed requests
5th percentile: 1.635249948501587
10th percentile: 1.7064773559570312
20th percentile: 1.8489321708679198
30th percentile: 1.932178783416748
40th percentile: 1.9562171936035155
50th percentile: 1.9802556037902832
60th percentile: 2.0101266860961915
70th percentile: 2.0399977684021
80th percentile: 2.2568984031677246
90th percentile: 2.6608285903930664
95th percentile: 2.8627936840057373
99th percentile: 3.024365758895874
mean time: 2.1168259620666503
Pipeline stage StressChecker completed in 11.67s
run pipeline stage %s
Running pipeline stage TriggerMKMLProfilingPipeline
run_pipeline:run_in_cloud %s
starting trigger_guanaco_pipeline args=%s
Pipeline stage TriggerMKMLProfilingPipeline completed in 4.06s
Shutdown handler de-registered
mistralai-mixtral-8x7b_3473_v133 status is now deployed due to DeploymentManager action
Shutdown handler registered
run pipeline %s
run pipeline stage %s
Running pipeline stage MKMLProfilerDeleter
Skipping teardown as no inference service was successfully deployed
Pipeline stage MKMLProfilerDeleter completed in 0.14s
run pipeline stage %s
Running pipeline stage MKMLProfilerTemplater
Pipeline stage MKMLProfilerTemplater completed in 0.13s
run pipeline stage %s
Running pipeline stage MKMLProfilerDeployer
Creating inference service mistralai-mixtral-8x7b-3473-v133-profiler
Waiting for inference service mistralai-mixtral-8x7b-3473-v133-profiler to be ready
Inference service mistralai-mixtral-8x7b-3473-v133-profiler ready after 150.34845232963562s
Pipeline stage MKMLProfilerDeployer completed in 150.72s
run pipeline stage %s
Running pipeline stage MKMLProfilerRunner
kubectl cp /code/guanaco/guanaco_inference_services/src/inference_scripts tenant-chaiml-guanaco/mistralai-mixtral-8x1182627c103eea660fa2ef97ad572dac-deplopw8jj:/code/chaiverse_profiler_1725486129 --namespace tenant-chaiml-guanaco
kubectl exec -it mistralai-mixtral-8x1182627c103eea660fa2ef97ad572dac-deplopw8jj --namespace tenant-chaiml-guanaco -- sh -c 'cd /code/chaiverse_profiler_1725486129 && python profiles.py profile --best_of_n 4 --auto_batch 5 --batches 1,5,10,15,20,25,30,35,40,45,50,55,60,65,70,75,80,85,90,95,100,105,110,115,120,125,130,135,140,145,150,155,160,165,170,175,180,185,190,195 --samples 200 --input_tokens 512 --output_tokens 64 --summary /code/chaiverse_profiler_1725486129/summary.json'
kubectl exec -it mistralai-mixtral-8x1182627c103eea660fa2ef97ad572dac-deplopw8jj --namespace tenant-chaiml-guanaco -- bash -c 'cat /code/chaiverse_profiler_1725486129/summary.json'
Pipeline stage MKMLProfilerRunner completed in 774.52s
run pipeline stage %s
Running pipeline stage MKMLProfilerDeleter
Checking if service mistralai-mixtral-8x7b-3473-v133-profiler is running
Tearing down inference service mistralai-mixtral-8x7b-3473-v133-profiler
Service mistralai-mixtral-8x7b-3473-v133-profiler has been torndown
Pipeline stage MKMLProfilerDeleter completed in 1.83s
Shutdown handler de-registered
mistralai-mixtral-8x7b_3473_v133 status is now inactive due to auto deactivation removed underperforming models

Usage Metrics

Latency Metrics