submission_id: mistralai-mixtral-8x7b_3473_v138
developer_uid: robert_irvine
alignment_samples: 9961
alignment_score: 0.0287184057423505
best_of: 4
celo_rating: 1198.67
display_name: mistralai-mixtral-8x7b_3473_v138
formatter: {'memory_template': '<s>[INST] This is an entertaining conversation. You are {bot_name} who has the persona: {memory}.\nEngage in a chat with {user_name} while staying in character. Try to flirt with {user_name}. Engage in *roleplay* actions. Describe the scene dramatically. \n', 'prompt_template': '{prompt}\n', 'bot_template': '{bot_name}: {message}</s>', 'user_template': '[INST] {user_name}: {message} [/INST]', 'response_template': '{bot_name}:', 'truncate_by_message': False}
generation_params: {'temperature': 0.9, 'top_p': 1.0, 'min_p': 0.0, 'top_k': 50, 'presence_penalty': 0.5, 'frequency_penalty': 0.5, 'stopping_words': ['\n', '</s>', '<|user|>', '###'], 'max_input_tokens': 512, 'best_of': 4, 'max_output_tokens': 64}
gpu_counts: {'NVIDIA A100-SXM4-80GB': 1}
is_internal_developer: True
language_model: mistralai/Mixtral-8x7B-Instruct-v0.1
latencies: [{'batch_size': 1, 'throughput': 0.4653118141847497, 'latency_mean': 2.1490279030799866, 'latency_p50': 2.1950384378433228, 'latency_p90': 2.3988908529281616}, {'batch_size': 5, 'throughput': 1.408517952731804, 'latency_mean': 3.5236748385429384, 'latency_p50': 3.510183095932007, 'latency_p90': 3.9504790544509887}, {'batch_size': 10, 'throughput': 2.411350285048922, 'latency_mean': 4.111768436431885, 'latency_p50': 4.112135410308838, 'latency_p90': 4.635820055007935}, {'batch_size': 15, 'throughput': 3.131733270510071, 'latency_mean': 4.684914736747742, 'latency_p50': 4.708239197731018, 'latency_p90': 5.313648676872253}, {'batch_size': 20, 'throughput': 3.6706792550345924, 'latency_mean': 5.276691547632217, 'latency_p50': 5.232999801635742, 'latency_p90': 6.03054268360138}]
max_input_tokens: 512
max_output_tokens: 64
model_architecture: MixtralForCausalLM
model_group: mistralai/Mixtral-8x7B-I
model_name: mistralai-mixtral-8x7b_3473_v138
model_num_parameters: 46702792704.0
model_repo: mistralai/Mixtral-8x7B-Instruct-v0.1
model_size: 47B
num_battles: 9960
num_wins: 4344
propriety_score: 0.7055555555555556
propriety_total_count: 900.0
ranking_group: single
status: inactive
submission_type: basic
throughput_3p7s: 1.76
timestamp: 2024-09-13T06:14:27+00:00
us_pacific_date: 2024-09-12
win_ratio: 0.43614457831325304
Download Preference Data
Resubmit model
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline %s
run pipeline stage %s
Running pipeline stage MKMLizer
Starting job with name mistralai-mixtral-8x7b-3473-v138-mkmlizer
Waiting for job on mistralai-mixtral-8x7b-3473-v138-mkmlizer to finish
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ╔═════════════════════════════════════════════════════════════════════╗
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ _____ __ __ ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ / _/ /_ ___ __/ / ___ ___ / / ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ / _/ / // / |/|/ / _ \/ -_) -_) / ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ /_//_/\_, /|__,__/_//_/\__/\__/_/ ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ /___/ ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ Version: 0.10.1 ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ Copyright 2023 MK ONE TECHNOLOGIES Inc. ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ https://mk1.ai ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ The license key for the current software has been verified as ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ belonging to: ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ Chai Research Corp. ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ Account ID: 7997a29f-0ceb-4cc7-9adf-840c57b4ae6f ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ Expiration: 2024-10-15 23:59:59 ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ║ ║
mistralai-mixtral-8x7b-3473-v138-mkmlizer: ╚═════════════════════════════════════════════════════════════════════╝
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
mistralai-mixtral-8x7b-3473-v138-mkmlizer: Downloaded to shared memory in 186.345s
mistralai-mixtral-8x7b-3473-v138-mkmlizer: quantizing model to /dev/shm/model_cache, profile:s0, folder:/tmp/tmp8r2hzf63, device:0
mistralai-mixtral-8x7b-3473-v138-mkmlizer: Saving flywheel model at /dev/shm/model_cache
mistralai-mixtral-8x7b-3473-v138-mkmlizer: quantized model in 90.440s
mistralai-mixtral-8x7b-3473-v138-mkmlizer: Processed model mistralai/Mixtral-8x7B-Instruct-v0.1 in 276.785s
mistralai-mixtral-8x7b-3473-v138-mkmlizer: creating bucket guanaco-mkml-models
mistralai-mixtral-8x7b-3473-v138-mkmlizer: cp /dev/shm/model_cache/config.json s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v138/config.json
mistralai-mixtral-8x7b-3473-v138-mkmlizer: cp /dev/shm/model_cache/special_tokens_map.json s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v138/special_tokens_map.json
mistralai-mixtral-8x7b-3473-v138-mkmlizer: cp /dev/shm/model_cache/tokenizer_config.json s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v138/tokenizer_config.json
mistralai-mixtral-8x7b-3473-v138-mkmlizer: cp /dev/shm/model_cache/tokenizer.model s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v138/tokenizer.model
mistralai-mixtral-8x7b-3473-v138-mkmlizer: cp /dev/shm/model_cache/tokenizer.json s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v138/tokenizer.json
mistralai-mixtral-8x7b-3473-v138-mkmlizer: cp /dev/shm/model_cache/flywheel_model.3.safetensors s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v138/flywheel_model.3.safetensors
mistralai-mixtral-8x7b-3473-v138-mkmlizer: cp /dev/shm/model_cache/flywheel_model.0.safetensors s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v138/flywheel_model.0.safetensors
mistralai-mixtral-8x7b-3473-v138-mkmlizer: cp /dev/shm/model_cache/flywheel_model.2.safetensors s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v138/flywheel_model.2.safetensors
mistralai-mixtral-8x7b-3473-v138-mkmlizer: cp /dev/shm/model_cache/flywheel_model.1.safetensors s3://guanaco-mkml-models/mistralai-mixtral-8x7b-3473-v138/flywheel_model.1.safetensors
mistralai-mixtral-8x7b-3473-v138-mkmlizer: Loading 0: 0%| | 0/995 [00:00<?, ?it/s] Loading 0: 0%| | 4/995 [00:00<00:28, 35.35it/s] Loading 0: 1%| | 8/995 [00:00<00:32, 30.17it/s] Loading 0: 1%| | 12/995 [00:00<00:33, 29.16it/s] Loading 0: 2%|▏ | 15/995 [00:00<00:35, 27.38it/s] Loading 0: 2%|▏ | 18/995 [00:00<00:37, 26.38it/s] Loading 0: 2%|▏ | 21/995 [00:00<00:36, 26.48it/s] Loading 0: 2%|▏ | 24/995 [00:00<00:36, 26.63it/s] Loading 0: 3%|▎ | 32/995 [00:01<00:26, 36.16it/s] Loading 0: 4%|▎ | 36/995 [00:01<00:28, 34.03it/s] Loading 0: 4%|▍ | 40/995 [00:01<00:29, 32.92it/s] Loading 0: 4%|▍ | 44/995 [00:01<00:35, 27.13it/s] Loading 0: 5%|▌ | 51/995 [00:01<00:27, 34.92it/s] Loading 0: 6%|▌ | 55/995 [00:01<00:41, 22.61it/s] Loading 0: 6%|▌ | 58/995 [00:02<00:40, 23.26it/s] Loading 0: 6%|▌ | 61/995 [00:02<00:38, 24.00it/s] Loading 0: 7%|▋ | 66/995 [00:02<00:32, 28.25it/s] Loading 0: 7%|▋ | 70/995 [00:02<00:33, 28.02it/s] Loading 0: 7%|▋ | 74/995 [00:02<00:32, 28.38it/s] Loading 0: 8%|▊ | 78/995 [00:02<00:36, 25.02it/s] Loading 0: 8%|▊ | 81/995 [00:02<00:36, 25.07it/s] Loading 0: 8%|▊ | 84/995 [00:03<00:35, 25.61it/s] Loading 0: 9%|▊ | 87/995 [00:03<00:35, 25.80it/s] Loading 0: 10%|▉ | 96/995 [00:03<00:21, 41.06it/s] Loading 0: 10%|█ | 101/995 [00:03<00:26, 33.96it/s] Loading 0: 11%|█ | 107/995 [00:03<00:29, 30.38it/s] Loading 0: 11%|█ | 111/995 [00:03<00:32, 26.89it/s] Loading 0: 11%|█▏ | 114/995 [00:04<00:33, 26.37it/s] Loading 0: 12%|█▏ | 117/995 [00:04<00:34, 25.61it/s] Loading 0: 12%|█▏ | 120/995 [00:04<00:34, 25.18it/s] Loading 0: 12%|█▏ | 123/995 [00:04<00:34, 25.53it/s] Loading 0: 13%|█▎ | 128/995 [00:04<00:28, 30.26it/s] Loading 0: 13%|█▎ | 132/995 [00:04<00:29, 29.69it/s] Loading 0: 14%|█▎ | 136/995 [00:04<00:28, 29.99it/s] Loading 0: 14%|█▍ | 140/995 [00:04<00:33, 25.76it/s] Loading 0: 14%|█▍ | 143/995 [00:05<00:32, 26.24it/s] Loading 0: 15%|█▍ | 146/995 [00:05<00:31, 26.62it/s] Loading 0: 15%|█▍ | 149/995 [00:05<00:31, 27.02it/s] Loading 0: 16%|█▌ | 161/995 [00:05<00:18, 46.26it/s] Loading 0: 17%|█▋ | 166/995 [00:05<00:27, 29.93it/s] Loading 0: 17%|█▋ | 170/995 [00:05<00:30, 27.11it/s] Loading 0: 17%|█▋ | 174/995 [00:06<00:29, 27.64it/s] Loading 0: 18%|█▊ | 178/995 [00:06<00:28, 28.45it/s] Loading 0: 18%|█▊ | 182/995 [00:06<00:31, 26.00it/s] Loading 0: 19%|█▊ | 185/995 [00:06<00:31, 26.09it/s] Loading 0: 19%|█▉ | 190/995 [00:06<00:26, 30.44it/s] Loading 0: 19%|█▉ | 194/995 [00:06<00:26, 29.74it/s] Loading 0: 20%|█▉ | 198/995 [00:06<00:26, 29.83it/s] Loading 0: 20%|██ | 202/995 [00:07<00:30, 25.95it/s] Loading 0: 21%|██ | 209/995 [00:07<00:22, 34.19it/s] Loading 0: 21%|██▏ | 213/995 [00:07<00:34, 22.49it/s] Loading 0: 22%|██▏ | 216/995 [00:07<00:33, 23.15it/s] Loading 0: 22%|██▏ | 221/995 [00:07<00:28, 27.25it/s] Loading 0: 23%|██▎ | 225/995 [00:08<00:28, 26.80it/s] Loading 0: 23%|██▎ | 229/995 [00:08<00:28, 27.18it/s] Loading 0: 23%|██▎ | 232/995 [00:08<00:29, 26.03it/s] Loading 0: 24%|██▎ | 235/995 [00:08<00:29, 25.79it/s] Loading 0: 24%|██▍ | 238/995 [00:08<00:29, 25.55it/s] Loading 0: 24%|██▍ | 241/995 [00:08<00:29, 25.56it/s] Loading 0: 25%|██▍ | 247/995 [00:08<00:21, 34.02it/s] Loading 0: 25%|██▌ | 251/995 [00:08<00:21, 34.37it/s] Loading 0: 26%|██▌ | 255/995 [00:09<00:25, 28.69it/s] Loading 0: 26%|██▌ | 259/995 [00:09<00:25, 28.74it/s] Loading 0: 27%|██▋ | 265/995 [00:09<00:27, 26.25it/s] Loading 0: 27%|██▋ | 268/995 [00:09<00:27, 26.76it/s] Loading 0: 27%|██▋ | 273/995 [00:09<00:23, 31.31it/s] Loading 0: 28%|██▊ | 277/995 [00:09<00:26, 26.85it/s] Loading 0: 28%|██▊ | 280/995 [00:09<00:26, 26.91it/s] Loading 0: 28%|██▊ | 282/995 [00:20<00:26, 26.91it/s] Loading 0: 28%|██▊ | 283/995 [00:24<14:31, 1.22s/it] Loading 0: 29%|██▊ | 285/995 [00:24<11:51, 1.00s/it] Loading 0: 29%|██▉ | 288/995 [00:24<08:31, 1.38it/s] Loading 0: 29%|██▉ | 291/995 [00:24<06:10, 1.90it/s] Loading 0: 30%|██▉ | 294/995 [00:24<04:28, 2.61it/s] Loading 0: 30%|██▉ | 297/995 [00:25<03:16, 3.55it/s] Loading 0: 30%|███ | 300/995 [00:25<02:25, 4.78it/s] Loading 0: 30%|███ | 303/995 [00:25<01:50, 6.29it/s] Loading 0: 31%|███ | 306/995 [00:25<01:24, 8.14it/s] Loading 0: 31%|███ | 309/995 [00:25<01:07, 10.13it/s] Loading 0: 31%|███▏ | 312/995 [00:25<00:55, 12.24it/s] Loading 0: 32%|███▏ | 320/995 [00:25<00:37, 18.09it/s] Loading 0: 32%|███▏ | 323/995 [00:26<00:34, 19.20it/s] Loading 0: 33%|███▎ | 326/995 [00:26<00:33, 20.27it/s] Loading 0: 33%|███▎ | 329/995 [00:26<00:31, 20.97it/s] Loading 0: 33%|███▎ | 332/995 [00:26<00:29, 22.14it/s] Loading 0: 34%|███▎ | 335/995 [00:26<00:28, 23.42it/s] Loading 0: 34%|███▍ | 338/995 [00:26<00:26, 24.34it/s] Loading 0: 34%|███▍ | 343/995 [00:26<00:21, 29.77it/s] Loading 0: 35%|███▍ | 347/995 [00:26<00:22, 29.42it/s] Loading 0: 35%|███▌ | 351/995 [00:27<00:24, 26.01it/s] Loading 0: 36%|███▌ | 354/995 [00:27<00:24, 25.65it/s] Loading 0: 36%|███▌ | 357/995 [00:27<00:24, 25.57it/s] Loading 0: 36%|███▌ | 360/995 [00:27<00:24, 25.64it/s] Loading 0: 37%|███▋ | 367/995 [00:27<00:17, 35.12it/s] Loading 0: 37%|███▋ | 371/995 [00:27<00:28, 21.77it/s] Loading 0: 38%|███▊ | 376/995 [00:28<00:23, 25.95it/s] Loading 0: 38%|███▊ | 380/995 [00:28<00:22, 26.91it/s] Loading 0: 39%|███▊ | 384/995 [00:28<00:21, 27.90it/s] Loading 0: 39%|███▉ | 388/995 [00:28<00:23, 25.37it/s] Loading 0: 39%|███▉ | 391/995 [00:28<00:23, 25.54it/s] Loading 0: 40%|███▉ | 394/995 [00:28<00:24, 24.93it/s] Loading 0: 40%|███▉ | 397/995 [00:28<00:23, 25.11it/s] Loading 0: 41%|████ | 406/995 [00:28<00:14, 40.08it/s] Loading 0: 41%|████▏ | 411/995 [00:29<00:18, 32.38it/s] Loading 0: 42%|████▏ | 415/995 [00:29<00:18, 31.95it/s] Loading 0: 42%|████▏ | 419/995 [00:29<00:17, 33.72it/s] Loading 0: 43%|████▎ | 423/995 [00:29<00:23, 24.32it/s] Loading 0: 43%|████▎ | 426/995 [00:29<00:23, 24.27it/s] Loading 0: 43%|████▎ | 429/995 [00:29<00:23, 24.56it/s] Loading 0: 43%|████▎ | 432/995 [00:30<00:22, 25.02it/s] Loading 0: 44%|████▍ | 437/995 [00:30<00:18, 30.11it/s] Loading 0: 44%|████▍ | 441/995 [00:30<00:21, 25.82it/s] Loading 0: 45%|████▍ | 444/995 [00:30<00:21, 25.72it/s] Loading 0: 45%|████▍ | 447/995 [00:30<00:21, 25.72it/s] Loading 0: 45%|████▌ | 450/995 [00:30<00:21, 25.95it/s] Loading 0: 46%|████▌ | 453/995 [00:30<00:21, 25.68it/s] Loading 0: 46%|████▌ | 456/995 [00:30<00:21, 25.22it/s] Loading 0: 46%|████▌ | 459/995 [00:31<00:20, 25.54it/s] Loading 0: 47%|████▋ | 468/995 [00:31<00:12, 41.22it/s] Loading 0: 48%|████▊ | 473/995 [00:31<00:15, 34.50it/s] Loading 0: 48%|████▊ | 478/995 [00:31<00:18, 27.33it/s] Loading 0: 48%|████▊ | 482/995 [00:31<00:18, 28.04it/s] Loading 0: 49%|████▉ | 486/995 [00:32<00:20, 25.11it/s] Loading 0: 49%|████▉ | 489/995 [00:32<00:20, 24.79it/s] Loading 0: 49%|████▉ | 492/995 [00:32<00:20, 24.80it/s] Loading 0: 50%|████▉ | 495/995 [00:32<00:19, 25.28it/s] Loading 0: 50%|█████ | 500/995 [00:32<00:16, 30.45it/s] Loading 0: 51%|█████ | 504/995 [00:32<00:16, 29.84it/s] Loading 0: 51%|█████ | 508/995 [00:32<00:16, 29.71it/s] Loading 0: 51%|█████▏ | 512/995 [00:32<00:18, 26.67it/s] Loading 0: 52%|█████▏ | 515/995 [00:33<00:17, 26.79it/s] Loading 0: 52%|█████▏ | 518/995 [00:33<00:17, 26.57it/s] Loading 0: 53%|█████▎ | 525/995 [00:33<00:13, 35.20it/s] Loading 0: 53%|█████▎ | 529/995 [00:33<00:18, 25.50it/s] Loading 0: 53%|█████▎ | 532/995 [00:33<00:18, 25.11it/s] Loading 0: 54%|█████▍ | 535/995 [00:33<00:18, 24.49it/s] Loading 0: 54%|█████▍ | 538/995 [00:33<00:18, 24.58it/s] Loading 0: 54%|█████▍ | 541/995 [00:34<00:18, 24.41it/s] Loading 0: 55%|█████▍ | 544/995 [00:34<00:18, 24.30it/s] Loading 0: 55%|█████▍ | 547/995 [00:34<00:17, 24.92it/s] Loading 0: 55%|█████▌ | 550/995 [00:34<00:17, 25.26it/s] Loading 0: 56%|█████▌ | 553/995 [00:34<00:16, 26.22it/s] Loading 0: 56%|█████▋ | 560/995 [00:34<00:11, 37.85it/s] Loading 0: 56%|█████▋ | 561/995 [00:49<00:11, 37.85it/s] Loading 0: 56%|█████▋ | 562/995 [00:49<08:59, 1.25s/it] Loading 0: 57%|█████▋ | 564/995 [00:49<07:18, 1.02s/it] Loading 0: 57%|█████▋ | 568/995 [00:49<04:51, 1.46it/s] Loading 0: 57%|█████▋ | 571/995 [00:49<03:34, 1.98it/s] Loading 0: 58%|█████▊ | 574/995 [00:49<02:37, 2.68it/s] Loading 0: 58%|█████▊ | 581/995 [00:50<01:27, 4.74it/s] Loading 0: 59%|█████▊ | 584/995 [00:50<01:10, 5.83it/s] Loading 0: 59%|█████▉ | 587/995 [00:50<00:56, 7.17it/s] Loading 0: 59%|█████▉ | 591/995 [00:50<00:42, 9.61it/s] Loading 0: 60%|█████▉ | 594/995 [00:50<00:35, 11.37it/s] Loading 0: 60%|██████ | 597/995 [00:50<00:29, 13.43it/s] Loading 0: 60%|██████ | 600/995 [00:50<00:25, 15.51it/s] Loading 0: 61%|██████ | 603/995 [00:50<00:22, 17.27it/s] Loading 0: 61%|██████ | 606/995 [00:51<00:20, 18.87it/s] Loading 0: 61%|██████ | 609/995 [00:51<00:18, 20.43it/s] Loading 0: 62%|██████▏ | 612/995 [00:51<00:17, 21.85it/s] Loading 0: 62%|██████▏ | 619/995 [00:51<00:11, 32.97it/s] Loading 0: 63%|██████▎ | 624/995 [00:51<00:11, 31.19it/s] Loading 0: 63%|██████▎ | 628/995 [00:51<00:12, 30.24it/s] Loading 0: 64%|██████▎ | 633/995 [00:51<00:10, 34.76it/s] Loading 0: 64%|██████▍ | 637/995 [00:52<00:14, 25.05it/s] Loading 0: 64%|██████▍ | 641/995 [00:52<00:15, 23.35it/s] Loading 0: 65%|██████▍ | 644/995 [00:52<00:14, 23.86it/s] Loading 0: 65%|██████▌ | 647/995 [00:52<00:14, 23.74it/s] Loading 0: 65%|██████▌ | 650/995 [00:52<00:14, 23.72it/s] Loading 0: 66%|██████▌ | 655/995 [00:52<00:11, 28.55it/s] Loading 0: 66%|██████▌ | 659/995 [00:52<00:11, 28.90it/s] Loading 0: 67%|██████▋ | 663/995 [00:53<00:11, 28.66it/s] Loading 0: 67%|██████▋ | 666/995 [00:53<00:12, 27.35it/s] Loading 0: 67%|██████▋ | 669/995 [00:53<00:12, 25.98it/s] Loading 0: 68%|██████▊ | 672/995 [00:53<00:12, 25.34it/s] Loading 0: 68%|██████▊ | 675/995 [00:53<00:12, 25.41it/s] Loading 0: 69%|██████▊ | 683/995 [00:53<00:09, 34.40it/s] Loading 0: 69%|██████▉ | 690/995 [00:53<00:07, 42.29it/s] Loading 0: 70%|██████▉ | 695/995 [00:54<00:11, 26.19it/s] Loading 0: 70%|███████ | 699/995 [00:54<00:11, 26.76it/s] Loading 0: 71%|███████ | 703/995 [00:54<00:11, 25.12it/s] Loading 0: 71%|███████ | 706/995 [00:54<00:11, 25.33it/s] Loading 0: 71%|███████▏ | 709/995 [00:54<00:11, 25.46it/s] Loading 0: 72%|███████▏ | 712/995 [00:54<00:11, 25.47it/s] Loading 0: 72%|███████▏ | 717/995 [00:55<00:09, 30.52it/s] Loading 0: 72%|███████▏ | 721/995 [00:55<00:09, 30.01it/s] Loading 0: 73%|███████▎ | 725/995 [00:55<00:08, 30.44it/s] Loading 0: 73%|███████▎ | 729/995 [00:55<00:09, 27.31it/s] Loading 0: 74%|███████▎ | 732/995 [00:55<00:09, 27.47it/s] Loading 0: 74%|███████▍ | 739/995 [00:55<00:09, 26.95it/s] Loading 0: 75%|███████▍ | 742/995 [00:55<00:09, 26.63it/s] Loading 0: 75%|███████▍ | 746/995 [00:56<00:08, 29.46it/s] Loading 0: 75%|███████▌ | 750/995 [00:56<00:08, 28.53it/s] Loading 0: 76%|███████▌ | 753/995 [00:56<00:08, 27.60it/s] Loading 0: 76%|███████▌ | 756/995 [00:56<00:08, 26.58it/s] Loading 0: 76%|███████▋ | 759/995 [00:56<00:08, 26.31it/s] Loading 0: 77%|███████▋ | 762/995 [00:56<00:08, 26.08it/s] Loading 0: 77%|███████▋ | 765/995 [00:56<00:08, 26.01it/s] Loading 0: 77%|███████▋ | 768/995 [00:56<00:08, 25.58it/s] Loading 0: 78%|███████▊ | 776/995 [00:57<00:06, 35.57it/s] Loading 0: 78%|███████▊ | 780/995 [00:57<00:06, 34.12it/s] Loading 0: 79%|███████▉ | 784/995 [00:57<00:06, 33.19it/s] Loading 0: 79%|███████▉ | 788/995 [00:57<00:07, 28.31it/s] Loading 0: 80%|███████▉ | 794/995 [00:57<00:07, 26.69it/s] Loading 0: 80%|████████ | 797/995 [00:57<00:07, 25.48it/s] Loading 0: 80%|████████ | 800/995 [00:58<00:07, 25.42it/s] Loading 0: 81%|████████ | 803/995 [00:58<00:07, 25.74it/s] Loading 0: 81%|████████ | 806/995 [00:58<00:07, 26.49it/s] Loading 0: 81%|████████▏ | 810/995 [00:58<00:06, 28.12it/s] Loading 0: 82%|████████▏ | 813/995 [00:58<00:06, 27.80it/s] Loading 0: 82%|████████▏ | 816/995 [00:58<00:06, 27.65it/s] Loading 0: 82%|████████▏ | 819/995 [00:58<00:06, 26.66it/s] Loading 0: 83%|████████▎ | 822/995 [00:58<00:06, 26.49it/s] Loading 0: 83%|████████▎ | 825/995 [00:58<00:06, 26.59it/s] Loading 0: 83%|████████▎ | 828/995 [00:59<00:06, 26.01it/s] Loading 0: 84%|████████▎ | 831/995 [00:59<00:06, 25.12it/s] Loading 0: 84%|████████▍ | 840/995 [00:59<00:03, 41.16it/s] Loading 0: 85%|████████▍ | 842/995 [01:13<00:03, 41.16it/s] Loading 0: 85%|████████▍ | 843/995 [01:13<02:38, 1.04s/it] Loading 0: 85%|████████▌ | 848/995 [01:14<01:43, 1.42it/s] Loading 0: 86%|████████▌ | 853/995 [01:14<01:11, 1.98it/s] Loading 0: 86%|████████▌ | 857/995 [01:14<00:52, 2.65it/s] Loading 0: 87%|████████▋ | 861/995 [01:14<00:38, 3.50it/s] Loading 0: 87%|████████▋ | 864/995 [01:14<00:29, 4.37it/s] Loading 0: 87%|████████▋ | 867/995 [01:15<00:23, 5.48it/s] Loading 0: 88%|████████▊ | 872/995 [01:15<00:15, 8.11it/s] Loading 0: 88%|████████▊ | 876/995 [01:15<00:11, 10.28it/s] Loading 0: 88%|████████▊ | 880/995 [01:15<00:09, 12.75it/s] Loading 0: 89%|████████▉ | 884/995 [01:15<00:07, 14.32it/s] Loading 0: 89%|████████▉ | 887/995 [01:15<00:06, 16.07it/s] Loading 0: 89%|████████▉ | 890/995 [01:15<00:05, 17.56it/s] Loading 0: 90%|█████████ | 896/995 [01:15<00:03, 24.97it/s] Loading 0: 90%|█████████ | 900/995 [01:16<00:04, 20.51it/s] Loading 0: 91%|█████████ | 903/995 [01:16<00:04, 21.01it/s] Loading 0: 91%|█████████ | 906/995 [01:16<00:04, 22.05it/s] Loading 0: 91%|█████████▏| 909/995 [01:16<00:03, 23.00it/s] Loading 0: 92%|█████████▏| 912/995 [01:16<00:03, 24.01it/s] Loading 0: 92%|█████████▏| 915/995 [01:16<00:03, 24.24it/s] Loading 0: 92%|█████████▏| 918/995 [01:16<00:03, 24.75it/s] Loading 0: 93%|█████████▎| 921/995 [01:17<00:02, 25.32it/s] Loading 0: 93%|█████████▎| 924/995 [01:17<00:02, 25.87it/s] Loading 0: 94%|█████████▍| 933/995 [01:17<00:01, 42.16it/s] Loading 0: 94%|█████████▍| 938/995 [01:17<00:01, 32.38it/s] Loading 0: 95%|█████████▍| 942/995 [01:17<00:01, 31.34it/s] Loading 0: 95%|█████████▌| 946/995 [01:17<00:01, 28.00it/s] Loading 0: 96%|█████████▌| 952/995 [01:19<00:05, 8.58it/s] Loading 0: 96%|█████████▌| 955/995 [01:19<00:04, 9.97it/s] Loading 0: 96%|█████████▋| 958/995 [01:19<00:03, 11.60it/s] Loading 0: 97%|█████████▋| 961/995 [01:19<00:02, 13.42it/s] Loading 0: 97%|█████████▋| 966/995 [01:19<00:01, 18.16it/s] Loading 0: 97%|█████████▋| 970/995 [01:19<00:01, 20.66it/s] Loading 0: 98%|█████████▊| 974/995 [01:20<00:00, 22.87it/s] Loading 0: 98%|█████████▊| 978/995 [01:20<00:00, 22.44it/s] Loading 0: 99%|█████████▊| 981/995 [01:20<00:00, 23.48it/s] Loading 0: 99%|█████████▉| 984/995 [01:20<00:00, 23.79it/s] Loading 0: 99%|█████████▉| 987/995 [01:20<00:00, 24.52it/s]
Job mistralai-mixtral-8x7b-3473-v138-mkmlizer completed after 314.72s with status: succeeded
Stopping job with name mistralai-mixtral-8x7b-3473-v138-mkmlizer
Pipeline stage MKMLizer completed in 316.13s
run pipeline stage %s
Running pipeline stage MKMLTemplater
Pipeline stage MKMLTemplater completed in 0.10s
run pipeline stage %s
Running pipeline stage MKMLDeployer
Creating inference service mistralai-mixtral-8x7b-3473-v138
Waiting for inference service mistralai-mixtral-8x7b-3473-v138 to be ready
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Failed to get response for submission chaiml-elo-alignment-run-3_v41: ('http://chaiml-elo-alignment-run-3-v41-predictor.tenant-chaiml-guanaco.k.chaiverse.com/v1/models/GPT-J-6B-lit-v2:predict', 'activator request timeout')
Failed to get response for submission chaiml-elo-alignment-run-3_v41: ('http://chaiml-elo-alignment-run-3-v41-predictor.tenant-chaiml-guanaco.k.chaiverse.com/v1/models/GPT-J-6B-lit-v2:predict', 'activator request timeout')
Inference service mistralai-mixtral-8x7b-3473-v138 ready after 181.49621057510376s
Pipeline stage MKMLDeployer completed in 182.46s
run pipeline stage %s
Running pipeline stage StressChecker
Received healthy response to inference request in 2.8176703453063965s
Received healthy response to inference request in 2.3565804958343506s
Received healthy response to inference request in 1.5183544158935547s
Received healthy response to inference request in 1.8702850341796875s
Failed to get response for submission chaiml-elo-alignment-run-3_v41: ('http://chaiml-elo-alignment-run-3-v41-predictor.tenant-chaiml-guanaco.k.chaiverse.com/v1/models/GPT-J-6B-lit-v2:predict', 'activator request timeout')
Received healthy response to inference request in 1.8487212657928467s
5 requests
0 failed requests
5th percentile: 1.584427785873413
10th percentile: 1.6505011558532714
20th percentile: 1.7826478958129883
30th percentile: 1.8530340194702148
40th percentile: 1.8616595268249512
50th percentile: 1.8702850341796875
60th percentile: 2.064803218841553
70th percentile: 2.2593214035034177
80th percentile: 2.44879846572876
90th percentile: 2.633234405517578
95th percentile: 2.725452375411987
99th percentile: 2.7992267513275144
mean time: 2.0823223114013674
Pipeline stage StressChecker completed in 11.32s
run pipeline stage %s
Running pipeline stage TriggerMKMLProfilingPipeline
run_pipeline:run_in_cloud %s
starting trigger_guanaco_pipeline args=%s
Pipeline stage TriggerMKMLProfilingPipeline completed in 4.52s
Shutdown handler de-registered
mistralai-mixtral-8x7b_3473_v138 status is now deployed due to DeploymentManager action
Shutdown handler registered
run pipeline %s
run pipeline stage %s
Running pipeline stage MKMLProfilerDeleter
Skipping teardown as no inference service was successfully deployed
Pipeline stage MKMLProfilerDeleter completed in 0.14s
run pipeline stage %s
Running pipeline stage MKMLProfilerTemplater
Pipeline stage MKMLProfilerTemplater completed in 0.13s
run pipeline stage %s
Running pipeline stage MKMLProfilerDeployer
Creating inference service mistralai-mixtral-8x7b-3473-v138-profiler
Waiting for inference service mistralai-mixtral-8x7b-3473-v138-profiler to be ready
Inference service mistralai-mixtral-8x7b-3473-v138-profiler ready after 180.4268069267273s
Pipeline stage MKMLProfilerDeployer completed in 180.83s
run pipeline stage %s
Running pipeline stage MKMLProfilerRunner
kubectl cp /code/guanaco/guanaco_inference_services/src/inference_scripts tenant-chaiml-guanaco/mistralai-mixtral-8x5caa983aee7106533d2fd313332a0693-deplo72td8:/code/chaiverse_profiler_1726208810 --namespace tenant-chaiml-guanaco
kubectl exec -it mistralai-mixtral-8x5caa983aee7106533d2fd313332a0693-deplo72td8 --namespace tenant-chaiml-guanaco -- sh -c 'cd /code/chaiverse_profiler_1726208810 && python profiles.py profile --best_of_n 4 --auto_batch 5 --batches 1,5,10,15,20,25,30,35,40,45,50,55,60,65,70,75,80,85,90,95,100,105,110,115,120,125,130,135,140,145,150,155,160,165,170,175,180,185,190,195 --samples 200 --input_tokens 512 --output_tokens 64 --summary /code/chaiverse_profiler_1726208810/summary.json'
kubectl exec -it mistralai-mixtral-8x5caa983aee7106533d2fd313332a0693-deplo72td8 --namespace tenant-chaiml-guanaco -- bash -c 'cat /code/chaiverse_profiler_1726208810/summary.json'
Pipeline stage MKMLProfilerRunner completed in 779.17s
run pipeline stage %s
Running pipeline stage MKMLProfilerDeleter
Checking if service mistralai-mixtral-8x7b-3473-v138-profiler is running
Tearing down inference service mistralai-mixtral-8x7b-3473-v138-profiler
Service mistralai-mixtral-8x7b-3473-v138-profiler has been torndown
Pipeline stage MKMLProfilerDeleter completed in 1.98s
Shutdown handler de-registered
mistralai-mixtral-8x7b_3473_v138 status is now inactive due to auto deactivation removed underperforming models