submission_id: nousresearch-hermes-2-pr_1418_v5
developer_uid: immaculate_possum_03470
best_of: 4
celo_rating: 1174.83
display_name: mistral
family_friendly_score: 0.6004672897196262
family_friendly_standard_error: 0.008633772907985272
formatter: {'memory_template': "{bot_name}'s Persona: {memory}\n####\n", 'prompt_template': '{prompt}\n<START>\n', 'bot_template': '{bot_name}: {message}\n', 'user_template': '{user_name}: {message}\n', 'response_template': '{bot_name}:', 'truncate_by_message': False}
generation_params: {'temperature': 0.99, 'top_p': 0.2, 'min_p': 0.0, 'top_k': 40, 'presence_penalty': 0.5, 'frequency_penalty': 0.5, 'stopping_words': ['\n'], 'max_input_tokens': 1024, 'best_of': 4, 'max_output_tokens': 64}
gpu_counts: {'NVIDIA RTX A5000': 1}
ineligible_reason: num_battles<5000
is_internal_developer: False
language_model: NousResearch/Hermes-2-Pro-Mistral-7B
latencies: [{'batch_size': 1, 'throughput': 0.9428787287768751, 'latency_mean': 1.0604888272285462, 'latency_p50': 1.0543179512023926, 'latency_p90': 1.1754693508148193}, {'batch_size': 5, 'throughput': 2.4573629292710746, 'latency_mean': 2.022642220258713, 'latency_p50': 2.020264148712158, 'latency_p90': 2.235901379585266}, {'batch_size': 10, 'throughput': 3.032567300102297, 'latency_mean': 3.2656181657314303, 'latency_p50': 3.264852523803711, 'latency_p90': 3.675941276550293}, {'batch_size': 15, 'throughput': 3.216176714705725, 'latency_mean': 4.618912569284439, 'latency_p50': 4.638434648513794, 'latency_p90': 5.3110260486602785}, {'batch_size': 20, 'throughput': 3.2256575275072157, 'latency_mean': 6.084995464086533, 'latency_p50': 6.099307417869568, 'latency_p90': 6.766555047035217}]
max_input_tokens: 1024
max_output_tokens: 64
model_architecture: MistralForCausalLM
model_group: NousResearch/Hermes-2-Pr
model_name: mistral
model_num_parameters: 7241994240.0
model_repo: NousResearch/Hermes-2-Pro-Mistral-7B
model_size: 7B
num_battles: 3321
num_wins: 1324
ranking_group: single
status: torndown
submission_type: basic
throughput_3p7s: 3.14
timestamp: 2024-09-26T17:14:16+00:00
us_pacific_date: 2024-09-26
win_ratio: 0.3986750978620897
Download Preference Data
Resubmit model
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline %s
run pipeline stage %s
Running pipeline stage MKMLizer
Starting job with name nousresearch-hermes-2-pr-1418-v5-mkmlizer
Waiting for job on nousresearch-hermes-2-pr-1418-v5-mkmlizer to finish
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ╔═════════════════════════════════════════════════════════════════════╗
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ _____ __ __ ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ / _/ /_ ___ __/ / ___ ___ / / ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ / _/ / // / |/|/ / _ \/ -_) -_) / ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ /_//_/\_, /|__,__/_//_/\__/\__/_/ ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ /___/ ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ Version: 0.11.12 ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ Copyright 2023 MK ONE TECHNOLOGIES Inc. ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ https://mk1.ai ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ The license key for the current software has been verified as ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ belonging to: ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ Chai Research Corp. ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ Account ID: 7997a29f-0ceb-4cc7-9adf-840c57b4ae6f ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ Expiration: 2024-10-15 23:59:59 ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ║ ║
nousresearch-hermes-2-pr-1418-v5-mkmlizer: ╚═════════════════════════════════════════════════════════════════════╝
nousresearch-hermes-2-pr-1418-v5-mkmlizer: Downloaded to shared memory in 20.405s
nousresearch-hermes-2-pr-1418-v5-mkmlizer: quantizing model to /dev/shm/model_cache, profile:s0, folder:/tmp/tmpeil4hvty, device:0
nousresearch-hermes-2-pr-1418-v5-mkmlizer: Saving flywheel model at /dev/shm/model_cache
nousresearch-hermes-2-pr-1418-v5-mkmlizer: quantized model in 17.060s
nousresearch-hermes-2-pr-1418-v5-mkmlizer: Processed model NousResearch/Hermes-2-Pro-Mistral-7B in 37.465s
nousresearch-hermes-2-pr-1418-v5-mkmlizer: creating bucket guanaco-mkml-models
nousresearch-hermes-2-pr-1418-v5-mkmlizer: Bucket 's3://guanaco-mkml-models/' created
nousresearch-hermes-2-pr-1418-v5-mkmlizer: uploading /dev/shm/model_cache to s3://guanaco-mkml-models/nousresearch-hermes-2-pr-1418-v5
nousresearch-hermes-2-pr-1418-v5-mkmlizer: cp /dev/shm/model_cache/config.json s3://guanaco-mkml-models/nousresearch-hermes-2-pr-1418-v5/config.json
nousresearch-hermes-2-pr-1418-v5-mkmlizer: cp /dev/shm/model_cache/added_tokens.json s3://guanaco-mkml-models/nousresearch-hermes-2-pr-1418-v5/added_tokens.json
nousresearch-hermes-2-pr-1418-v5-mkmlizer: cp /dev/shm/model_cache/special_tokens_map.json s3://guanaco-mkml-models/nousresearch-hermes-2-pr-1418-v5/special_tokens_map.json
nousresearch-hermes-2-pr-1418-v5-mkmlizer: cp /dev/shm/model_cache/tokenizer_config.json s3://guanaco-mkml-models/nousresearch-hermes-2-pr-1418-v5/tokenizer_config.json
nousresearch-hermes-2-pr-1418-v5-mkmlizer: cp /dev/shm/model_cache/tokenizer.model s3://guanaco-mkml-models/nousresearch-hermes-2-pr-1418-v5/tokenizer.model
nousresearch-hermes-2-pr-1418-v5-mkmlizer: cp /dev/shm/model_cache/tokenizer.json s3://guanaco-mkml-models/nousresearch-hermes-2-pr-1418-v5/tokenizer.json
nousresearch-hermes-2-pr-1418-v5-mkmlizer: cp /dev/shm/model_cache/flywheel_model.0.safetensors s3://guanaco-mkml-models/nousresearch-hermes-2-pr-1418-v5/flywheel_model.0.safetensors
nousresearch-hermes-2-pr-1418-v5-mkmlizer: Loading 0: 0%| | 0/291 [00:00<?, ?it/s] Loading 0: 2%|▏ | 5/291 [00:00<00:07, 40.32it/s] Loading 0: 5%|▍ | 14/291 [00:00<00:05, 50.41it/s] Loading 0: 8%|▊ | 23/291 [00:00<00:05, 52.90it/s] Loading 0: 11%|█ | 31/291 [00:00<00:04, 60.55it/s] Loading 0: 13%|█▎ | 38/291 [00:00<00:04, 59.18it/s] Loading 0: 15%|█▌ | 45/291 [00:00<00:04, 58.80it/s] Loading 0: 18%|█▊ | 51/291 [00:00<00:04, 51.79it/s] Loading 0: 20%|█▉ | 58/291 [00:01<00:04, 54.89it/s] Loading 0: 22%|██▏ | 64/291 [00:01<00:04, 49.75it/s] Loading 0: 24%|██▍ | 70/291 [00:01<00:04, 50.94it/s] Loading 0: 27%|██▋ | 78/291 [00:01<00:04, 52.48it/s] Loading 0: 29%|██▉ | 84/291 [00:01<00:05, 38.32it/s] Loading 0: 31%|███▏ | 91/291 [00:01<00:05, 38.76it/s] Loading 0: 34%|███▍ | 99/291 [00:02<00:04, 45.72it/s] Loading 0: 36%|███▌ | 105/291 [00:02<00:04, 42.60it/s] Loading 0: 38%|███▊ | 110/291 [00:02<00:04, 41.69it/s] Loading 0: 40%|███▉ | 115/291 [00:02<00:04, 43.46it/s] Loading 0: 41%|████ | 120/291 [00:02<00:03, 43.45it/s] Loading 0: 44%|████▎ | 127/291 [00:02<00:03, 44.05it/s] Loading 0: 46%|████▋ | 135/291 [00:02<00:02, 52.20it/s] Loading 0: 48%|████▊ | 141/291 [00:02<00:02, 51.73it/s] Loading 0: 51%|█████ | 148/291 [00:03<00:02, 56.18it/s] Loading 0: 53%|█████▎ | 154/291 [00:03<00:02, 49.13it/s] Loading 0: 55%|█████▍ | 160/291 [00:03<00:03, 42.21it/s] Loading 0: 57%|█████▋ | 165/291 [00:03<00:03, 41.97it/s] Loading 0: 58%|█████▊ | 170/291 [00:03<00:02, 42.28it/s] Loading 0: 60%|██████ | 176/291 [00:03<00:02, 41.30it/s] Loading 0: 63%|██████▎ | 184/291 [00:03<00:02, 49.87it/s] Loading 0: 65%|██████▌ | 190/291 [00:03<00:02, 47.56it/s] Loading 0: 67%|██████▋ | 195/291 [00:04<00:02, 45.27it/s] Loading 0: 70%|██████▉ | 203/291 [00:04<00:01, 46.73it/s] Loading 0: 73%|███████▎ | 211/291 [00:04<00:01, 54.45it/s] Loading 0: 75%|███████▍ | 217/291 [00:04<00:01, 50.61it/s] Loading 0: 77%|███████▋ | 223/291 [00:04<00:01, 50.16it/s] Loading 0: 79%|███████▊ | 229/291 [00:04<00:01, 52.03it/s] Loading 0: 81%|████████ | 235/291 [00:04<00:01, 49.41it/s] Loading 0: 83%|████████▎ | 241/291 [00:06<00:04, 11.25it/s] Loading 0: 84%|████████▍ | 245/291 [00:06<00:03, 13.31it/s] Loading 0: 86%|████████▌ | 249/291 [00:06<00:02, 15.72it/s] Loading 0: 88%|████████▊ | 257/291 [00:06<00:01, 23.26it/s] Loading 0: 90%|█████████ | 263/291 [00:06<00:01, 27.38it/s] Loading 0: 92%|█████████▏| 268/291 [00:06<00:00, 30.80it/s] Loading 0: 95%|█████████▍| 275/291 [00:07<00:00, 37.91it/s] Loading 0: 97%|█████████▋| 281/291 [00:07<00:00, 40.05it/s] Loading 0: 99%|█████████▊| 287/291 [00:07<00:00, 44.05it/s]
Job nousresearch-hermes-2-pr-1418-v5-mkmlizer completed after 62.22s with status: succeeded
Stopping job with name nousresearch-hermes-2-pr-1418-v5-mkmlizer
Pipeline stage MKMLizer completed in 62.48s
run pipeline stage %s
Running pipeline stage MKMLTemplater
Pipeline stage MKMLTemplater completed in 0.07s
run pipeline stage %s
Running pipeline stage MKMLDeployer
Creating inference service nousresearch-hermes-2-pr-1418-v5
Waiting for inference service nousresearch-hermes-2-pr-1418-v5 to be ready
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline %s
run pipeline stage %s
Running pipeline stage MKMLizer
Starting job with name zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer
Waiting for job on zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer to finish
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ╔═════════════════════════════════════════════════════════════════════╗
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ _____ __ __ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ / _/ /_ ___ __/ / ___ ___ / / ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ / _/ / // / |/|/ / _ \/ -_) -_) / ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ /_//_/\_, /|__,__/_//_/\__/\__/_/ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ /___/ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ Version: 0.11.12 ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ Copyright 2023 MK ONE TECHNOLOGIES Inc. ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ https://mk1.ai ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ The license key for the current software has been verified as ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ belonging to: ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ Chai Research Corp. ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ Account ID: 7997a29f-0ceb-4cc7-9adf-840c57b4ae6f ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ Expiration: 2024-10-15 23:59:59 ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ╚═════════════════════════════════════════════════════════════════════╝
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: Downloaded to shared memory in 52.968s
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: quantizing model to /dev/shm/model_cache, profile:s0, folder:/tmp/tmp22j23_g9, device:0
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: Saving flywheel model at /dev/shm/model_cache
Job zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer completed after 152.09s with status: failed
Stopping job with name zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer
%s, retrying in %s seconds...
Starting job with name zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer
Waiting for job on zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer to finish
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ╔═════════════════════════════════════════════════════════════════════╗
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ _____ __ __ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ / _/ /_ ___ __/ / ___ ___ / / ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ / _/ / // / |/|/ / _ \/ -_) -_) / ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ /_//_/\_, /|__,__/_//_/\__/\__/_/ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ /___/ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ Version: 0.11.12 ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ Copyright 2023 MK ONE TECHNOLOGIES Inc. ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ https://mk1.ai ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ The license key for the current software has been verified as ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ belonging to: ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ Chai Research Corp. ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ Account ID: 7997a29f-0ceb-4cc7-9adf-840c57b4ae6f ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ Expiration: 2024-10-15 23:59:59 ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ║ ║
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: ╚═════════════════════════════════════════════════════════════════════╝
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline %s
run pipeline stage %s
Running pipeline stage MKMLizer
Starting job with name zonemercy-vingt-deux-gfv-4513-v1-mkmlizer
Waiting for job on zonemercy-vingt-deux-gfv-4513-v1-mkmlizer to finish
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: Downloaded to shared memory in 47.965s
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: quantizing model to /dev/shm/model_cache, profile:s0, folder:/tmp/tmpdcubjc6b, device:0
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: Saving flywheel model at /dev/shm/model_cache
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ╔═════════════════════════════════════════════════════════════════════╗
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ _____ __ __ ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ / _/ /_ ___ __/ / ___ ___ / / ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ / _/ / // / |/|/ / _ \/ -_) -_) / ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ /_//_/\_, /|__,__/_//_/\__/\__/_/ ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ /___/ ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ Version: 0.11.12 ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ Copyright 2023 MK ONE TECHNOLOGIES Inc. ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ https://mk1.ai ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ The license key for the current software has been verified as ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ belonging to: ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ Chai Research Corp. ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ Account ID: 7997a29f-0ceb-4cc7-9adf-840c57b4ae6f ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ Expiration: 2024-10-15 23:59:59 ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ║ ║
zonemercy-vingt-deux-gfv-4513-v1-mkmlizer: ╚═════════════════════════════════════════════════════════════════════╝
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: Loading 0: 0%| | 0/507 [00:00<?, ?it/s] Loading 0: 1%| | 5/507 [00:00<00:17, 28.25it/s] Loading 0: 2%|▏ | 12/507 [00:00<00:11, 43.13it/s] Loading 0: 3%|▎ | 17/507 [00:00<00:12, 39.59it/s] Loading 0: 4%|▍ | 22/507 [00:00<00:12, 39.23it/s] Loading 0: 5%|▌ | 27/507 [00:00<00:11, 40.39it/s] Loading 0: 6%|▋ | 32/507 [00:00<00:14, 32.76it/s] Loading 0: 8%|▊ | 39/507 [00:01<00:11, 39.35it/s] Loading 0: 9%|▊ | 44/507 [00:01<00:11, 39.51it/s] Loading 0: 10%|▉ | 49/507 [00:01<00:13, 33.98it/s] Loading 0: 10%|█ | 53/507 [00:01<00:18, 23.91it/s] Loading 0: 11%|█ | 56/507 [00:01<00:19, 22.90it/s] Loading 0: 12%|█▏ | 63/507 [00:01<00:14, 30.22it/s] Loading 0: 13%|█▎ | 67/507 [00:02<00:14, 30.90it/s] Loading 0: 14%|█▍ | 72/507 [00:02<00:12, 34.90it/s] Loading 0: 15%|█▌ | 78/507 [00:02<00:10, 39.10it/s] Loading 0: 16%|█▋ | 83/507 [00:02<00:11, 36.58it/s] Loading 0: 17%|█▋ | 87/507 [00:02<00:11, 36.36it/s] Loading 0: 18%|█▊ | 91/507 [00:02<00:11, 35.49it/s] Loading 0: 19%|█▉ | 96/507 [00:02<00:11, 37.33it/s] Loading 0: 20%|█▉ | 100/507 [00:02<00:11, 34.52it/s] Loading 0: 21%|██ | 105/507 [00:03<00:10, 36.95it/s] Loading 0: 21%|██▏ | 109/507 [00:03<00:11, 35.93it/s] Loading 0: 22%|██▏ | 113/507 [00:03<00:16, 24.43it/s] Loading 0: 23%|██▎ | 116/507 [00:03<00:16, 23.25it/s] Loading 0: 24%|██▍ | 122/507 [00:03<00:14, 27.25it/s] Loading 0: 25%|██▌ | 129/507 [00:03<00:11, 34.00it/s] Loading 0: 26%|██▌ | 133/507 [00:04<00:11, 33.72it/s] Loading 0: 27%|██▋ | 138/507 [00:04<00:10, 36.28it/s] Loading 0: 28%|██▊ | 142/507 [00:04<00:10, 35.42it/s] Loading 0: 29%|██▉ | 147/507 [00:04<00:09, 38.09it/s] Loading 0: 30%|██▉ | 151/507 [00:04<00:09, 35.83it/s] Loading 0: 31%|███ | 156/507 [00:04<00:09, 38.44it/s] Loading 0: 32%|███▏ | 160/507 [00:04<00:09, 36.87it/s] Loading 0: 32%|███▏ | 164/507 [00:04<00:09, 36.36it/s] Loading 0: 33%|███▎ | 169/507 [00:05<00:12, 27.46it/s] Loading 0: 34%|███▍ | 173/507 [00:05<00:11, 29.19it/s] Loading 0: 35%|███▍ | 177/507 [00:05<00:11, 28.96it/s] Loading 0: 36%|███▌ | 183/507 [00:05<00:09, 34.70it/s] Loading 0: 37%|███▋ | 187/507 [00:05<00:09, 34.58it/s] Loading 0: 38%|███▊ | 192/507 [00:05<00:08, 37.78it/s] Loading 0: 39%|███▊ | 196/507 [00:05<00:08, 36.42it/s] Loading 0: 40%|███▉ | 201/507 [00:05<00:08, 37.38it/s] Loading 0: 40%|████ | 205/507 [00:06<00:08, 36.96it/s] Loading 0: 41%|████▏ | 210/507 [00:06<00:07, 39.94it/s] Loading 0: 42%|████▏ | 215/507 [00:06<00:07, 40.28it/s] Loading 0: 43%|████▎ | 220/507 [00:06<00:08, 35.15it/s] Loading 0: 44%|████▍ | 224/507 [00:06<00:10, 26.39it/s] Loading 0: 45%|████▌ | 230/507 [00:06<00:10, 27.64it/s] Loading 0: 47%|████▋ | 237/507 [00:07<00:07, 33.93it/s] Loading 0: 48%|████▊ | 241/507 [00:07<00:07, 33.76it/s] Loading 0: 49%|████▊ | 246/507 [00:07<00:07, 36.16it/s] Loading 0: 49%|████▉ | 250/507 [00:07<00:07, 35.56it/s] Loading 0: 50%|█████ | 255/507 [00:07<00:06, 37.36it/s] Loading 0: 51%|█████ | 259/507 [00:07<00:06, 36.17it/s] Loading 0: 52%|█████▏ | 264/507 [00:07<00:06, 38.59it/s] Loading 0: 53%|█████▎ | 268/507 [00:07<00:06, 37.12it/s] Loading 0: 54%|█████▍ | 273/507 [00:07<00:05, 39.19it/s] Loading 0: 55%|█████▍ | 277/507 [00:08<00:06, 36.68it/s] Loading 0: 56%|█████▌ | 283/507 [00:08<00:06, 36.81it/s] Loading 0: 57%|█████▋ | 287/507 [00:08<00:09, 24.24it/s] Loading 0: 58%|█████▊ | 293/507 [00:08<00:07, 27.77it/s] Loading 0: 59%|█████▉ | 299/507 [00:23<00:07, 27.77it/s] Loading 0: 59%|█████▉ | 300/507 [00:23<02:42, 1.27it/s] Loading 0: 60%|█████▉ | 302/507 [00:23<02:21, 1.45it/s] Loading 0: 61%|██████ | 307/507 [00:23<01:35, 2.09it/s] Loading 0: 61%|██████ | 310/507 [00:23<01:16, 2.58it/s] Loading 0: 62%|██████▏ | 313/507 [00:23<00:58, 3.29it/s] Loading 0: 63%|██████▎ | 318/507 [00:23<00:38, 4.93it/s] Loading 0: 64%|██████▎ | 322/507 [00:23<00:28, 6.56it/s] Loading 0: 64%|██████▍ | 327/507 [00:23<00:19, 9.30it/s] Loading 0: 65%|██████▌ | 331/507 [00:24<00:15, 11.67it/s] Loading 0: 66%|██████▌ | 335/507 [00:24<00:11, 14.57it/s] Loading 0: 67%|██████▋ | 340/507 [00:24<00:10, 15.96it/s] Loading 0: 68%|██████▊ | 344/507 [00:24<00:08, 18.78it/s] Loading 0: 69%|██████▊ | 348/507 [00:24<00:07, 20.68it/s] Loading 0: 70%|██████▉ | 354/507 [00:24<00:05, 26.96it/s] Loading 0: 71%|███████ | 358/507 [00:24<00:05, 28.46it/s] Loading 0: 72%|███████▏ | 363/507 [00:25<00:04, 32.38it/s] Loading 0: 72%|███████▏ | 367/507 [00:25<00:04, 32.31it/s] Loading 0: 73%|███████▎ | 372/507 [00:25<00:03, 34.34it/s] Loading 0: 74%|███████▍ | 376/507 [00:25<00:03, 34.82it/s] Loading 0: 75%|███████▌ | 381/507 [00:25<00:03, 38.18it/s] Loading 0: 76%|███████▌ | 386/507 [00:25<00:03, 39.07it/s] Loading 0: 77%|███████▋ | 391/507 [00:25<00:03, 34.52it/s] Loading 0: 78%|███████▊ | 395/507 [00:26<00:04, 26.47it/s] Loading 0: 79%|███████▉ | 401/507 [00:26<00:03, 28.93it/s] Loading 0: 80%|████████ | 408/507 [00:26<00:02, 35.24it/s] Loading 0: 81%|████████▏ | 412/507 [00:26<00:02, 34.20it/s] Loading 0: 82%|████████▏ | 417/507 [00:26<00:02, 36.60it/s] Loading 0: 83%|████████▎ | 421/507 [00:26<00:02, 35.83it/s] Loading 0: 84%|████████▍ | 426/507 [00:26<00:02, 38.69it/s] Loading 0: 85%|████████▌ | 431/507 [00:26<00:01, 38.46it/s] Loading 0: 86%|████████▌ | 436/507 [00:27<00:01, 39.23it/s] Loading 0: 87%|████████▋ | 440/507 [00:27<00:01, 39.21it/s] Loading 0: 88%|████████▊ | 445/507 [00:27<00:01, 39.86it/s] Loading 0: 89%|████████▉ | 450/507 [00:27<00:01, 42.16it/s] Loading 0: 90%|████████▉ | 455/507 [00:29<00:08, 6.39it/s] Loading 0: 91%|█████████ | 459/507 [00:29<00:05, 8.01it/s] Loading 0: 92%|█████████▏| 465/507 [00:30<00:03, 11.17it/s] Loading 0: 93%|█████████▎| 472/507 [00:30<00:02, 15.89it/s] Loading 0: 94%|█████████▍| 476/507 [00:30<00:01, 18.20it/s] Loading 0: 95%|█████████▍| 481/507 [00:30<00:01, 22.13it/s] Loading 0: 96%|█████████▌| 486/507 [00:30<00:00, 25.32it/s] Loading 0: 97%|█████████▋| 490/507 [00:30<00:00, 27.23it/s] Loading 0: 97%|█████████▋| 494/507 [00:30<00:00, 27.98it/s] Loading 0: 98%|█████████▊| 499/507 [00:30<00:00, 31.38it/s] Loading 0: 99%|█████████▉| 503/507 [00:30<00:00, 32.20it/s] Traceback (most recent call last):
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/code/uploading/mkmlize.py", line 151, in <module>
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: cli()
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/opt/conda/lib/python3.10/site-packages/click/core.py", line 1157, in __call__
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: return self.main(*args, **kwargs)
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/opt/conda/lib/python3.10/site-packages/click/core.py", line 1078, in main
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: rv = self.invoke(ctx)
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/opt/conda/lib/python3.10/site-packages/click/core.py", line 1688, in invoke
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: return _process_result(sub_ctx.command.invoke(sub_ctx))
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/opt/conda/lib/python3.10/site-packages/click/core.py", line 1434, in invoke
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: return ctx.invoke(self.callback, **ctx.params)
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/opt/conda/lib/python3.10/site-packages/click/core.py", line 783, in invoke
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: return __callback(*args, **kwargs)
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/code/uploading/mkmlize.py", line 42, in quantize
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: quantize_model(temp_folder, output_path, profile, device)
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/code/uploading/mkmlize.py", line 135, in quantize_model
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: flywheel.instrument(
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/opt/conda/lib/python3.10/site-packages/mk1/flywheel/instrument.py", line 96, in instrument
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: tokenizer = AutoTokenizer.from_pretrained(input_model_path, verbose=False)
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/opt/conda/lib/python3.10/site-packages/transformers/models/auto/tokenization_auto.py", line 897, in from_pretrained
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: return tokenizer_class.from_pretrained(pretrained_model_name_or_path, *inputs, **kwargs)
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/opt/conda/lib/python3.10/site-packages/transformers/tokenization_utils_base.py", line 2271, in from_pretrained
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: return cls._from_pretrained(
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/opt/conda/lib/python3.10/site-packages/transformers/tokenization_utils_base.py", line 2505, in _from_pretrained
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: tokenizer = cls(*init_inputs, **init_kwargs)
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/opt/conda/lib/python3.10/site-packages/transformers/models/llama/tokenization_llama_fast.py", line 157, in __init__
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: super().__init__(
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: File "/opt/conda/lib/python3.10/site-packages/transformers/tokenization_utils_fast.py", line 115, in __init__
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: fast_tokenizer = TokenizerFast.from_file(fast_tokenizer_file)
zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer: Exception: data did not match any variant of untagged enum ModelWrapper at line 275732 column 3
Job zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer completed after 117.42s with status: failed
Stopping job with name zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer
%s, retrying in %s seconds...
Starting job with name zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer
Waiting for job on zonemercy-vingt-deux-v5-1e5v0-v5-mkmlizer to finish
Inference service nousresearch-hermes-2-pr-1418-v5 ready after 350.7747962474823s
Pipeline stage MKMLDeployer completed in 351.11s
run pipeline stage %s
Running pipeline stage StressChecker
Received healthy response to inference request in 1.4446451663970947s
Received healthy response to inference request in 0.8907690048217773s
Received healthy response to inference request in 0.8413486480712891s
Received healthy response to inference request in 1.2591774463653564s
Received healthy response to inference request in 0.9848537445068359s
5 requests
0 failed requests
5th percentile: 0.8512327194213867
10th percentile: 0.8611167907714844
20th percentile: 0.8808849334716797
30th percentile: 0.9095859527587891
40th percentile: 0.9472198486328125
50th percentile: 0.9848537445068359
60th percentile: 1.094583225250244
70th percentile: 1.2043127059936523
80th percentile: 1.2962709903717042
90th percentile: 1.3704580783843994
95th percentile: 1.407551622390747
99th percentile: 1.4372264575958251
mean time: 1.0841588020324706
Pipeline stage StressChecker completed in 8.34s
run pipeline stage %s
Running pipeline stage TriggerMKMLProfilingPipeline
run_pipeline:run_in_cloud %s
starting trigger_guanaco_pipeline args=%s
Pipeline stage TriggerMKMLProfilingPipeline completed in 5.30s
Shutdown handler de-registered
nousresearch-hermes-2-pr_1418_v5 status is now deployed due to DeploymentManager action
Shutdown handler registered
run pipeline %s
run pipeline stage %s
Running pipeline stage MKMLProfilerDeleter
Skipping teardown as no inference service was successfully deployed
Pipeline stage MKMLProfilerDeleter completed in 0.23s
run pipeline stage %s
Running pipeline stage MKMLProfilerTemplater
Pipeline stage MKMLProfilerTemplater completed in 0.15s
run pipeline stage %s
Running pipeline stage MKMLProfilerDeployer
Creating inference service nousresearch-hermes-2-pr-1418-v5-profiler
Waiting for inference service nousresearch-hermes-2-pr-1418-v5-profiler to be ready
Inference service nousresearch-hermes-2-pr-1418-v5-profiler ready after 210.55639100074768s
Pipeline stage MKMLProfilerDeployer completed in 211.00s
run pipeline stage %s
Running pipeline stage MKMLProfilerRunner
kubectl cp /code/guanaco/guanaco_inference_services/src/inference_scripts tenant-chaiml-guanaco/nousresearch-hermes-dd6d96ce67f486b5e6a67ddfd92844d2-deplobp9wj:/code/chaiverse_profiler_1727371542 --namespace tenant-chaiml-guanaco
kubectl exec -it nousresearch-hermes-dd6d96ce67f486b5e6a67ddfd92844d2-deplobp9wj --namespace tenant-chaiml-guanaco -- sh -c 'cd /code/chaiverse_profiler_1727371542 && python profiles.py profile --best_of_n 4 --auto_batch 5 --batches 1,5,10,15,20,25,30,35,40,45,50,55,60,65,70,75,80,85,90,95,100,105,110,115,120,125,130,135,140,145,150,155,160,165,170,175,180,185,190,195 --samples 200 --input_tokens 1024 --output_tokens 64 --summary /code/chaiverse_profiler_1727371542/summary.json'
kubectl exec -it nousresearch-hermes-dd6d96ce67f486b5e6a67ddfd92844d2-deplobp9wj --namespace tenant-chaiml-guanaco -- bash -c 'cat /code/chaiverse_profiler_1727371542/summary.json'
Pipeline stage MKMLProfilerRunner completed in 488.91s
run pipeline stage %s
Running pipeline stage MKMLProfilerDeleter
Checking if service nousresearch-hermes-2-pr-1418-v5-profiler is running
Tearing down inference service nousresearch-hermes-2-pr-1418-v5-profiler
Service nousresearch-hermes-2-pr-1418-v5-profiler has been torndown
Pipeline stage MKMLProfilerDeleter completed in 2.49s
Shutdown handler de-registered
nousresearch-hermes-2-pr_1418_v5 status is now inactive due to auto deactivation removed underperforming models
chaiml-albert-dpo-0912-v_1751_v2 status is now torndown due to DeploymentManager action
Cleaning model data from model cache
Deleting key chaiml-albert-dpo-0912-v-8296-v2/config.json from bucket guanaco-mkml-models
function_rihet_2024-09-26 status is now torndown due to DeploymentManager action
Shutdown handler de-registered
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of nousresearch-hermes-2-pr_1418_v5
Deleting key chaiml-albert-dpo-0912-v-9673-v1/config.json from bucket guanaco-mkml-models
Deleting key chaiml-albert-dpo-0912-v-8296-v2/flywheel_model.0.safetensors from bucket guanaco-mkml-models
function_todun_2024-09-26 status is now torndown due to DeploymentManager action
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of rirv938-llama-8b-big-ret_5210_v1
Deleting key chaiml-albert-dpo-0912-v-9673-v1/flywheel_model.0.safetensors from bucket guanaco-mkml-models
Deleting key chaiml-albert-dpo-0912-v-8296-v2/special_tokens_map.json from bucket guanaco-mkml-models
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of rirv938-llama-8b-big-ret_5422_v1
Deleting key chaiml-albert-dpo-0912-v-9673-v1/special_tokens_map.json from bucket guanaco-mkml-models
Deleting key chaiml-albert-dpo-0912-v-8296-v2/tokenizer.json from bucket guanaco-mkml-models
Checking if service jic062-dpo-v1-9-nemo-v1 is running
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of rirv938-llama-8b-big-ret_9237_v3
Deleting key chaiml-albert-dpo-0912-v-9673-v1/tokenizer.json from bucket guanaco-mkml-models
Deleting key chaiml-albert-dpo-0912-v-8296-v2/tokenizer_config.json from bucket guanaco-mkml-models
Checking if service jic062-dpo-v1-9-nemo-v2 is running
Running pipeline stage MKMLDeleter
Tearing down inference service jic062-dpo-v1-9-nemo-v1
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-cogent-nemo-v_3266_v11
Deleting key chaiml-albert-dpo-0912-v-9673-v1/tokenizer_config.json from bucket guanaco-mkml-models
Pipeline stage MKMLModelDeleter completed in 98.68s
Checking if service nousresearch-hermes-2-pr-1418-v5 is running
Tearing down inference service jic062-dpo-v1-9-nemo-v2
Service jic062-dpo-v1-9-nemo-v1 has been torndown
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-elite-edit-v1-1e5_v1
Pipeline stage MKMLModelDeleter completed in 98.22s
Shutdown handler de-registered
Tearing down inference service nousresearch-hermes-2-pr-1418-v5
Service jic062-dpo-v1-9-nemo-v2 has been torndown
Pipeline stage MKMLDeleter completed in 52.77s
Checking if service rirv938-llama-8b-big-ret-5210-v1 is running
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-elite-pref-v4-1e5_v1
Shutdown handler de-registered
chaiml-albert-dpo-0912-v_8296_v2 status is now torndown due to DeploymentManager action
Service nousresearch-hermes-2-pr-1418-v5 has been torndown
Pipeline stage MKMLDeleter completed in 56.75s
run pipeline stage %s
Checking if service rirv938-llama-8b-big-ret-5422-v1 is running
Running pipeline stage MKMLDeleter
Tearing down inference service rirv938-llama-8b-big-ret-5210-v1
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-vingt-deux-gfv_4513_v1
chaiml-albert-dpo-0912-v_9673_v1 status is now torndown due to DeploymentManager action
Pipeline stage MKMLDeleter completed in 65.22s
run pipeline stage %s
Running pipeline stage MKMLModelDeleter
Tearing down inference service rirv938-llama-8b-big-ret-5422-v1
Checking if service rirv938-llama-8b-big-ret-9237-v3 is running
Service rirv938-llama-8b-big-ret-5210-v1 has been torndown
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-virgo-edit-v3-_7871_v1
run pipeline stage %s
Running pipeline stage MKMLModelDeleter
Cleaning model data from S3
Service rirv938-llama-8b-big-ret-5422-v1 has been torndown
Tearing down inference service rirv938-llama-8b-big-ret-9237-v3
Pipeline stage MKMLDeleter completed in 73.20s
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLDeleter
admin requested tearing down of chaiml-0916-intent-suppo_6584_v3
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of blend_rofur_2024-10-03
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
Cleaning model data from S3
Running pipeline stage MKMLModelDeleter
admin requested tearing down of blend_rofur_2024-10-03
Cleaning model data from model cache
Pipeline stage MKMLDeleter completed in 119.45s
Service rirv938-llama-8b-big-ret-9237-v3 has been torndown
run pipeline stage %s
Pipeline stage MKMLDeleter completed in 88.17s
Checking if service zonemercy-elite-edit-v1-1e5-v1 is running
Shutdown handler not registered because Python interpreter is not running in the main thread
Shutdown handler not registered because Python interpreter is not running in the main thread
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline %s
Running pipeline stage MKMLDeleter
run pipeline stage %s
Cleaning model data from model cache
Cleaning model data from S3
Shutdown handler not registered because Python interpreter is not running in the main thread
Deleting key jic062-dpo-v1-9-nemo-v1/config.json from bucket guanaco-mkml-models
run pipeline stage %s
Pipeline stage MKMLDeleter completed in 154.64s
Running pipeline stage MKMLModelDeleter
run pipeline stage %s
run pipeline %s
run pipeline %s
Skipping teardown as no inference service was found
run pipeline %s
run pipeline stage %s
Checking if service zonemercy-elite-pref-v4-1e5-v1 is running
Running pipeline stage MKMLDeleter
Deleting key jic062-dpo-v1-9-nemo-v2/config.json from bucket guanaco-mkml-models
Cleaning model data from model cache
run pipeline %s
Deleting key jic062-dpo-v1-9-nemo-v1/flywheel_model.0.safetensors from bucket guanaco-mkml-models
Running pipeline stage MKMLModelDeleter
run pipeline stage %s
Cleaning model data from S3
Running pipeline stage MKMLModelDeleter
run pipeline stage %s
run pipeline stage %s
Pipeline stage MKMLDeleter completed in 182.27s
run pipeline stage %s
Running pipeline stage MKMLDeleter
Tearing down inference service zonemercy-elite-pref-v4-1e5-v1
Checking if service zonemercy-vingt-deux-gfv-4513-v1 is running
Deleting key jic062-dpo-v1-9-nemo-v2/flywheel_model.0.safetensors from bucket guanaco-mkml-models
Deleting key nousresearch-hermes-2-pr-1418-v5/added_tokens.json from bucket guanaco-mkml-models
run pipeline stage %s
Deleting key jic062-dpo-v1-9-nemo-v1/special_tokens_map.json from bucket guanaco-mkml-models
Cleaning model data from S3
Running pipeline stage MKMLModelDeleter
Cleaning model data from model cache
Cleaning model data from S3
Running pipeline stage MKMLDeleter
Running pipeline stage ProductionBlendMKMLTemplater
run pipeline stage %s
Running pipeline stage ProductionBlendMKMLTemplater
Checking if service zonemercy-virgo-edit-v3-7871-v1 is running
Service zonemercy-elite-pref-v4-1e5-v1 has been torndown
Tearing down inference service zonemercy-vingt-deux-gfv-4513-v1
Deleting key jic062-dpo-v1-9-nemo-v2/special_tokens_map.json from bucket guanaco-mkml-models
Deleting key nousresearch-hermes-2-pr-1418-v5/config.json from bucket guanaco-mkml-models
Running pipeline stage ProductionBlendMKMLTemplater
Deleting key jic062-dpo-v1-9-nemo-v1/tokenizer.json from bucket guanaco-mkml-models
Cleaning model data from model cache
Cleaning model data from S3
Deleting key rirv938-llama-8b-big-ret-5210-v1/config.json from bucket guanaco-mkml-models
Cleaning model data from model cache
Pipeline stage %s skipped, reason=%s
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLModelDeleter
Pipeline stage %s skipped, reason=%s
Tearing down inference service zonemercy-virgo-edit-v3-7871-v1
admin requested tearing down of chaiml-0916-intent-suppo_6584_v3
Pipeline stage MKMLDeleter completed in 215.40s
admin requested tearing down of blend_rofur_2024-10-03
Service zonemercy-vingt-deux-gfv-4513-v1 has been torndown
Deleting key jic062-dpo-v1-9-nemo-v2/tokenizer.json from bucket guanaco-mkml-models
Deleting key nousresearch-hermes-2-pr-1418-v5/flywheel_model.0.safetensors from bucket guanaco-mkml-models
admin requested tearing down of blend_rofur_2024-10-03
Pipeline stage %s skipped, reason=%s
Deleting key jic062-dpo-v1-9-nemo-v1/tokenizer_config.json from bucket guanaco-mkml-models
Deleting key rirv938-llama-8b-big-ret-5422-v1/config.json from bucket guanaco-mkml-models
Cleaning model data from model cache
Deleting key rirv938-llama-8b-big-ret-5210-v1/flywheel_model.0.safetensors from bucket guanaco-mkml-models
Deleting key zonemercy-cogent-nemo-v-3266-v11/config.json from bucket guanaco-mkml-models
Pipeline stage MKMLDeleter completed in 144.20s
Pipeline stage ProductionBlendMKMLTemplater completed in 146.69s
Cleaning model data from S3
Pipeline stage ProductionBlendMKMLTemplater completed in 151.85s
Service zonemercy-virgo-edit-v3-7871-v1 has been torndown
Shutdown handler not registered because Python interpreter is not running in the main thread
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline stage %s
Pipeline stage MKMLDeleter completed in 282.47s
Deleting key jic062-dpo-v1-9-nemo-v2/tokenizer_config.json from bucket guanaco-mkml-models
Deleting key nousresearch-hermes-2-pr-1418-v5/special_tokens_map.json from bucket guanaco-mkml-models
Shutdown handler not registered because Python interpreter is not running in the main thread
Pipeline stage ProductionBlendMKMLTemplater completed in 178.13s
Pipeline stage MKMLModelDeleter completed in 481.79s
Tearing down inference service blend-rofur-2024-10-03
Deleting key rirv938-llama-8b-big-ret-5422-v1/flywheel_model.0.safetensors from bucket guanaco-mkml-models
Deleting key rirv938-llama-8b-big-ret-5210-v1/special_tokens_map.json from bucket guanaco-mkml-models
Deleting key rirv938-llama-8b-big-ret-9237-v3/config.json from bucket guanaco-mkml-models
Deleting key zonemercy-cogent-nemo-v-3266-v11/flywheel_model.0.safetensors from bucket guanaco-mkml-models
run pipeline stage %s
run pipeline stage %s
Cleaning model data from model cache
run pipeline stage %s
run pipeline %s
Pipeline stage MKMLDeleter completed in 320.87s
run pipeline %s
Running pipeline stage MKMLModelDeleter
run pipeline stage %s
Pipeline stage MKMLModelDeleter completed in 549.00s
Deleting key nousresearch-hermes-2-pr-1418-v5/tokenizer.json from bucket guanaco-mkml-models
run pipeline %s
run pipeline stage %s
Shutdown handler de-registered
%s, retrying in %s seconds...
Deleting key rirv938-llama-8b-big-ret-5422-v1/special_tokens_map.json from bucket guanaco-mkml-models
Deleting key rirv938-llama-8b-big-ret-5210-v1/tokenizer.json from bucket guanaco-mkml-models
Deleting key rirv938-llama-8b-big-ret-9237-v3/flywheel_model.0.safetensors from bucket guanaco-mkml-models
Deleting key zonemercy-cogent-nemo-v-3266-v11/special_tokens_map.json from bucket guanaco-mkml-models
Running pipeline stage MKMLModelDeleter
Running pipeline stage MKMLDeployer
Deleting key zonemercy-elite-edit-v1-1e5-v1/config.json from bucket guanaco-mkml-models
Running pipeline stage MKMLDeployer
admin requested tearing down of chaiml-0916-intent-suppo_6584_v3
run pipeline stage %s
admin requested tearing down of blend_rofur_2024-10-03
run pipeline stage %s
run pipeline stage %s
admin requested tearing down of blend_rofur_2024-10-03
Cleaning model data from S3
Running pipeline stage MKMLModelDeleter
Shutdown handler de-registered
Deleting key nousresearch-hermes-2-pr-1418-v5/tokenizer.model from bucket guanaco-mkml-models
run pipeline stage %s
Running pipeline stage MKMLDeployer
jic062-dpo-v1-9-nemo_v1 status is now torndown due to DeploymentManager action
Deleting key rirv938-llama-8b-big-ret-9237-v3/special_tokens_map.json from bucket guanaco-mkml-models
Creating inference service blend-rofur-2024-10-03
Connection pool is full, discarding connection: %s. Connection pool size: %s
Running pipeline stage ProductionBlendMKMLTemplater
Shutdown handler not registered because Python interpreter is not running in the main thread
Cleaning model data from S3
jic062-dpo-v1-9-nemo_v2 status is now torndown due to DeploymentManager action
Deleting key nousresearch-hermes-2-pr-1418-v5/tokenizer_config.json from bucket guanaco-mkml-models
Running pipeline stage ProductionBlendMKMLTemplater
Deleting key rirv938-llama-8b-big-ret-9237-v3/tokenizer.json from bucket guanaco-mkml-models
Creating inference service blend-rofur-2024-10-03
Waiting for inference service blend-rofur-2024-10-03 to be ready
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
admin requested tearing down of chaiml-0916-intent-suppo_6584_v3
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of chaiml-0916-intent-suppo_6584_v3
admin requested tearing down of blend_rofur_2024-10-03
Deleting key rirv938-llama-8b-big-ret-5422-v1/tokenizer.json from bucket guanaco-mkml-models
run pipeline stage %s
Cleaning model data from model cache
run pipeline stage %s
Cleaning model data from S3
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLDeployer
run pipeline stage %s
Running pipeline stage MKMLDeployer
Shutdown handler de-registered
nousresearch-hermes-2-pr_1418_v5 status is now torndown due to DeploymentManager action
Pipeline stage MKMLModelDeleter completed in 147.96s
run pipeline %s
run pipeline stage %s
run pipeline stage %s
run pipeline stage %s
run pipeline %s
Running pipeline stage MKMLModelDeleter
Pipeline stage MKMLDeleter completed in 131.01s
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLModelDeleter
Pipeline stage MKMLModelDeleter completed in 96.16s
nousresearch-hermes-2-pr_1418_v5 status is now torndown due to DeploymentManager action
run pipeline stage %s
Running pipeline stage ProductionBlendMKMLTemplater
mistralai-mistral-nemo-9330-v138-mkmlizer: quantized model in 37.014s
Running pipeline stage MKMLDeleter
Running pipeline stage MKMLDeleter
Pipeline stage MKMLDeleter completed in 118.42s
Pipeline stage %s skipped, reason=%s
Shutdown handler de-registered
Pipeline stage MKMLModelDeleter completed in 115.88s
Running pipeline stage ProductionBlendMKMLTemplater
nousresearch-hermes-2-pr_1418_v5 status is now torndown due to DeploymentManager action
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLModelDeleter
Running pipeline stage ProductionBlendMKMLTemplater
Pipeline stage %s skipped, reason=%s
Shutdown handler de-registered
Pipeline stage MKMLModelDeleter completed in 60.27s
Skipping deletion as no model was successfully uploaded
Running pipeline stage MKMLModelDeleter
run pipeline stage %s
Pipeline stage MKMLDeleter completed in 60.42s
chaiml-albert-dpo-0912-v_1751_v2 status is now torndown due to DeploymentManager action
Shutdown handler de-registered
Pipeline stage MKMLModelDeleter completed in 58.60s
function_rihet_2024-09-26 status is now torndown due to DeploymentManager action
Shutdown handler de-registered
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of nousresearch-hermes-2-pr_1418_v5
mistralai-mistral-nemo_9330_v138 status is now torndown due to DeploymentManager action
Shutdown handler de-registered
Shutdown handler de-registered
Pipeline stage MKMLModelDeleter completed in 54.45s
Skipping deletion as no model was successfully uploaded
Running pipeline stage MKMLModelDeleter
run pipeline stage %s
admin requested tearing down of chaiml-0916-intent-suppo_6584_v3
admin requested tearing down of blend_rofur_2024-10-03
chaiml-albert-dpo-0912-v_8296_v2 status is now torndown due to DeploymentManager action
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of rirv938-llama-8b-big-ret_5210_v1
mistralai-mistral-nemo_9330_v140 status is now torndown due to DeploymentManager action
Shutdown handler de-registered
Running pipeline stage MKMLModelDeleter
Skipping deletion as no model was successfully uploaded
Shutdown handler not registered because Python interpreter is not running in the main thread
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of chaiml-0917-bot-dominant_6324_v5
admin requested tearing down of mistralai-mistral-nemo_9330_v140
chaiml-albert-dpo-0912-v_9673_v1 status is now torndown due to DeploymentManager action
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of rirv938-llama-8b-big-ret_5422_v1
mistralai-mistral-nemo_9330_v141 status is now torndown due to DeploymentManager action
Skipping deletion as no model was successfully uploaded
Shutdown handler de-registered
run pipeline %s
Pipeline stage MKMLModelDeleter completed in 92.57s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of chaiml-albert-dpo-0912-v_1751_v2
chaiml-albert-dpo-0912-v_1751_v2 status is now torndown due to DeploymentManager action
Shutdown handler de-registered
admin requested tearing down of nousresearch-hermes-2-pr_1418_v5
Shutdown handler de-registered
chaiml-albert-dpo-0912-v_8296_v2 status is now torndown due to DeploymentManager action
function_todun_2024-09-26 status is now torndown due to DeploymentManager action
run pipeline stage %s
run pipeline %s
admin requested tearing down of rirv938-llama-8b-big-ret_5210_v1
chaiml-albert-dpo-0912-v_9673_v1 status is now torndown due to DeploymentManager action
admin requested tearing down of chaiml-0916-intent-suppo_6584_v3
admin requested tearing down of blend_rofur_2024-10-03
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of rirv938-llama-8b-big-ret_5422_v1
Shutdown handler not registered because Python interpreter is not running in the main thread
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of chaiml-0917-bot-dominant_6324_v5
admin requested tearing down of mistralai-mistral-small_5341_v42
Running pipeline stage MKMLDeleter
Pipeline stage %s skipped, reason=%s
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of rirv938-llama-8b-big-ret_9237_v3
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline %s
admin requested tearing down of chaiml-albert-dpo-0912-v_1751_v2
Shutdown handler not registered because Python interpreter is not running in the main thread
Pipeline stage %s skipped, reason=%s
admin requested tearing down of zonemercy-viral-ss-v0-1e5_v9
Pipeline stage MKMLDeleter completed in 61.37s
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-cogent-nemo-v_3266_v11
run pipeline stage %s
run pipeline %s
run pipeline stage %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of chaiml-albert-dpo-0912-v_8296_v2
run pipeline %s
Pipeline stage MKMLDeleter completed in 77.41s
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline stage %s
admin requested tearing down of zonemercy-viral-ss-v0-1e5ep2_v22
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Running pipeline stage MKMLDeleter
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-elite-edit-v1-1e5_v1
run pipeline stage %s
Running pipeline stage ProductionBlendMKMLTemplater
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline stage %s
admin requested tearing down of chaiml-albert-dpo-0912-v_9673_v1
run pipeline stage %s
run pipeline %s
Running pipeline stage MKMLModelDeleter
Shutdown handler not registered because Python interpreter is not running in the main thread
Tearing down inference service blend-rofur-2024-10-03
admin requested tearing down of zonemercy-viral-ss-v0-1e5ep2_v23
Pipeline stage MKMLDeleter completed in 98.42s
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLDeleter
run pipeline stage %s
Pipeline stage %s skipped, reason=%s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-elite-pref-v4-1e5_v1
Running pipeline stage MKMLDeleter
Pipeline stage %s skipped, reason=%s
run pipeline stage %s
run pipeline %s
Running pipeline stage MKMLDeleter
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of blend_rofur_2024-10-03
Running pipeline stage MKMLModelDeleter
run pipeline stage %s
Pipeline stage %s skipped, reason=%s
run pipeline %s
%s, retrying in %s seconds...
Tearing down inference service blend-rofur-2024-10-03
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline stage %s
Pipeline stage MKMLDeleter completed in 126.95s
Pipeline stage %s skipped, reason=%s
admin requested tearing down of blend_rofur_2024-10-03
Running pipeline stage MKMLDeleter
Pipeline stage MKMLDeleter completed in 146.90s
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
Pipeline stage %s skipped, reason=%s
admin requested tearing down of chaiml-0916-intent-suppo_6584_v3
admin requested tearing down of blend_rofur_2024-10-03
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Pipeline stage ProductionBlendMKMLTemplater completed in 192.81s
Running pipeline stage MKMLDeleter
run pipeline stage %s
Checking if service mistralai-mistral-small-5341-v42 is running
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
Pipeline stage %s skipped, reason=%s
admin requested tearing down of blend_rofur_2024-10-03
Running pipeline stage MKMLDeleter
Pipeline stage MKMLModelDeleter completed in 222.48s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of chaiml-0916-intent-suppo_6584_v3
admin requested tearing down of blend_rofur_2024-10-03
chaiml-albert-dpo-0912-v_1751_v2 status is now torndown due to DeploymentManager action
Shutdown handler de-registered
Pipeline stage MKMLModelDeleter completed in 31.30s
function_rihet_2024-09-26 status is now torndown due to DeploymentManager action
Shutdown handler de-registered
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of nousresearch-hermes-2-pr_1418_v5
chaiml-albert-dpo-0912-v_8296_v2 status is now torndown due to DeploymentManager action
Shutdown handler de-registered
function_todun_2024-09-26 status is now torndown due to DeploymentManager action
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of rirv938-llama-8b-big-ret_5210_v1
chaiml-albert-dpo-0912-v_9673_v1 status is now torndown due to DeploymentManager action
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of rirv938-llama-8b-big-ret_5422_v1
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of rirv938-llama-8b-big-ret_9237_v3
Pipeline stage MKMLDeleter completed in 19.34s
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-cogent-nemo-v_3266_v11
run pipeline stage %s
Pipeline stage MKMLDeleter completed in 19.97s
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-elite-edit-v1-1e5_v1
Running pipeline stage MKMLModelDeleter
run pipeline stage %s
Pipeline stage MKMLDeleter completed in 22.80s
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-elite-pref-v4-1e5_v1
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLModelDeleter
run pipeline stage %s
Pipeline stage MKMLDeleter completed in 27.09s
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-vingt-deux-gfv_4513_v1
Pipeline stage MKMLModelDeleter completed in 31.17s
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLModelDeleter
admin requested tearing down of chaiml-0916-intent-suppo_6584_v3
run pipeline stage %s
admin requested tearing down of blend_rofur_2024-10-03
Pipeline stage MKMLDeleter completed in 39.32s
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLDeleter
run pipeline stage %s
run pipeline %s
Pipeline stage MKMLModelDeleter completed in 49.49s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-virgo-edit-v3-_7871_v1
Shutdown handler de-registered
Pipeline stage %s skipped, reason=%s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of chaiml-0917-bot-dominant_6324_v5
Running pipeline stage MKMLModelDeleter
Shutdown handler not registered because Python interpreter is not running in the main thread
run pipeline stage %s
Pipeline stage MKMLDeleter completed in 71.47s
Running pipeline stage MKMLDeleter
run pipeline stage %s
Shutdown handler de-registered
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
admin requested tearing down of zonemercy-virgo-edit-v5-1e5b1_v2
jic062-dpo-v1-9-nemo_v1 status is now torndown due to DeploymentManager action
Pipeline stage MKMLModelDeleter completed in 85.36s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
Pipeline stage %s skipped, reason=%s
admin requested tearing down of chaiml-albert-dpo-0912-v_1751_v2
run pipeline %s
Running pipeline stage MKMLModelDeleter
Pipeline stage MKMLDeleter completed in 87.39s
run pipeline stage %s
Pipeline stage %s skipped, reason=%s
Running pipeline stage MKMLDeleter
jic062-dpo-v1-9-nemo_v2 status is now torndown due to DeploymentManager action
run pipeline stage %s
run pipeline %s
Shutdown handler not registered because Python interpreter is not running in the main thread
Shutdown handler de-registered
run pipeline stage %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
Connection pool is full, discarding connection: %s. Connection pool size: %s
run pipeline %s
admin requested tearing down of blend_rofur_2024-10-03
Connection pool is full, discarding connection: %s. Connection pool size: %s
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of blend_dones_2024-09-27
admin requested tearing down of blend_rofur_2024-10-03
Tearing down inference service blend-rofur-2024-10-03
admin requested tearing down of blend_dones_2024-09-27
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of blend_dones_2024-09-27
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of blend_dones_2024-09-27
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of blend_rofur_2024-10-03
admin requested tearing down of blend_rofur_2024-10-03