From fad74b701bae025af7475354a5b96a239446f4a6 Mon Sep 17 00:00:00 2001 From: Li Jiashu Date: Fri, 24 Oct 2025 15:45:06 +0800 Subject: [PATCH] Update to new version of base image --- Dockerfile | 10 +- paged_attn.py | 1 + vllm/__pycache__/__init__.cpython-310.pyc | Bin 1152 -> 1148 bytes vllm/__pycache__/_core_ext.cpython-310.pyc | Bin 9616 -> 9612 bytes vllm/__pycache__/_custom_ops.cpython-310.pyc | Bin 31185 -> 31179 bytes vllm/__pycache__/_ipex_ops.cpython-310.pyc | Bin 6562 -> 6558 bytes vllm/__pycache__/beam_search.cpython-310.pyc | Bin 2439 -> 2435 bytes vllm/__pycache__/block.cpython-310.pyc | Bin 3453 -> 3449 bytes vllm/__pycache__/config.cpython-310.pyc | Bin 58859 -> 58835 bytes vllm/__pycache__/connections.cpython-310.pyc | Bin 4879 -> 4875 bytes vllm/__pycache__/envs.cpython-310.pyc | Bin 11501 -> 11644 bytes .../forward_context.cpython-310.pyc | Bin 745 -> 741 bytes vllm/__pycache__/logger.cpython-310.pyc | Bin 4037 -> 4033 bytes vllm/__pycache__/outputs.cpython-310.pyc | Bin 9660 -> 9654 bytes .../pooling_params.cpython-310.pyc | Bin 1047 -> 1043 bytes .../sampling_params.cpython-310.pyc | Bin 17076 -> 17070 bytes vllm/__pycache__/scalar_type.cpython-310.pyc | Bin 814 -> 810 bytes vllm/__pycache__/scripts.cpython-310.pyc | Bin 5134 -> 5130 bytes vllm/__pycache__/sequence.cpython-310.pyc | Bin 46643 -> 46639 bytes vllm/__pycache__/tracing.cpython-310.pyc | Bin 4450 -> 4446 bytes vllm/__pycache__/utils.cpython-310.pyc | Bin 41033 -> 41025 bytes vllm/__pycache__/version.cpython-310.pyc | Bin 211 -> 207 bytes vllm/_custom_ops.py | 2 +- .../__pycache__/__init__.cpython-310.pyc | Bin 165 -> 161 bytes .../__pycache__/layers.cpython-310.pyc | Bin 684 -> 680 bytes .../__pycache__/models.cpython-310.pyc | Bin 4228 -> 4224 bytes .../__pycache__/request.cpython-310.pyc | Bin 1207 -> 1203 bytes .../__pycache__/utils.cpython-310.pyc | Bin 2983 -> 2979 bytes .../worker_manager.cpython-310.pyc | Bin 1754 -> 1750 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 156 -> 152 bytes vllm/assets/__pycache__/audio.cpython-310.pyc | Bin 1264 -> 1260 bytes vllm/assets/__pycache__/base.cpython-310.pyc | Bin 1285 -> 1281 bytes vllm/assets/__pycache__/image.cpython-310.pyc | Bin 1174 -> 1221 bytes vllm/assets/__pycache__/video.cpython-310.pyc | Bin 2868 -> 2864 bytes vllm/assets/image.py | 2 +- .../__pycache__/__init__.cpython-310.pyc | Bin 523 -> 519 bytes .../__pycache__/layer.cpython-310.pyc | Bin 3240 -> 3236 bytes .../__pycache__/selector.cpython-310.pyc | Bin 7285 -> 7211 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 168 -> 164 bytes .../__pycache__/abstract.cpython-310.pyc | Bin 8560 -> 8554 bytes .../blocksparse_attn.cpython-310.pyc | Bin 10203 -> 10195 bytes .../__pycache__/flash_attn.cpython-310.pyc | Bin 21141 -> 21133 bytes .../__pycache__/flashinfer.cpython-310.pyc | Bin 20844 -> 20838 bytes .../__pycache__/ipex_attn.cpython-310.pyc | Bin 9222 -> 9214 bytes .../__pycache__/openvino.cpython-310.pyc | Bin 4008 -> 4004 bytes .../__pycache__/pallas.cpython-310.pyc | Bin 7382 -> 7378 bytes .../placeholder_attn.cpython-310.pyc | Bin 8326 -> 8322 bytes .../rocm_flash_attn.cpython-310.pyc | Bin 15131 -> 15127 bytes .../__pycache__/torch_sdpa.cpython-310.pyc | Bin 13858 -> 13852 bytes .../__pycache__/utils.cpython-310.pyc | Bin 12352 -> 12346 bytes .../__pycache__/xformers.cpython-310.pyc | Bin 18770 -> 18760 bytes .../ops/__pycache__/__init__.cpython-310.pyc | Bin 163 -> 159 bytes .../ops/__pycache__/ipex_attn.cpython-310.pyc | Bin 3804 -> 3800 bytes .../__pycache__/paged_attn.cpython-310.pyc | Bin 5238 -> 5232 bytes .../prefix_prefill.cpython-310.pyc | Bin 11986 -> 11976 bytes .../triton_flash_attention.cpython-310.pyc | Bin 10389 -> 10385 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 185 -> 181 bytes ...ocksparse_attention_kernel.cpython-310.pyc | Bin 6627 -> 6619 bytes .../__pycache__/interface.cpython-310.pyc | Bin 7332 -> 7326 bytes .../__pycache__/utils.cpython-310.pyc | Bin 6723 -> 6719 bytes vllm/attention/ops/paged_attn.py | 5 +- vllm/attention/ops/prefix_prefill.py | 4 - vllm/attention/selector.py | 3 - .../__pycache__/__init__.cpython-310.pyc | Bin 161 -> 157 bytes .../__pycache__/backends.cpython-310.pyc | Bin 5078 -> 5072 bytes .../compile_context.cpython-310.pyc | Bin 775 -> 771 bytes .../__pycache__/decorators.cpython-310.pyc | Bin 3458 -> 3454 bytes .../__pycache__/levels.cpython-310.pyc | Bin 448 -> 444 bytes .../__pycache__/wrapper.cpython-310.pyc | Bin 3866 -> 3862 bytes .../core/__pycache__/__init__.cpython-310.pyc | Bin 154 -> 150 bytes .../block_manager_v1.cpython-310.pyc | Bin 20021 -> 20013 bytes .../block_manager_v2.cpython-310.pyc | Bin 15123 -> 15119 bytes .../__pycache__/evictor_v1.cpython-310.pyc | Bin 4170 -> 4166 bytes .../__pycache__/evictor_v2.cpython-310.pyc | Bin 5081 -> 5077 bytes .../__pycache__/interfaces.cpython-310.pyc | Bin 4797 -> 4793 bytes ...holder_block_space_manager.cpython-310.pyc | Bin 4349 -> 4345 bytes .../__pycache__/scheduler.cpython-310.pyc | Bin 38351 -> 38323 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 160 -> 156 bytes .../__pycache__/block_table.cpython-310.pyc | Bin 13230 -> 13226 bytes .../block/__pycache__/common.cpython-310.pyc | Bin 13454 -> 13450 bytes .../cpu_gpu_block_allocator.cpython-310.pyc | Bin 15406 -> 15402 bytes .../__pycache__/interfaces.cpython-310.pyc | Bin 10841 -> 10837 bytes .../__pycache__/naive_block.cpython-310.pyc | Bin 15192 -> 15188 bytes .../prefix_caching_block.cpython-310.pyc | Bin 27524 -> 27516 bytes .../block/__pycache__/utils.cpython-310.pyc | Bin 1648 -> 1644 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 237 -> 233 bytes .../communication_op.cpython-310.pyc | Bin 1413 -> 1409 bytes .../parallel_state.cpython-310.pyc | Bin 29563 -> 29555 bytes .../__pycache__/utils.cpython-310.pyc | Bin 2844 -> 2840 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 182 -> 178 bytes .../__pycache__/cuda_wrapper.cpython-310.pyc | Bin 5422 -> 5418 bytes .../custom_all_reduce.cpython-310.pyc | Bin 8280 -> 8276 bytes .../custom_all_reduce_utils.cpython-310.pyc | Bin 6689 -> 6685 bytes .../__pycache__/pynccl.cpython-310.pyc | Bin 4345 -> 4341 bytes .../pynccl_wrapper.cpython-310.pyc | Bin 6572 -> 6568 bytes .../__pycache__/shm_broadcast.cpython-310.pyc | Bin 13067 -> 13087 bytes .../tpu_communicator.cpython-310.pyc | Bin 1861 -> 1857 bytes .../device_communicators/shm_broadcast.py | 3 +- .../__pycache__/__init__.cpython-310.pyc | Bin 156 -> 152 bytes .../__pycache__/arg_utils.cpython-310.pyc | Bin 32851 -> 32837 bytes .../async_llm_engine.cpython-310.pyc | Bin 38114 -> 38104 bytes .../__pycache__/async_timeout.cpython-310.pyc | Bin 5658 -> 5652 bytes .../__pycache__/llm_engine.cpython-310.pyc | Bin 48366 -> 48342 bytes .../__pycache__/metrics.cpython-310.pyc | Bin 16460 -> 16454 bytes .../__pycache__/metrics_types.cpython-310.pyc | Bin 3341 -> 3337 bytes .../__pycache__/protocol.cpython-310.pyc | Bin 4177 -> 4173 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 4124 -> 4118 bytes .../__pycache__/client.cpython-310.pyc | Bin 19788 -> 19776 bytes .../__pycache__/engine.cpython-310.pyc | Bin 11879 -> 11875 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 173 -> 169 bytes .../__pycache__/interfaces.cpython-310.pyc | Bin 3066 -> 3062 bytes .../__pycache__/multi_step.cpython-310.pyc | Bin 6575 -> 6569 bytes .../__pycache__/single_step.cpython-310.pyc | Bin 6356 -> 6352 bytes .../__pycache__/stop_checker.cpython-310.pyc | Bin 2984 -> 2978 bytes .../__pycache__/util.cpython-310.pyc | Bin 1079 -> 1075 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 161 -> 157 bytes .../__pycache__/api_server.cpython-310.pyc | Bin 4995 -> 4991 bytes .../__pycache__/chat_utils.cpython-310.pyc | Bin 16276 -> 16286 bytes .../__pycache__/launcher.cpython-310.pyc | Bin 3634 -> 3630 bytes .../__pycache__/llm.cpython-310.pyc | Bin 26794 -> 26786 bytes .../__pycache__/logger.cpython-310.pyc | Bin 1573 -> 1569 bytes vllm/entrypoints/chat_utils.py | 4 +- .../__pycache__/__init__.cpython-310.pyc | Bin 168 -> 164 bytes .../__pycache__/api_server.cpython-310.pyc | Bin 14833 -> 14834 bytes .../__pycache__/cli_args.cpython-310.pyc | Bin 6927 -> 6923 bytes .../logits_processors.cpython-310.pyc | Bin 3168 -> 3164 bytes .../__pycache__/protocol.cpython-310.pyc | Bin 30255 -> 30247 bytes .../__pycache__/run_batch.cpython-310.pyc | Bin 7902 -> 7898 bytes .../__pycache__/serving_chat.cpython-310.pyc | Bin 17221 -> 17201 bytes .../serving_completion.cpython-310.pyc | Bin 10653 -> 10645 bytes .../serving_embedding.cpython-310.pyc | Bin 5340 -> 5336 bytes .../serving_engine.cpython-310.pyc | Bin 13799 -> 13793 bytes .../serving_tokenization.cpython-310.pyc | Bin 3612 -> 3608 bytes vllm/entrypoints/openai/api_server.py | 2 +- .../__pycache__/__init__.cpython-310.pyc | Bin 566 -> 562 bytes .../abstract_tool_parser.cpython-310.pyc | Bin 5963 -> 5959 bytes .../hermes_tool_parser.cpython-310.pyc | Bin 6844 -> 6839 bytes .../internlm2_tool_parser.cpython-310.pyc | Bin 4998 -> 4992 bytes .../llama_tool_parser.cpython-310.pyc | Bin 6040 -> 6039 bytes .../mistral_tool_parser.cpython-310.pyc | Bin 6650 -> 6647 bytes .../__pycache__/utils.cpython-310.pyc | Bin 2990 -> 2986 bytes .../openai/tool_parsers/hermes_tool_parser.py | 2 +- .../openai/tool_parsers/llama_tool_parser.py | 2 +- .../tool_parsers/mistral_tool_parser.py | 2 +- vllm/envs.py | 7 + .../__pycache__/__init__.cpython-310.pyc | Bin 158 -> 154 bytes .../__pycache__/cpu_executor.cpython-310.pyc | Bin 11331 -> 11323 bytes .../distributed_gpu_executor.cpython-310.pyc | Bin 7542 -> 7538 bytes .../__pycache__/executor_base.cpython-310.pyc | Bin 6178 -> 6174 bytes .../__pycache__/gpu_executor.cpython-310.pyc | Bin 7014 -> 7010 bytes .../__pycache__/msgspec_utils.cpython-310.pyc | Bin 1076 -> 1072 bytes .../multiproc_gpu_executor.cpython-310.pyc | Bin 8079 -> 8073 bytes .../multiproc_worker_utils.cpython-310.pyc | Bin 8641 -> 8637 bytes .../multiproc_xpu_executor.cpython-310.pyc | Bin 1527 -> 1523 bytes .../neuron_executor.cpython-310.pyc | Bin 4897 -> 4893 bytes .../openvino_executor.cpython-310.pyc | Bin 7393 -> 7387 bytes .../ray_gpu_executor.cpython-310.pyc | Bin 15850 -> 15842 bytes .../ray_tpu_executor.cpython-310.pyc | Bin 11056 -> 11052 bytes .../__pycache__/ray_utils.cpython-310.pyc | Bin 10039 -> 10035 bytes .../ray_xpu_executor.cpython-310.pyc | Bin 1769 -> 1765 bytes .../__pycache__/tpu_executor.cpython-310.pyc | Bin 5405 -> 5401 bytes .../__pycache__/xpu_executor.cpython-310.pyc | Bin 3509 -> 3505 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 1079 -> 1075 bytes vllm/inputs/__pycache__/data.cpython-310.pyc | Bin 5523 -> 5519 bytes vllm/inputs/__pycache__/parse.cpython-310.pyc | Bin 3438 -> 3434 bytes .../__pycache__/preprocess.cpython-310.pyc | Bin 13418 -> 13412 bytes .../__pycache__/registry.cpython-310.pyc | Bin 10229 -> 10225 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 244 -> 240 bytes .../__pycache__/formatter.cpython-310.pyc | Bin 883 -> 879 bytes .../lora/__pycache__/__init__.cpython-310.pyc | Bin 154 -> 150 bytes .../fully_sharded_layers.cpython-310.pyc | Bin 8862 -> 8858 bytes vllm/lora/__pycache__/layers.cpython-310.pyc | Bin 34030 -> 34024 bytes vllm/lora/__pycache__/lora.cpython-310.pyc | Bin 5357 -> 5353 bytes vllm/lora/__pycache__/models.cpython-310.pyc | Bin 21990 -> 22019 bytes vllm/lora/__pycache__/punica.cpython-310.pyc | Bin 16365 -> 16361 bytes vllm/lora/__pycache__/request.cpython-310.pyc | Bin 3289 -> 3285 bytes vllm/lora/__pycache__/utils.cpython-310.pyc | Bin 5745 -> 5748 bytes .../worker_manager.cpython-310.pyc | Bin 7505 -> 7501 bytes vllm/lora/models.py | 4 +- .../ops/__pycache__/__init__.cpython-310.pyc | Bin 158 -> 154 bytes .../__pycache__/bgmv_expand.cpython-310.pyc | Bin 3642 -> 3638 bytes .../bgmv_expand_slice.cpython-310.pyc | Bin 3782 -> 3778 bytes .../__pycache__/bgmv_shrink.cpython-310.pyc | Bin 3333 -> 3329 bytes .../__pycache__/sgmv_expand.cpython-310.pyc | Bin 4667 -> 4663 bytes .../sgmv_expand_slice.cpython-310.pyc | Bin 5149 -> 5145 bytes .../__pycache__/sgmv_shrink.cpython-310.pyc | Bin 4639 -> 4635 bytes .../ops/__pycache__/utils.cpython-310.pyc | Bin 1522 -> 1518 bytes vllm/lora/utils.py | 2 +- .../__pycache__/__init__.cpython-310.pyc | Bin 486 -> 482 bytes .../__pycache__/custom_op.cpython-310.pyc | Bin 2379 -> 2375 bytes .../__pycache__/parameter.cpython-310.pyc | Bin 13315 -> 13303 bytes .../pooling_metadata.cpython-310.pyc | Bin 2409 -> 2405 bytes .../sampling_metadata.cpython-310.pyc | Bin 12513 -> 12501 bytes .../__pycache__/utils.cpython-310.pyc | Bin 1118 -> 1114 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 1420 -> 1416 bytes .../__pycache__/guided_fields.cpython-310.pyc | Bin 1735 -> 1731 bytes ...m_format_enforcer_decoding.cpython-310.pyc | Bin 2403 -> 2399 bytes .../outlines_decoding.cpython-310.pyc | Bin 3455 -> 3451 bytes ...outlines_logits_processors.cpython-310.pyc | Bin 6825 -> 7157 bytes .../outlines_logits_processors.py | 11 +- .../__pycache__/__init__.cpython-310.pyc | Bin 171 -> 167 bytes .../__pycache__/activation.cpython-310.pyc | Bin 8413 -> 8407 bytes .../__pycache__/layernorm.cpython-310.pyc | Bin 4665 -> 4661 bytes .../layers/__pycache__/linear.cpython-310.pyc | Bin 28104 -> 28115 bytes .../logits_processor.cpython-310.pyc | Bin 3909 -> 3905 bytes .../layers/__pycache__/pooler.cpython-310.pyc | Bin 2461 -> 2457 bytes .../rejection_sampler.cpython-310.pyc | Bin 12061 -> 12057 bytes .../__pycache__/resampler.cpython-310.pyc | Bin 7111 -> 7105 bytes .../rotary_embedding.cpython-310.pyc | Bin 25500 -> 25494 bytes .../__pycache__/sampler.cpython-310.pyc | Bin 31672 -> 31666 bytes .../spec_decode_base_sampler.cpython-310.pyc | Bin 7336 -> 7330 bytes ...typical_acceptance_sampler.cpython-310.pyc | Bin 6710 -> 6706 bytes .../vocab_parallel_embedding.cpython-310.pyc | Bin 15137 -> 15133 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 747 -> 743 bytes .../fused_marlin_moe.cpython-310.pyc | Bin 7430 -> 7426 bytes .../__pycache__/fused_moe.cpython-310.pyc | Bin 15815 -> 15811 bytes .../__pycache__/layer.cpython-310.pyc | Bin 15772 -> 15762 bytes .../__pycache__/moe_pallas.cpython-310.pyc | Bin 1864 -> 1860 bytes vllm/model_executor/layers/linear.py | 2 +- .../__pycache__/__init__.cpython-310.pyc | Bin 177 -> 173 bytes .../ops/__pycache__/__init__.cpython-310.pyc | Bin 181 -> 177 bytes .../__pycache__/causal_conv1d.cpython-310.pyc | Bin 3041 -> 3037 bytes .../ops/__pycache__/mamba_ssm.cpython-310.pyc | Bin 8952 -> 8948 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 2812 -> 2808 bytes .../__pycache__/aqlm.cpython-310.pyc | Bin 9013 -> 8995 bytes .../__pycache__/awq.cpython-310.pyc | Bin 5552 -> 5548 bytes .../__pycache__/awq_marlin.cpython-310.pyc | Bin 11320 -> 11316 bytes .../__pycache__/awq_triton.cpython-310.pyc | Bin 6241 -> 6237 bytes .../__pycache__/base_config.cpython-310.pyc | Bin 5829 -> 5825 bytes .../__pycache__/bitsandbytes.cpython-310.pyc | Bin 8817 -> 8809 bytes .../__pycache__/deepspeedfp.cpython-310.pyc | Bin 7460 -> 7456 bytes .../__pycache__/experts_int8.cpython-310.pyc | Bin 5905 -> 5901 bytes .../__pycache__/fbgemm_fp8.cpython-310.pyc | Bin 5598 -> 5594 bytes .../__pycache__/fp8.cpython-310.pyc | Bin 12475 -> 12469 bytes .../__pycache__/gguf.cpython-310.pyc | Bin 6385 -> 6381 bytes .../__pycache__/gptq.cpython-310.pyc | Bin 7062 -> 7056 bytes .../__pycache__/gptq_marlin.cpython-310.pyc | Bin 12521 -> 12515 bytes .../gptq_marlin_24.cpython-310.pyc | Bin 7535 -> 7527 bytes .../__pycache__/ipex_quant.cpython-310.pyc | Bin 5672 -> 5668 bytes .../__pycache__/kv_cache.cpython-310.pyc | Bin 2599 -> 2593 bytes .../__pycache__/marlin.cpython-310.pyc | Bin 6943 -> 6937 bytes .../__pycache__/modelopt.cpython-310.pyc | Bin 6192 -> 6188 bytes .../__pycache__/neuron_quant.cpython-310.pyc | Bin 3053 -> 3049 bytes .../__pycache__/qqq.cpython-310.pyc | Bin 7002 -> 6996 bytes .../__pycache__/schema.cpython-310.pyc | Bin 3242 -> 3238 bytes .../__pycache__/tpu_int8.cpython-310.pyc | Bin 5099 -> 5095 bytes .../__pycache__/w8a16.cpython-310.pyc | Bin 4007 -> 4003 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 203 -> 199 bytes .../compressed_tensors.cpython-310.pyc | Bin 12423 -> 12415 bytes .../compressed_tensors_moe.cpython-310.pyc | Bin 11486 -> 11478 bytes .../__pycache__/utils.cpython-310.pyc | Bin 8412 -> 8415 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 800 -> 796 bytes .../compressed_tensors_scheme.cpython-310.pyc | Bin 2110 -> 2106 bytes ...ompressed_tensors_w4a16_24.cpython-310.pyc | Bin 4097 -> 4093 bytes ...mpressed_tensors_w8a16_fp8.cpython-310.pyc | Bin 3570 -> 3566 bytes ...ompressed_tensors_w8a8_fp8.cpython-310.pyc | Bin 3694 -> 3690 bytes ...mpressed_tensors_w8a8_int8.cpython-310.pyc | Bin 3900 -> 3896 bytes .../compressed_tensors_wNa16.cpython-310.pyc | Bin 4507 -> 4503 bytes .../quantization/compressed_tensors/utils.py | 2 +- .../MPLinearKernel.cpython-310.pyc | Bin 3007 -> 3003 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 2321 -> 2317 bytes .../__pycache__/machete.cpython-310.pyc | Bin 4248 -> 4240 bytes .../__pycache__/marlin.cpython-310.pyc | Bin 4213 -> 4209 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 304 -> 300 bytes .../__pycache__/layer_utils.cpython-310.pyc | Bin 1049 -> 1043 bytes .../__pycache__/machete_utils.cpython-310.pyc | Bin 1248 -> 1244 bytes .../__pycache__/marlin_utils.cpython-310.pyc | Bin 8305 -> 8301 bytes .../marlin_utils_fp8.cpython-310.pyc | Bin 2825 -> 2821 bytes .../marlin_utils_test.cpython-310.pyc | Bin 4169 -> 4165 bytes .../marlin_utils_test_24.cpython-310.pyc | Bin 10355 -> 10351 bytes .../marlin_utils_test_qqq.cpython-310.pyc | Bin 3502 -> 3498 bytes .../__pycache__/quant_utils.cpython-310.pyc | Bin 9626 -> 9620 bytes .../__pycache__/w8a8_utils.cpython-310.pyc | Bin 4467 -> 4461 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 1122 -> 1118 bytes .../__pycache__/loader.cpython-310.pyc | Bin 33753 -> 33745 bytes .../__pycache__/neuron.cpython-310.pyc | Bin 7537 -> 7533 bytes .../__pycache__/openvino.cpython-310.pyc | Bin 6200 -> 6194 bytes .../__pycache__/tensorizer.cpython-310.pyc | Bin 15180 -> 15181 bytes .../__pycache__/utils.cpython-310.pyc | Bin 1373 -> 1365 bytes .../__pycache__/weight_utils.cpython-310.pyc | Bin 20218 -> 20227 bytes .../model_executor/model_loader/tensorizer.py | 2 +- .../model_loader/weight_utils.py | 6 +- .../__pycache__/__init__.cpython-310.pyc | Bin 688 -> 684 bytes .../models/__pycache__/arctic.cpython-310.pyc | Bin 14388 -> 14378 bytes .../__pycache__/baichuan.cpython-310.pyc | Bin 11583 -> 11579 bytes .../models/__pycache__/bart.cpython-310.pyc | Bin 21146 -> 21136 bytes .../models/__pycache__/blip.cpython-310.pyc | Bin 11302 -> 11296 bytes .../models/__pycache__/blip2.cpython-310.pyc | Bin 18095 -> 18091 bytes .../models/__pycache__/bloom.cpython-310.pyc | Bin 9108 -> 9104 bytes .../__pycache__/chameleon.cpython-310.pyc | Bin 28220 -> 28210 bytes .../__pycache__/chatglm.cpython-310.pyc | Bin 16767 -> 16763 bytes .../models/__pycache__/clip.cpython-310.pyc | Bin 12880 -> 12874 bytes .../__pycache__/commandr.cpython-310.pyc | Bin 11349 -> 11345 bytes .../models/__pycache__/dbrx.cpython-310.pyc | Bin 11990 -> 11986 bytes .../models/__pycache__/decilm.cpython-310.pyc | Bin 3370 -> 3366 bytes .../__pycache__/deepseek.cpython-310.pyc | Bin 12247 -> 12235 bytes .../__pycache__/deepseek_v2.cpython-310.pyc | Bin 14358 -> 14350 bytes .../models/__pycache__/eagle.cpython-310.pyc | Bin 5486 -> 5480 bytes .../models/__pycache__/exaone.cpython-310.pyc | Bin 13509 -> 13503 bytes .../models/__pycache__/falcon.cpython-310.pyc | Bin 11468 -> 11462 bytes .../models/__pycache__/fuyu.cpython-310.pyc | Bin 10367 -> 10363 bytes .../models/__pycache__/gemma.cpython-310.pyc | Bin 11297 -> 11293 bytes .../models/__pycache__/gemma2.cpython-310.pyc | Bin 11387 -> 11383 bytes .../gemma2_embedding.cpython-310.pyc | Bin 2485 -> 2481 bytes .../models/__pycache__/glm4.cpython-310.pyc | Bin 8415 -> 8411 bytes .../glm4_vision_encoder.cpython-310.pyc | Bin 8422 -> 8418 bytes .../models/__pycache__/gpt2.cpython-310.pyc | Bin 8474 -> 8470 bytes .../__pycache__/gpt_bigcode.cpython-310.pyc | Bin 8921 -> 8917 bytes .../models/__pycache__/gpt_j.cpython-310.pyc | Bin 8418 -> 8414 bytes .../__pycache__/gpt_neox.cpython-310.pyc | Bin 8631 -> 8623 bytes .../__pycache__/granite.cpython-310.pyc | Bin 13100 -> 13094 bytes .../__pycache__/granitemoe.cpython-310.pyc | Bin 11518 -> 11514 bytes .../idefics2_vision_model.cpython-310.pyc | Bin 9134 -> 9130 bytes .../__pycache__/interfaces.cpython-310.pyc | Bin 9556 -> 9552 bytes .../interfaces_base.cpython-310.pyc | Bin 5363 -> 5359 bytes .../__pycache__/intern_vit.cpython-310.pyc | Bin 11647 -> 11643 bytes .../__pycache__/internlm2.cpython-310.pyc | Bin 10531 -> 10527 bytes .../__pycache__/internvl.cpython-310.pyc | Bin 16333 -> 16336 bytes .../models/__pycache__/jais.cpython-310.pyc | Bin 10106 -> 10102 bytes .../models/__pycache__/jamba.cpython-310.pyc | Bin 17466 -> 17458 bytes .../models/__pycache__/llama.cpython-310.pyc | Bin 14843 -> 14837 bytes .../llama_embedding.cpython-310.pyc | Bin 2671 -> 2667 bytes .../models/__pycache__/llava.cpython-310.pyc | Bin 11813 -> 11809 bytes .../__pycache__/llava_next.cpython-310.pyc | Bin 17300 -> 17296 bytes .../llava_next_video.cpython-310.pyc | Bin 13108 -> 13104 bytes .../llava_onevision.cpython-310.pyc | Bin 22295 -> 22289 bytes .../models/__pycache__/mamba.cpython-310.pyc | Bin 12737 -> 12729 bytes .../__pycache__/mamba_cache.cpython-310.pyc | Bin 7761 -> 7755 bytes .../models/__pycache__/medusa.cpython-310.pyc | Bin 6284 -> 6280 bytes .../__pycache__/minicpm.cpython-310.pyc | Bin 14890 -> 14884 bytes .../__pycache__/minicpm3.cpython-310.pyc | Bin 8056 -> 8052 bytes .../__pycache__/minicpmv.cpython-310.pyc | Bin 27234 -> 27231 bytes .../__pycache__/mixtral.cpython-310.pyc | Bin 11844 -> 11828 bytes .../__pycache__/mixtral_quant.cpython-310.pyc | Bin 11346 -> 11340 bytes .../models/__pycache__/mllama.cpython-310.pyc | Bin 28831 -> 28823 bytes .../mlp_speculator.cpython-310.pyc | Bin 5852 -> 5846 bytes .../module_mapping.cpython-310.pyc | Bin 1913 -> 1909 bytes .../models/__pycache__/molmo.cpython-310.pyc | Bin 31070 -> 31073 bytes .../models/__pycache__/mpt.cpython-310.pyc | Bin 8973 -> 8969 bytes .../__pycache__/nemotron.cpython-310.pyc | Bin 12733 -> 12727 bytes .../models/__pycache__/nvlm_d.cpython-310.pyc | Bin 2745 -> 2741 bytes .../models/__pycache__/olmo.cpython-310.pyc | Bin 9564 -> 9558 bytes .../models/__pycache__/olmoe.cpython-310.pyc | Bin 10864 -> 10860 bytes .../models/__pycache__/opt.cpython-310.pyc | Bin 10462 -> 10458 bytes .../models/__pycache__/orion.cpython-310.pyc | Bin 9526 -> 9520 bytes .../__pycache__/paligemma.cpython-310.pyc | Bin 8862 -> 8858 bytes .../__pycache__/persimmon.cpython-310.pyc | Bin 9435 -> 9429 bytes .../models/__pycache__/phi.cpython-310.pyc | Bin 8861 -> 8857 bytes .../models/__pycache__/phi3.cpython-310.pyc | Bin 557 -> 553 bytes .../__pycache__/phi3_small.cpython-310.pyc | Bin 13162 -> 13156 bytes .../models/__pycache__/phi3v.cpython-310.pyc | Bin 17529 -> 17530 bytes .../models/__pycache__/phimoe.cpython-310.pyc | Bin 14435 -> 14431 bytes .../__pycache__/pixtral.cpython-310.pyc | Bin 19011 -> 19005 bytes .../models/__pycache__/qwen.cpython-310.pyc | Bin 26256 -> 26253 bytes .../models/__pycache__/qwen2.cpython-310.pyc | Bin 10923 -> 10919 bytes .../__pycache__/qwen2_5_vl.cpython-310.pyc | Bin 0 -> 32068 bytes .../__pycache__/qwen2_moe.cpython-310.pyc | Bin 12427 -> 12413 bytes .../__pycache__/qwen2_rm.cpython-310.pyc | Bin 3918 -> 3914 bytes .../__pycache__/qwen2_vl.cpython-310.pyc | Bin 30630 -> 30618 bytes .../models/__pycache__/qwen3.cpython-310.pyc | Bin 8737 -> 8751 bytes .../__pycache__/qwen3_moe.cpython-310.pyc | Bin 13242 -> 13228 bytes .../__pycache__/registry.cpython-310.pyc | Bin 14640 -> 14695 bytes .../models/__pycache__/siglip.cpython-310.pyc | Bin 15151 -> 15143 bytes .../models/__pycache__/solar.cpython-310.pyc | Bin 13030 -> 13024 bytes .../__pycache__/stablelm.cpython-310.pyc | Bin 9424 -> 9418 bytes .../__pycache__/starcoder2.cpython-310.pyc | Bin 8871 -> 8867 bytes .../__pycache__/ultravox.cpython-310.pyc | Bin 15127 -> 15123 bytes .../models/__pycache__/utils.cpython-310.pyc | Bin 17025 -> 17025 bytes .../models/__pycache__/xverse.cpython-310.pyc | Bin 10177 -> 10169 bytes vllm/model_executor/models/internvl.py | 2 +- vllm/model_executor/models/minicpmv.py | 2 +- vllm/model_executor/models/molmo.py | 2 +- vllm/model_executor/models/phi3v.py | 2 +- vllm/model_executor/models/qwen.py | 2 +- vllm/model_executor/models/qwen2_5_vl.py | 1213 +++++++++++++++++ vllm/model_executor/models/qwen3.py | 4 +- vllm/model_executor/models/registry.py | 1 + .../__pycache__/__init__.cpython-310.pyc | Bin 493 -> 489 bytes .../__pycache__/audio.cpython-310.pyc | Bin 1179 -> 1175 bytes .../__pycache__/base.cpython-310.pyc | Bin 10657 -> 10653 bytes .../__pycache__/image.cpython-310.pyc | Bin 2627 -> 2623 bytes .../__pycache__/registry.cpython-310.pyc | Bin 8486 -> 8482 bytes .../__pycache__/utils.cpython-310.pyc | Bin 8515 -> 8511 bytes .../__pycache__/video.cpython-310.pyc | Bin 2545 -> 2541 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 1327 -> 1323 bytes .../platforms/__pycache__/cpu.cpython-310.pyc | Bin 1018 -> 1014 bytes .../__pycache__/cuda.cpython-310.pyc | Bin 5108 -> 5104 bytes .../__pycache__/interface.cpython-310.pyc | Bin 4244 -> 4240 bytes .../__pycache__/rocm.cpython-310.pyc | Bin 1578 -> 1574 bytes .../platforms/__pycache__/tpu.cpython-310.pyc | Bin 1324 -> 1320 bytes .../platforms/__pycache__/xpu.cpython-310.pyc | Bin 1245 -> 1241 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 1873 -> 1869 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 164 -> 160 bytes .../__pycache__/layers.cpython-310.pyc | Bin 2926 -> 2922 bytes .../__pycache__/models.cpython-310.pyc | Bin 13059 -> 13057 bytes .../__pycache__/request.cpython-310.pyc | Bin 1331 -> 1327 bytes .../__pycache__/utils.cpython-310.pyc | Bin 2412 -> 2424 bytes .../worker_manager.cpython-310.pyc | Bin 6564 -> 6560 bytes vllm/prompt_adapter/utils.py | 2 +- .../__pycache__/__init__.cpython-310.pyc | Bin 161 -> 157 bytes .../batch_expansion.cpython-310.pyc | Bin 12458 -> 12452 bytes .../draft_model_runner.cpython-310.pyc | Bin 7879 -> 7875 bytes .../__pycache__/interfaces.cpython-310.pyc | Bin 2900 -> 2896 bytes .../__pycache__/medusa_worker.cpython-310.pyc | Bin 4541 -> 4537 bytes .../__pycache__/metrics.cpython-310.pyc | Bin 5021 -> 5017 bytes .../mlp_speculator_worker.cpython-310.pyc | Bin 2937 -> 2933 bytes .../__pycache__/mqa_scorer.cpython-310.pyc | Bin 2775 -> 2771 bytes .../multi_step_worker.cpython-310.pyc | Bin 11513 -> 11509 bytes .../__pycache__/ngram_worker.cpython-310.pyc | Bin 4923 -> 4919 bytes .../proposer_worker_base.cpython-310.pyc | Bin 2684 -> 2680 bytes ...smaller_tp_proposer_worker.cpython-310.pyc | Bin 5903 -> 5899 bytes .../spec_decode_worker.cpython-310.pyc | Bin 31989 -> 31981 bytes .../target_model_runner.cpython-310.pyc | Bin 2679 -> 2675 bytes .../__pycache__/top1_proposer.cpython-310.pyc | Bin 5711 -> 5701 bytes .../__pycache__/util.cpython-310.pyc | Bin 7939 -> 7933 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 546 -> 542 bytes .../__pycache__/config.cpython-310.pyc | Bin 8784 -> 8778 bytes .../__pycache__/detokenizer.cpython-310.pyc | Bin 7331 -> 7323 bytes .../__pycache__/processor.cpython-310.pyc | Bin 2058 -> 2054 bytes .../__pycache__/tokenizer.cpython-310.pyc | Bin 5727 -> 5719 bytes .../__pycache__/utils.cpython-310.pyc | Bin 649 -> 645 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 1526 -> 1522 bytes .../__pycache__/arctic.cpython-310.pyc | Bin 8227 -> 8223 bytes .../__pycache__/chatglm.cpython-310.pyc | Bin 1786 -> 1782 bytes .../configs/__pycache__/dbrx.cpython-310.pyc | Bin 9418 -> 9406 bytes .../configs/__pycache__/eagle.cpython-310.pyc | Bin 1563 -> 1559 bytes .../__pycache__/exaone.cpython-310.pyc | Bin 7252 -> 7248 bytes .../__pycache__/falcon.cpython-310.pyc | Bin 1913 -> 1909 bytes .../__pycache__/internvl.cpython-310.pyc | Bin 1243 -> 1239 bytes .../configs/__pycache__/jais.cpython-310.pyc | Bin 8283 -> 8271 bytes .../__pycache__/medusa.cpython-310.pyc | Bin 2093 -> 2089 bytes .../__pycache__/mllama.cpython-310.pyc | Bin 1249 -> 1245 bytes .../mlp_speculator.cpython-310.pyc | Bin 2482 -> 2478 bytes .../configs/__pycache__/mpt.cpython-310.pyc | Bin 5388 -> 5382 bytes .../__pycache__/nemotron.cpython-310.pyc | Bin 7287 -> 7279 bytes .../__pycache__/nvlm_d.cpython-310.pyc | Bin 413 -> 409 bytes .../__pycache__/qwen2vl.cpython-310.pyc | Bin 2740 -> 2736 bytes .../configs/__pycache__/solar.cpython-310.pyc | Bin 8837 -> 8829 bytes .../__pycache__/ultravox.cpython-310.pyc | Bin 3417 -> 3413 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 1699 -> 1695 bytes .../base_tokenizer_group.cpython-310.pyc | Bin 2486 -> 2482 bytes .../ray_tokenizer_group.cpython-310.pyc | Bin 7370 -> 7366 bytes .../tokenizer_group.cpython-310.pyc | Bin 3475 -> 3471 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 249 -> 245 bytes .../__pycache__/mistral.cpython-310.pyc | Bin 8554 -> 8555 bytes vllm/transformers_utils/tokenizers/mistral.py | 2 +- vllm/triton_utils/__init__.py | 6 +- .../__pycache__/__init__.cpython-310.pyc | Bin 422 -> 418 bytes .../custom_cache_manager.cpython-310.pyc | Bin 2070 -> 2066 bytes .../__pycache__/importing.cpython-310.pyc | Bin 411 -> 407 bytes .../__pycache__/libentry.cpython-310.pyc | Bin 4529 -> 4523 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 155 -> 151 bytes .../__pycache__/usage_lib.cpython-310.pyc | Bin 6694 -> 6690 bytes .../__pycache__/__init__.cpython-310.pyc | Bin 156 -> 152 bytes .../__pycache__/cache_engine.cpython-310.pyc | Bin 3465 -> 3461 bytes .../cpu_enc_dec_model_runner.cpython-310.pyc | Bin 8139 -> 8135 bytes .../cpu_model_runner.cpython-310.pyc | Bin 13347 -> 13343 bytes .../__pycache__/cpu_worker.cpython-310.pyc | Bin 11658 -> 11654 bytes .../embedding_model_runner.cpython-310.pyc | Bin 6129 -> 6121 bytes .../enc_dec_model_runner.cpython-310.pyc | Bin 14152 -> 14144 bytes .../__pycache__/model_runner.cpython-310.pyc | Bin 46602 -> 46582 bytes .../model_runner_base.cpython-310.pyc | Bin 9637 -> 9631 bytes .../multi_step_model_runner.cpython-310.pyc | Bin 21814 -> 21810 bytes .../multi_step_tpu_worker.cpython-310.pyc | Bin 2659 -> 2655 bytes .../multi_step_worker.cpython-310.pyc | Bin 4772 -> 4768 bytes .../neuron_model_runner.cpython-310.pyc | Bin 9008 -> 9004 bytes .../__pycache__/neuron_worker.cpython-310.pyc | Bin 4380 -> 4376 bytes .../openvino_model_runner.cpython-310.pyc | Bin 6970 -> 6960 bytes .../openvino_worker.cpython-310.pyc | Bin 15482 -> 15474 bytes .../tpu_model_runner.cpython-310.pyc | Bin 17909 -> 17905 bytes .../__pycache__/tpu_worker.cpython-310.pyc | Bin 8261 -> 8257 bytes vllm/worker/__pycache__/utils.cpython-310.pyc | Bin 1415 -> 1411 bytes .../worker/__pycache__/worker.cpython-310.pyc | Bin 15199 -> 15189 bytes .../__pycache__/worker_base.cpython-310.pyc | Bin 15423 -> 15417 bytes .../xpu_model_runner.cpython-310.pyc | Bin 14480 -> 14474 bytes .../__pycache__/xpu_worker.cpython-310.pyc | Bin 6080 -> 6076 bytes 476 files changed, 1270 insertions(+), 46 deletions(-) create mode 100644 vllm/model_executor/models/__pycache__/qwen2_5_vl.cpython-310.pyc create mode 100644 vllm/model_executor/models/qwen2_5_vl.py diff --git a/Dockerfile b/Dockerfile index 62b7be9..51d3df7 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,19 +1,15 @@ -FROM git.modelhub.org.cn:9443/enginex-iluvatar/bi100-3.2.1-x86-ubuntu20.04-py3.10-poc-llm-infer:20250731115755 +FROM git.modelhub.org.cn:9443/enginex-iluvatar/bi100-3.2.3-x86-ubuntu20.04-py3.10-poc-llm-infer:v1.2.3 RUN pip install --no-cache-dir triton==2.1.0 COPY pkgs/triton /usr/local/corex/lib64/python3/dist-packages/triton COPY pkgs/triton-2.1.0+corex.4.1.2.dist-info /usr/local/corex/lib64/python3/dist-packages/triton-2.1.0+corex.4.1.2.dist-info -COPY pkgs/xformers-0.0.22+corex.4.1.2.dist-info /usr/local/corex/lib64/python3/dist-packages/xformers-0.0.22+corex.4.1.2.dist-info -COPY pkgs/xformers /usr/local/corex/lib64/python3/dist-packages/xformers -COPY paged_attn.py /usr/local/lib/python3.10/site-packages/vllm/attention/ops/paged_attn.py -COPY __init__.py /usr/local/lib/python3.10/site-packages/vllm/triton_utils/__init__.py -COPY prefix_prefill.py /usr/local/lib/python3.10/site-packages/vllm/attention/ops/prefix_prefill.py +COPY paged_attn.py /usr/local/corex/lib64/python3/dist-packages/vllm/attention/ops/paged_attn.py +COPY __init__.py /usr/local/corex/lib64/python3/dist-packages/vllm/triton_utils/__init__.py RUN mkdir /workspace WORKDIR /workspace/ COPY ./launch_service /workspace/launch_service -ENTRYPOINT ["./launch_service"] diff --git a/paged_attn.py b/paged_attn.py index 1741dd1..988f903 100644 --- a/paged_attn.py +++ b/paged_attn.py @@ -4,6 +4,7 @@ from typing import List, Optional, Tuple import torch from vllm import _custom_ops as ops + from vllm.attention.ops.prefix_prefill import context_attention_fwd # Should be the same as PARTITION_SIZE in `paged_attention_v2_launcher`. diff --git a/vllm/__pycache__/__init__.cpython-310.pyc b/vllm/__pycache__/__init__.cpython-310.pyc index 1190aa948727b88527e085bf7ce5b7df9b06ff3f..ba64550a2c6a8a7041378751ce1af0fcef7174af 100644 GIT binary patch delta 61 zcmZqR{KLVW&&$ij00f3>_ig0nXHhZHFUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E PFQ_cZ$j_VX#9{{k8b=cu delta 65 zcmeyv(ZI=_&&$ij00foW8a8tCvuIf8mlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Tr0NzVCTAz6rxs7PW3dAOX`B=( diff --git a/vllm/__pycache__/_core_ext.cpython-310.pyc b/vllm/__pycache__/_core_ext.cpython-310.pyc index aaa4f730d201a068e324d53e9ed2cc18839346f7..3c7a3da722c8b7075830a0dd6a521b1f342ff5a5 100644 GIT binary patch delta 62 zcmbQ>-Q&%j&&$ij00f3>_if}3Vp1{HFUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E QFQ_cZ$j{r{%EYY<07B&x(EtDd delta 66 zcmeD2p5V=$&&$ij00foW8a8qVF=<%pmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtH+Wa3r^0F&qx;Q#;t diff --git a/vllm/__pycache__/_custom_ops.cpython-310.pyc b/vllm/__pycache__/_custom_ops.cpython-310.pyc index 4f0ece79f06a2af0ad01e92d8668be1ad59592fc..fc17fb1a445bad3351367ff5ae3c208ad14c21fe 100644 GIT binary patch delta 6875 zcmb`L33yc1700CkPRdWAt4D%WF2-A9?LLE-XvpY#b!n|q>ROkc|9v6LB((Z{o$t#p=bd}*x#!+< zxA#t-VK1Fwao)JN=wb9LK6;{M&at?8DY>PE0k^Nv=k(TcOL@ zQ0VIjw0J$;ohfsSsY;C9=i}aXr`sM-yYxy#qu1AA3$a>7yqi9Wm5G|wW^r-G2v#C? zWsEdOHLI?m&7-z0rS|w#pnQPIIHOcf6DKm}GetyaE+Q(KqluSfo=@D98Dz6XT-MmR zm8d-(s3L@7Jwdmvb)&6CwKw^BHS{&mNBPwaHka!0^BH)IaogK%Jt{sER1K zLYxE41qM3j^PsB+;FHe>;EpcTXb*nw*|y z%9OX=V&wH`Uk=GCND8nTSR?%`%*kf!gg57!+;bbk+6JtbRf=;bum-U72_$|gV+ z_Vf{n4icZEzcV_5S;rmXi`=$kY2}2KW(w&dY40NOMf&qgdp&oFyT^QGal^m^$TWE& z`G5_8%pZqT10T#U-pU(A{3>tzEIH(H{0BRLmjDn1HUe$3i@zP4%i6`)W33ay@@eE9 zu-XJ{1}+9J0WOs_FCRCGb&A8|R*g{f_O=ZlW>Jwv$1j7$HW6>h94&{V&kIVF7@xhd z)#k7_2E3fiYBJ2C(PCzoi*`#WLoqb_0vkRwz{OU$V|*Jb863Xi5=HpNo6p})&!LE> zK!;BaMUaoi7RAtFcR3WXZ+vd%6{vY7a20Sha1C%RutU5v-pXzig%j2;YavCKj_;;_ zA!C!e(b=e4BKY-qj8NUaKu5^ncWzRp0pCMvOC*dew~oXGZx`zOvT8aUQn{ax>e?E&B*a0oao2Ygz7qHzlz?+{D#3(LcNnEHix zC#?D$-G#@4KtFG<Q_(1PLTo8omyNt~IN^^I&e}f-g{<_HY%i%ek3A!%7TZf^lNnERY10M64Gx_C)OJb*c_@o5Tr(wXot%l zusJ=xgkV64kq=bvqX+SalKCtoa!Z@b`i2Z=l{Oh(B8hU@*9=-vVw|2{-~5kq`@M$lz`z9JY2=uHnr1*idEOtt~TDH$7qq>)h2hTQ4H0jB(SCR(JiaSO;$Zn$_K|p@d|#1V7avfGC5n%Sfjr&* z2I=p>$G|^;Pk>Kl^&``AbZ3T%UrkesPD48!_$PsOJL%+KQ1p5F6px<)pUe8eiagzy z!^FOd9hF}}`!(=y;2Ypu;5*=Z0M`=EfUsb6;^fK^VpC-<(~AR@bD2Rte^WVuMT&9L z_qt_Tgx`$l^ZMbwvJC9ksQI*XS#J5%HgHLU_aQo(Y zzvU#JUS}4os^g7a2qsautJBlMLeTeLA#`4u#bebY4N26n*j$^MH_)0kBRO3jguBDQ zA>d8fOH0j2?XXG~S$6aFHdFS%$`*rGIlSK9niSIrbo9KQMiU0s<7Sz_&uY>%_bDP} z#=e%<(6C%wrXe$j?I;vMDQi|kdautP(%ELp7HH6i>;vp$a93B`XHZ;R72$7$Kg6q&QqlLmI3ZbRD2 zw9gvHvc%Q1(yPJ@qJQM}Av65-tdY9WOgx=7Ld4XX!iW1q8T+ZJCb4FAyisN*NBCw} zCWS3(9lt{CpEOeZes-oVuh(1tzySFe>N-!LVbYKcDVKCM9SPZ@rgk}7-hET;Yx*>K z!Hv)khiaIOMb&YDMb3b|^U~S)?nmaSdbV4nSu01q4lB8wI*6!@ps4Lgk1hh~gPFsBi1td0_sO0PqGUQMW^wx>vzEWY zo>?D0oIjIh-;tRd%A#|aJuOGQesLBnKBooRdu*}UI0+F?7OyWZ7`&kjwOd~R`|#a* z-jWQ%6eB!^~#8pNJMFqUR zR-2PvkkiD*rAyda@xs#l)Tt;>17=VTcsZnLKn2Z*WRbgU46E#(x6Hs+gq;%8VN?ZF z1JaMIU4zFNz)WBkFq@#nHhSH3sZecr&EU1rUnnQtBg-q;9C2p(Ox7w&S6CAI9L|N& zJZZFTMLL@=4y}03g*ya)i(oNpD{}#?76N@Wa%?g5y~-BeyE&UtZ`gRlrS76VIw zrPOpeTP9-bRt}fvbw0H6#1b3oa&uR~_j2f_L#hHeFbh}+Xs_EZ*X7dd_UXEGW*5Wj zEy*iUCv3^qi-q+mtX`<~M<)Le$MCMe&uUx-^5k@qpODEO2ykZuO%lF`z73_Pgslo4zX)+r8QsgST%Bsn#$zkC z_2dW=Ejp`n*cMWuyR@@wh99pkF-F1AB`j-}4L;o6DDwbbzz1vqxD4^JHD>Kp^o!Tm zlnw4z0H#4;V_&7}wdZM@QJYw^Hhb`mpdF^Nrgne1Z>?GDOow=Wtz~c{efFDBQ>&D- zuBVaBLmX^fjJG5H>5)xNd8fL8vc~0rT|zF9hyg#+4Ydc0gTCZZCbt@}+wkhXx7W#~ zR3XFy;;BWc=LokGk!nLK2eQ(Ztc}SQgd4sgUMy|)+A_6q*gEu0N{&N6pQiO`n$OF` zg!MKfCIL5!UF*lQDDn9EsfO*Ope~rrd>cteDSE$wIvO=BR!1L7vg|GMp|=WVRklz-bXOE|+tPX23r2PV2}NbYuZ_M9v-E7Q-+dOZ}c75W`*Pn`;p!m1En& zeT)8W6&0?WrK?D3wUQ493A~v=@0~ET){+u~!R3^Tv|6p&qtpS*Ekh{jtLib=j0Ff# ziId;@3h2u|r;opi315N>RL@4gVvvlN3YtY+r8|3oHm zj-aP8;Plexb~)kA&UU;ftGs|Vpq_2LiN{g}eig;9jL;hQcnZ!|w7Wt&kB7cT^fNu4|a&xt@1kPMs$qyTtt;u%0DkOhnea)3Ml?*n{1 zfD1S;1d4!SU@|ZTCNq0gz4s;Vj;&X3h%)^ijxH~Fhx^Fv+>VD4mRa8o$!b7A5d~xscp@MW1qD=Gh)ROE;DW;A0pEisZ)4s=AtqIm*fcSV zdebykP20rA(l%+8CTX-uZDN|uCfc-V^VPIzPJ7y%W;bb@o;LRW=TpE3Htjj(9DZ-+ z&YgQ_y)*N@bY7f2FJk?%u~B3AFX!Ezoy(5KE}xiJQPdNZMIL{f(^KSew-yEZLY;nJ zX<_lqqM$pZ6$G4ZUCs_IIIwNvQd^21?FY{M zX}O||?nq0f`m}MjN_Hiy28DTsU>+S$s}(xg(pNCore{vpW7_<_kk%V=cr;&7k80)i zbUA|V>ouJyy+>S2kyCS*Rm0jsU=c%)@%4BeU0WQTnzKD9mq1T>YI8}t3z@HP!C*gT&{#{(5764EX>K(fMEuyH9!Nf7FY+Y2Q~nWv^On* zj%K8bCOVsu+PV?KtAI@md%UzG{r_wUb#F|h_ROiGnRaFN^6-9^nU>;!7uCTQq?|x2 z(5BkAEGt8}s4HuC_LUW(-2rr}Dh1j3Vl!>X?kehn&;xjZxIrW#Bks!lh`hbl^B!)k|E_5%M0Rc*5j(Sy@It?Gg17C=qNR-}4?K0wXX^+;hcgj?K3 zujfn_+vt;=U5nKe#LEB4+zqgKBk%=ayBdtMx!Ga|{WZ5PKWu(&awoKI0&WIw0d@gj zR5fqPn=Edn`|~y==w|2E?zg9Mk=-P3hsJJ-vZrUNp&GJ+lE!H4Nr%hX7V=A0!xC$@ zCyBc$WY=qTOGhBo{k8=rZi6`?ccYTU6)2vqTUuSkv+WVOHQ4D4XtDrWcQJHpd#Ep< z=~gz`)~Q=MogSA?`=@88?}5r*U>`uhJ;0ZNd+FTtI`IJI=Qphmu%O>05Au(0YuC28 z+cdjX9zxctc>|$7-GUvh6y#wR+sDe!vyQ&Km!Bz)Q2dPA3_X5}$K!RNgN|TlkIUuJ z>}L5bHYNLkd(~L%nK4OxhrT^y`OM3wqkp)&??V4!;1S?^!1q=4vVwTqmykV1bp=Ip z!)!zjYw`fJh7A1x+2Piz>yzkoL7I4s{!*|$13gxK@3*Kyk>7-1P%0l)-nSO!h!b>w z;qGNWMDcM(|F~g3mAfCI=tBmUxC9De5SGkcGpWppSKV z{LWDEY}FPnIfYu!0zUvgEr(*DlRP(zan?3tWo{>3aYEo8PQU#X``i)|7lBST;0GCck9*d zmA~c+c3XId2hHf_V2_u}hjzEx@+wf=LK9~#73ZjB)*rX4af?=F^s!PiHto;=4%xGK z+`*7Mz+QE8z#q_Ud`xS;cHYlD0p280hNm~sjo$*w)9;XalcC4>dqNJE<_z_)6Fti1 zafTdjUm&h0q(`d^mj^gQznEPs-l3^w9pytqCSXP_hSxd8(>&w`9`tCpZ_u{CP3($3`xbhskR6d~w^3T>thQgy)?%PEd{%19)nLzb+_Mgh^Z z(~(HBa+)bt(EiFhZQ~%liazuuWG5h*2qXa$fH3zHmHRDK*&>+^R4o&eRQ~T(`CSf|6{fSQ;BmNigtnOa)*@ zE!>No`&6`q2p5|)1 z4z2ECn~16xWJW#?FS)4gXiAw9)(G?PZJ~TUx?qyXqodWSIhU*UTaC4$V*B@DQ=Lxl zt4hPQ3z3Sa>Mo z_i(GWQRJwzb&$?3Oe~$jMtOAAN)B%=8_=V1L)Uuwq7e!j3m{8%B7f2B!cwl=HjcF} z{UOb=F^l+LhPCl&RqcUAsp4unxoAWeK1A`p#Yr|b1G8xI;?(h%Ti{y|Z#9k-O^frI zX2W&VCBOWO^c7rl=v0g6zm65k%O{H`naTylrzK3ff?fF;A3q2s6O5^uL!Kp76T`Nz z$?*M@via(gbW^3WiS~~=Och)Ze&e0XGKY!fWmHwOMr<6|SM#cQ$|knJkypzDY>p{@>|dd0BT9Z7<(6CN~b{GwDGvf=vJO=&10;V!*rys zIBCeb+F{kOzJT7X3y2zOUNK@8f2q28|B57IBVEJlSm5F7^(CeDDXXb9z4QuduTXV; zsb$#}OR*RptxvKoN2_Y-Onu?VurXQ$z83o75x8b$n&mpU(r1ilZ;aYs-&~m?R?u@R zQzwQk%vkw3F*nSi5p$QUN=~XnOX?YVM93fLa=7^wTtafyO3_ZIRu!bIM0p9Y6jQef zsnx(5)uOc3xuRj9X0=5$#6cPlj0e^N>wxuuvZHEmK(-Os2y6nH7>)dV_wxNfbKnsn zn;~~7C&$)QiWYi*%_0$`(gu6nkU=MuT9wlFhE&l;hZ;_K)a~p8Zmm7hSo-bI(tx3w z>acb}_9XiCUtEFJAatNcC*TG)E7xzX%@th~v2N{E>f~L55}ZUjdDmrUx4^y!vV};g z$fTZ@waBgk8q_v^VO^F8aAZoPuVqD;q?@AG+Y9`t7zZVVB&51oHqXp2T7;aaD2uQN zlZg12>?Y^>ZjT2c6ke zKC*LnLiH}-?n{-DXkJsI5!3h3`lgKV{ce_fp?W9nX_{g5VIMu+WDmbC@G-8`0Ak%_ zN^ib+RNOPl`PMJwUe)3on_~^D_tKu`RGSfOs5mQumM@4-@oFKb`mA;z&!to&_!ah` zi_jIW5^#SXU<{9PF~^Z)^lv{J5+0tv%vZ{iNM-t~TygZPkm}nolh&3ghRFlm>O`t& zskLEF)%b%d*n_I*yG`Z_&9EMo8tx-#YC-8@Kt}A&W zx^XRcLruMDhh>aOq+F24DcUnB@j5h;%Mm~V#?Nh3?#WsOVO<^D*bYZK82rwIVqFaj zF%(j*n6Y(rbw*anfHn3}g#6|3Vb8*JG_WyNeRC`1kMGhc`}9bB<0{mATY@@`^QI)| z(MsU)cXVh{;@r@w!kbs1N4k1^Z6UYc7c`b;qPrJQP)!!L<70pdsO>TaZF_+Bc&Cix zhyBGGPLG^J$Gw%?&!9VnP$>pVfC``rmy0GqfL1^@s6 diff --git a/vllm/__pycache__/beam_search.cpython-310.pyc b/vllm/__pycache__/beam_search.cpython-310.pyc index cad0282ce93b3ac26f3fee6c74b2c6f0e97dc5ea..4e88877a9fd2f760fbf685d5cd677f797e88f465 100644 GIT binary patch delta 62 zcmZn{ZWiXw=jG*M00P6c`!;fKV^T5KFUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E QFQ_cZ$j{sSl4%|r062COj{pDw delta 66 zcmZn`ZWrdx=jG*M0D{VG4I8<)F=<%qmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtI1$~2D+0Er0|p8x;= diff --git a/vllm/__pycache__/block.cpython-310.pyc b/vllm/__pycache__/block.cpython-310.pyc index c27aa2bbe6a9f10c654d53bb37c3255453728025..2ec96641779c401381f56d0400f5c87333e78e35 100644 GIT binary patch delta 62 zcmew>^;3#FpO=@50SFA&?%T*cmr2D?za+OnzaX*D$wSKPNLu Qzo4=tBR_BR1*WxJ0B&{_WB>pF delta 66 zcmew<^;e2JpO=@50SGF$HEiUb%cNndUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*54AWXJ0K#<^bN~PV diff --git a/vllm/__pycache__/config.cpython-310.pyc b/vllm/__pycache__/config.cpython-310.pyc index e54d5eed7ef19d37beb5bb3bb44c26b0c19346a8..7f93840b6b46ff79d8d45ae39ce3d0a7a5c33dfd 100644 GIT binary patch delta 401 zcmaETn)&i+X6}4mUM>b8FkHKDBX^XdijjUvZh?M5W`S-=Vo`c(iLQBWX-2MLZn=I= zW|DqEWl2VU-sE0IImWihYZN`%co=yYnHV?!S4?JO%46J|qS3_4*fROKt}h=KP@IdA ziF{-g#aw5un{XOgxM%%$t2}oV55rj$vb9V&q_C`p?F= zd48G+4`agQD@E2UKsAh;MT;|dnesR`*EeKw`sC@9FgG(438ygEFvK(Esg|$+c~U7X zV4hqF!vfZY3`I&QtYE$vkk1C>Yo)M(`FthpK-GpR>|h@IX49^jGD6pYwsVAY0BvVs z;$Q-jjGG@VJHx`1C$M?L>I8m9tI2}9WffTdGchp%Rj~YH`On1)@*a@K!t#fOjpY~1 zf0qB7gLZ%57syjDVa(#HWzJKsVFHp0n}bgO;bi7uV%Z#c^%olt7tjcxHlT8rf1AVa HOyL9oI=gAd delta 431 zcmcb7n)&rb8sNB}DkvmFJ!%V-lxJW-IKRGc+KPNLuzo4=tBR|hr&(J`> zII|>Gw;(Y&J25@Acygzr9Anqy6^fo*T#QWrxtN&#F)?rcu9(cmROq%jMx%+9v19Um zU0)#%pez#;7bDAm4rT~@vX!2k0797M35Qgb!ejw`kTfG!q`iq{&B$tl7Zom^L#PXYeu=N^H(;$l~-Vv?yV2 zW+)O)VXk3_X9DtAfIO)b7ATKl0qa7BBBc~oIG+v3*Ggf7^4Wo^4O7@5yv@p8Gi5|> z0A0Wl&cVpR$il?I1a!xL7N*VTmYrc?DpcD%XLSNUquu1cyJS^>Uj5I+%mh@$@{i>| z7c0bsEoFrsI5==jG*M00P6c`!;f)U{*2LFUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E QFQ_cZ$j{sSn^}Y(07tPDY5)KL delta 66 zcmeBH>sRB>=jG*M0D{VG4I8;nFl$)rmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtJi&Md+Y0GVhNdH?_b diff --git a/vllm/__pycache__/envs.cpython-310.pyc b/vllm/__pycache__/envs.cpython-310.pyc index bde38c9aca6f0032716f16a7f06449498d8746e3..223d6c0c4bcd0899aee9a1f381c67fd167aa2414 100644 GIT binary patch literal 11644 zcmb7Kdu&_RdB69PA|+XtWLbVFeyM)Tu`NI1M;zPn6?rAmqDYz#*}83fN9)j*97do6_`rP0vG-#OI4^p7<;rFSpM&4~lktxXMfqnc%>S%H;SB!D7eb1X zQ-mVaqGGz=s;Q!^6}8EL8JG;3!N~@*VKQWfCc|cUve9f*l|tYR)&4sXFq;a^g%u)r z68+7VLStcNmx6M`Nu{9PYn@fhHf|50J#4lYR-vsCxXJ7&tORc6eyh>1nftBaa;INz z;qn^4yb|TGxt8U$0xRY^mea<3>wUghZd=7|kN9mJT;AZ9S95uzU+(1cCcnG} zb5X8tzPClJomI_lp3geJZawNg#dTfi_lUWb@dn_qxsCPQ$ap*BO~3(j2lH$O-eT@# z9lL=)W$xnot-z|e+aG@$%8J>;eA~HgkKeWf<*@lE%ihU&FXLUzx6kL>jk03yXBj=f z0kfCK+5`Nkd4Ta=<~hhb`+!yRkl%kl%3<>`%kGtPf2`0g4$Nxi5$=5u9EZ%K-1{(d zA7k#v7$0YR1o)`=IOAi$$ITPm_wjiWPe9@mT>At#PMRlK;wi?b7@r1y(mc&PXMk1n zNncN$%V+#@AIf1<=Mf`}`xr+VM;II2C+hd<=Qe}e1{n7<9%MYgI0k&y9AtflfK@Yw z{$Yw@j^jAjo%Ll7bKfEEn_wJgoMb%AIK?=@_#CieCRu)(>r-5x0nUotUBx^nM#Oo1 zrzaF~MqCi1ca=9)p$k)@KJjUZBH}X=^^2z@8W0yH>JpYj>%^}~6cl-h8pI`uLSjs! zMj<3xAqo;Ti^~#S5#tiIhzW^SimNVyuC3x}Sz8p75~anIL~UYPqIOY|Xq9+Iq7Gq8 zv|5xU>J$};)`%I2Hi&ByZ4}of+9aNpXtTH>QMb4$(Khi}iMER8T=anoZMTc(W&I9u zOQN0PwnV$d=OpS8FG#dUyeQFLaYv$k;;uyd#Y+7(AhGK~UC!kN=a2g}|VljWISa5>TiLr_kj8Bv+PGhoEnV6o+ z7ahfE8HvY-t-)j_YsFGd6PHrSbk^x$m`+8kK0RYtDLp&b@2uv^9LmGVs1eUZk}2cC zNhsiSyX+XbFW291q^Q+4BkC;uzvdM(iAJ;R3mY&TfoaT5kqQ|YYo)~gEBe|$G;i+w|e)F<;TVgz1NDxNvDm6jp%TOl};wJH(RNFdg}7T z6_>%aMI@Q%j}0)#hik?wl~VacZ*RGhuax(bnEm+)XPunBK44fdTs8x3(j!J%dLogu zav8r(8Z?@;63MKUP3w^%StXg0xpc&Mppw7Vx+<~;xwK)$lLIi)fD?=*`jgW6vd)Sd zBSzd=&po_4sXK**)P=?~to~dgLN=BIz)wbkZQciMU^8cfoDo>blNb)clF^4#am;GR zVvT9ztidvUHrFbtloi)U(L1H5v$1)DMp8LzXv8&tCIzjWE_b%5PY$Q7>|ol^qZz9& z27LnHb~?Eo!JHV0!KQBbNLBsXg(9~v?Bb4Txr3(CMg)-vE9_jzWh8V8&vQ8)Mlp@3 zb>4^#3}!P<)3e3A#StW}c_FTQ!eHVFMNt(wi+-eE6!}NFo=Xf_83>Zjp~OtIie8%w2= z5o_4U4kn{cC|@oYDrFgQdM0BaTG<{C8Ytr2_=ycuxb_>_$e@>ovPI8DW64jn1jlAX zUPfb9PY)msrEeOC^$XV7WFJyEF%pS*K9!!NDUlQ8Y^5jJvsCS_0&<0ti^Py&q%1ui z8!;@b5OT?g8Wi8{kzswvu=;W_tWLDbI$@+>UovAjo7g0JJf1v{6vA>xYVq2LtVuZT z>XkLHy7niLdsctyI9Ss0SYo1m7mVUA1hmS^HA${Wsdx_Qn34IPMc+Y8DA^C+rLAbp z%YT}uTo?88=j0;nYLm_(#D*!c)4G*QMKNcjx4VF6hGHozbtvWT7BURnZc)QE5JIF6 z%j*!dO~7MmYviExldFt0ty~-2d5#>wY6SD;vY4MCoj(TOFZeW~6v5xzW{`?bmGD)H&-GsKGl4>ye}m7Lhzi)%ZbFvaMSH zTwBAwWZ6K%K7%^@Ns#-ReV*_IBEGTajox^&n4i2P@~1C>V@?BUQEY*)WeuqCfLg-V zNj`O1Y!H@rg&GU>1lyO<+5=&I#9CL_@W6_vtIsI%%FI#NM6+3bGM30|6> zF0yT$Fal!2o}O|7@I+1hpFuyiPkXg#0%#+-bM$QB`eIfN*N>X|bGc3($?(n9g7LiI z3ho4;*;IHo@`8`2nO#OTMfxN7wksg_>kLc@Tyx;psBs3QYA`Rw%InekFvUtM7zbp!1rs)D zWz&*jhUIa)zRSM~)-t(#ef6NUp_1*(w1&DCzoytLE7Ak5>od6Fx|vQ9XHSFl1YN`9 zJfYYWtTl6<-9HPCGKE*O+Wv7+t(v>9hMPyclq2?L{fu9MzTTMRVyCfEm@HkMz=fn4 zc|-*IR=sY1%Zp2t4g>9yW!F)6kzUmT?2B*fRyhKQDD` zfUDeEoW5SDt-^P~!(LchTZy^W`AYbcZ$s_X-_^+2AT=Q?;GZ@u!| zOd(DxINDK4aQ5rMS=Jo&54}-46sL)=P_!%6G`Iac_-TQ>i*NfDkwx|kj-4M+<86?o zg;Dg>7xt&i7q)6iVLx0_Sb6cNx<=`QOeQZl!7Re5N3(BIK|N^GQd!d&e~Cs;q;^G9 zgC9Fv`Pj(k!suv1AI7;i7mp95_0%BFI;kvfWL0MKf1T5|uI8t;HCEpheoB>rtpiQY=!hbHZU z^`q&>#Ia~-dN%eayoOj`AX0b2KOv4qCtRf-g;ss_{)spiRj*3ex+R7E>+*%s23B9Q ze_y_^t|f&%SW?)+brp-dyPIvIjvJSh|I?-AyUQt^T-?p$;l@GxsvGE>N_AJd|0dqL z&M$8Vi@!@@gDADhk|ww$0wTzJRzt$x0$#Ia{v*zE75N!@mT9l=#OWxA4SSK4_Cx3k z;G>l8#<$a4vZuw&7`+PCkARMzC_ebrT1P&j zE{pE}0klM@wFp8R(he$&5ve8Ym()mi0^(Zm@ojPm)npTLm%WWhU5Tm+jsn=KBznfM zUzHMfk}zI4zeuQ-j$x9x=!AV8FOx(}co)g3tKO=b>V?oZLj9*m7$&@%3anmup}zdY*^(LZTDE<9K}?x7F0qo3Ok>($SZX zpW3WEbMGge_kr}tBOsrD8)izSI;YLuHD^#|liuaoWM55*-VFR3^#PJt*JX!mnxjg+ zgAmq_Odltqd>E~p>BnoTSrw~C{E63%)h9{fqOn>f@#yj-8q1e>j3mBHq^^!bH6{Aa z@dEa75_X(OT@Rfji3PA#Whm_n5&X^3I_&N~)z@`AywTGeJxkyy`2;xm+H9X7bd5-@ zr6Grb=iSWP7r&WTg~=(%bkrku-Mqd?lUj6Dtde({bo?@rx)R4~O7zTRzX2g+gu^6^ z-VW?TMCux0oWyd?*Ve#0m3&-g8(Vo#Lp z=ZL$OKDVIH9GRyRue0?IL2rVGoE#%*Y`M1xy-lQ+@Rw+^?|`Gq$=+mbnY8j}hk4Kc z@uVK5Ujl~ptkWQ7CMR#yPv=)?tiobrRk`XcxXgxw2k@yMP_NZ=RsbSsiJ1SYq}pM6 zMIzS;wM)UF&VSDv0_%tBUT=S+Cl&gos5nvkee^AiU2X(p2kybz$Bk;04ZWZ)(~(3z zr{Rb!lo`ctmYU#^=ix(}_qrIT;nn@~Uz_Yv)Vc4AwVe4iQi%MvR_Um%jDJoVCV@+5 z*f+?;i)NS~B3|Sre2Gg(-nU3>-N^gIY2@L3Cg~5usYPb58Q|ZgVHRC(eeGXCf6ANG zLa}wPNxw^`Cik}R8%UMstAwZjAHu&+I^Q9!+T0bJ)>k`9gx4@$TsX_WLUoiZHpQ<^ zVPmsf*%NFho)wMmtdXz&lZB~@buDjC(Ep_QyXs-|Xlf&zHNWrn~bMEOD1+Dur(3 z*833VwCY}!VcXNT(`Z?wf@Srn_SeBM&zDaT{|d{(^D4=)tUvbb-l#R>rz(3E3{}Pt zpfZBLatjFkhHwuDS-!cciJpKHEaLx-xT*x7F5D>38;>)K2Mt>m9&;`0hcuuDIW4OF zZG82NxNG=zU?)_$QJR>#VpF?KquS(mn`~!OaM)oYO(0GHLpp7im7kiL#$0eWEnAjN z8?<|We3sA(BBZo?(rhKvMx>p{Dk2?3RukzY!cRK<3bT%i>xuAd#lzKtHY@(Q!rnw^ zGZDI$+ucOy0Oej0cMu|PySFh~vg{rrdx$(rWG@lE3-l5?K!nc5wn^kL5e`*8)$&2~ z7}fD{kI!GHsL02fGlX;^eMHDz^CG;TiUUL*#`-eC{2cY*OuI-ZPvm_f6ejGxMSb0P z(v8~F@U>Dd!kf)XquQ;8v=+4;|61^mzCGlX+7W@B+)5lS7qxllVcpt!Tpsr1c|C}` zQ}%Xywy2GP#<13+g+i+K3vC7H&$U&c|D~+~{SR#e=)Y)NK>tzO1^V~eAF6X%|6fwK355wDFJ{d`Bw+zo|U~`kGb&eO0>w`m**s z=!?p2O$({Y3)(M%pbyY5fSMWo4^RuEIiOZXKLhGu^i!ZtM*j)4meB*CE=K=#PK~8GRpUn9=V8r5Sw>=mMkf z06oR%n?QomyFgbNy$w`i^g7TrMy~+fWb~498#qW9cKC=(O>Qapzf=mfg+ifVs38=_ YKl-Lm15gwG!qlr9qbj#sMN9bq06);a_W%F@ literal 11501 zcma)Cdu&_RdB69PA|+XtWLcK2*p5}lkI1nlzwP)HUy)Z5EsCW1kgeM|H?$6I$)+B; zq?Fjr+jg2Z&7*bOv`f-i8PdTkhHgXAVZ%0H8-`)Ph7H*M=q@&_z=~qtqu8KrK)tQm z@B8lIl^p6)rr?jibIy0Z^PTT;Ui9?p)r|^1*M9iw_-{rPbw z`kPIK`oii?1?9RENE9QEZ)53fkJib;nFrxs&U+0;}fZ-uRE9teD-*w~gC&d2QQK4x3M~>>Z4EGv3L3dpy3!QC7?zmeCCy zFnf8dUBFM6dl~O$o_)--2Us=td;NP*4x0y9cCVcK!9thVJFl6Cxc5GA>^Bc{?*q(z zgt-qgKFatI@L}^w#z%mUn#Z{BlS?EXgT&)pdmJ1m%o8l}B;%8ePXRw=o?@QUz^eI_ zr>D;4(_Xm`<*=#qh!MtpjH8Srj1BG+_4@R4o55`ZjQbf6G9F+Y13qI8vOYt=su@H7 zFhw!Pah&VUcru5%?-2J*Fpe`$G9G4}Vw_-n7FaQpEI$pL5!suHnG!iMg732via0IK ziSsv=+p5sTs6>6jlqe!TFHygETA~4QL84Caj6~~&B~eg3D^Z=uOB50pC8`%=60H(K zqDE1W=#scBQIi;#XtkJd5p-=9S7hx~QIsexCM9YSQxdg`X^GZ|8Hw7&a}uo;wnXis zB+)uimT04xm1vWglW4PeUZO|E3lepSYZ5&su1mC4e8EMZsL*zscv04G7cWV)L%b}} zTDHn?W-p?udCrWLBsdrTgQ1w8JF2L(b~# zXv(l6gGOX1mKbmX`qVY2K9VmM^B0Q+Cm5X=D?7pXM5*l5CuhnN(^L7Pqc}|?@%XSc zn9O9YSjuVOQYx9wI&BQosfg95XACQ)X9xS8wOpA)c{mw0;+aS?W!yUf1)MII9V7SU z`umNvbxuzwP_kl)tdSnk<4!Ac#1fgTo`@J$Eb6S`nnWZLw=zi{!D)#{t$3_2t*1xb zibuQ=v*}ninXvlfdS=klv)P2x7*9s@xRuruLr!}n7uBtiSSHpNH>{{J5{noaXAAc> z5(BXWMuZ}IHU=5l*szhzWvz^yzMhI%L&m7nnmJ(U5p>K@kyLC)O~#0%jqH*Jrv1J5#ydp{_1d5WDRm@!-^*dV59*j7)$ggrSoN-6*oqVxU+$KRO+Pe z6c$n!8qcu$bBPGqSPlR`840#|AGCqZoQ-luU?optI0Q>ZA5O(FtL@7*rj0WO%k ztE5s^Tpva6l%CGUmJAw6<*cC**Zi3jv~oJ#*`huL^=cm!x$VI&?wFQ4Xew<)5Q(tDjt9AngihgkHmAcVrV+Ky8L@%EY{qGL zp_sQgf}}Oi$MuRZn0P`_R7K9BAL$oG{!y;y5<^x7f~0dOG1K~}l}QalbTT~zle$x{ zv_vrfSRDPM`ao7{w_KaWSs5AB6A8G!t~8T>e#+UzlX2x*!?}1imP#ih*07NsOh%nh zzEmodOETj0OvXU8vOVtAQN+3N6C0**?KiTK!Acs+7Cje@B|p;=9Gew+8I4&zJ%BWn zzNsJ9&s%4beMsTNNF-A6sq`dGiJTy3D?Q1crD}H-kSmm2B!&zlW$E$Qh+$!ckV{6? zp!jZ$4C_ON)t8H5b)r?)2_psjk{QF<%qG#}@#HzA5SBYqi`PbEO~P?kudIR9wLgj6 zv-(p#dAoHt8HfY?u-|ty{TN6mv#;y9;<`D3-EP`%~_2A;ZA!7ByT0Aw>GHybeLz1U#0u zM)pZRxyne>x@*H2{QJPC9;FEWEj$WRR_>@mEh|^FI{~Iaq0OrzFt5#P*ujDcr}=zz zKt}sua@e@9zI;98uBUhF9BsPfgf17#g{e6wIFm1rJHac{6H`uO;f0y}l$b3Q?7NEn zc?`tl{=wealHFUJ9?KVdixU@nXRejUr>73|?AzO0nkX0c%;d+e<}VjYyb||9YN==D zn$v+1EK#_WpDmW%M6~Sb>GA+gf@Tv`HMLz0{=&Y1g719oG+Jp!Ej%N4eWxkeSu|V^ z%T2(}p|q&7i=IZEv;F}!c*kHp64c=tBF}~7ErUYwpTvTd9&0%F3Ro^k^4gs=WH z=*RYHtu{>nZ6tSr9s^uo%*)~WQB!*^bJURx-&idej|Q&bb^w}9nP)?ezTwUY&ZdBM z)V+6u_GLnWiK%jJr?Wq z0=ZjbU`k-$f#0UaGDy{6l@u#&KRNnGu~(O+2VB=@aBp=pog&Vj0_hIAh99R23Rd5oXZPO$M~T9#UTym{ zs8-G0Q^U<8Ud|DF^IpcULf^`mG=YmpBl3s}V#4;d`ghUAz5-G;vS;-U zw7S73RGK!8E&^BG4aBBUaq9Z>#S(5hWqY=O_~)gL4S>@VT8q=q7yMQD9(dRb9sWuz zG%r=cn|upu?*=|Ip6^_L1KgZy&D8@{?7Yy%169_mikm6KNd-qcObO0@eQ=h(qyC^W zYMbIT@KuR+C0}#fFM^*I$Q$^!Un1g{s=q^xFN3TsjH0Kuus?WsVQW?t_QxvpoUn1h?qd!L@tEDNeP|J5n`xP)! zl$|AMEcdlqa{rPVX{}ya;@XFk_&2^1D=UE)nzRenj;0?G$FiYWv9UMdb;SBAk(v|! zJK|V&!d2=~Xw_El$HcL$dR4;KuPE#%4=;>1u-cma^x=hdt|;uERuuN&x{Af!-OV;r z$4x8B|JRk}yUQt^T-?oLapQQDI&+|ND%D)+enz}ConP7p7H^lr1~JnjOPb)42#6r> zS#=3}3wX_@rH?fatH{5jXNmUucASoa*szyLX)lDn2tG>bE_^$UGxoHY9i!L3+7Yk- z?&V{%k~#~tn$sz?VpLw3Fwj=&O4h`lxVT06-8uODai6*@yZ;B!5~0?sAhaQEr@}=d zev94zQezRMYEklRLf0Fz3AxLDj7Uw1czf}=tyGL*e_2Z0LBcqm-Xi3uV~8X!J7G`9 z0!hS#caof%>b3f+7eZgQ-XsabgdZnitll&sKlR#4;&b5eH(^D+T_mTbdK-MztFqn` zo_aN{w|QmjN!W5plx3Q0#_K7MNR^32^sI`84(+#?{Lf9qyv zW@?-^clyqt$|k)ef8~hU?JKb|1Mfz?mn7D7*?wPhRH?TQ!upZvblY53U@fMMqI-c>B=s713Ar!DrlCYyhYI-O|5(U_* zGPDtul=BN)LEPP^`nrzCH+p`fX9*l7kAsu1&Gs=uvqb!shAakNax-sT{$^ekCMO}& zQ4iTQ^ZEi!YS~q>O5Q2b@vB5?O1$VRv0^6sT?io~93WvOBKwKdG{R*P`ySY;tY4+* zL2#LM2lgL1e6+TzlfJ4}#c`ArTzM6LjwCLd8C6;uBoXY2{SFa7=g;}-Sc&5WdV=vz zK=Ph`CrEeo%B^aUMj-9+9C?c{-K_4`edhj*-yF*J#Eks~;_%bwCFrw2=4r?4Y^_7k z*T6$gj*&FB+-*W%C*mjkCQbI6;HYwPWwLf2tw>t=^TLv6{&-T4(u@DFo^|TP?BwLN z+UfizjkRn#SGnp8#x(2p?Zu~dK)p>em(8XCM9>nk^i@fu?`^;%%@jjFEhT+tzxrcm@hFLa1Jni3vILe#UgJNr5lfF-;Cigb+8%TGv zyR_0mXh(_gV#BKdr{nunM^SB4pxNYKo9)jg;|bC5&N}%rKUtV6TXT7Pg8pAa$q7#7 zCkta3)B6yvq)llD3NIqS@NC*p2I^F9P?*yXQrZUy@)wm4w2y)})Ynxc^7Zf}u1Cc} z*Y&op@qDRkYPu_5#xitqwp{2!{C@~xPP1OAGHiR=cIqvQRIsdW)&2+!OBR%;iGP)4 z;R%%FSk@0KwyD<|@pF=W2MkrI;iYF2THPDgyu!CDHPIb#f<^ov4p)`n)xx#XlJPkD zdC;(B;lb6iexC-^Ag4*Se+6INId`3%19n2?Ycms5mu+gdX;hmWZ*o3sZotwZSSgLek&Sr6?@~irliG^ECj8NN1yxF|2)=f1B@UO1 z+A3(Vu44&T1y|%%dJuQJ?Ctif57dXXCM^_FwV!LNK>t%)1Nt*<9q2!68$o}fZ2|qU zwiEP6+J4Z#&`yH>k!FDYt~Lbv11$ymeJuz2YuYI2ceQ6g=e04=54G`-8hl?X0^io2 z1ARv;gTAF*1ARk#3G{X46-~o!`!((VfS?c1&w&~l{TEOZqXnR5M*jiS#^~RG+8O-| zPzR%XK%IiKLa|(=ud!7G5SNG2&3Nv8f5g_ zK*NlF3n0g<3+PP%u;%3geHy=~D;P5DHSCuDit5{7h5${{be}p*{cr diff --git a/vllm/__pycache__/forward_context.cpython-310.pyc b/vllm/__pycache__/forward_context.cpython-310.pyc index 539b9090436b32853ac878620ae031b924050e2b..135a5b33518049c1589474ee3e1e62daac47d592 100644 GIT binary patch delta 62 zcmaFK`jnMBpO=@50SFA&?%T-C#HeDeUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrqe^8z~pO=@50SFA&?%T-yhE>H#za+OnzaX*D$wSKPNLu Qzo4=tBR_AmJlir(0AZCBoB#j- delta 66 zcmX>oe^j13pO=@50SGF$HEiU5!>VDXUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(Fnr#^;0JTUJtN;K2 diff --git a/vllm/__pycache__/outputs.cpython-310.pyc b/vllm/__pycache__/outputs.cpython-310.pyc index 448d4fea40015f4e5f0a3755a7460931921fc969..932e79bd5c98d9742055dfc3846fd3a6dd1b81e7 100644 GIT binary patch delta 82 zcmdnvz0I3DpO=@50SFA&?%T+1$fjbfUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS jUr=9}iF$3o{cV%YQCLF2>ECD#eTd1VI;o delta 88 zcmdnyy~mq7pO=@50SGF$HEiTIWYaL$FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` pN!2Y#OwLYBPc7b@z;;zufDfpXg_((w*D$wSKPNLu Qzo4=tBR_AmBGWfU077XLUH||9 delta 66 zcmbQtF`a`upO=@50SGF$HEiU5$EabaUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(FmgyTK0F(?BZU6uP diff --git a/vllm/__pycache__/sampling_params.cpython-310.pyc b/vllm/__pycache__/sampling_params.cpython-310.pyc index 31c99bcddbbb56e9ba0f857edc81b16af1a23f59..371575bd70d6a07d3765ad30cc3774f25c97eccf 100644 GIT binary patch delta 109 zcmdne%DAqTkvpH4mx}=i4A<`4$bExJ#ah24w?Mxjvp}~bu_!&YMAtmGG$YqAw_HCb zGfBUovLquvZ!lYgb+vW<@$2^R4CdU}nvT-o7 N{AXd>eAnnAKL7{XBY^+_ diff --git a/vllm/__pycache__/scalar_type.cpython-310.pyc b/vllm/__pycache__/scalar_type.cpython-310.pyc index 8aa5fca6b86f470e801c8ed4aced451ea1624d75..5f2f2da98c8e9b064208bb56545f9570c2698fe3 100644 GIT binary patch delta 61 zcmZ3-wu+5ApO=@50SFA&?%T+n!=z%aUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS PUrE QFQ_cZ$j{sSfJsjf0782dOaK4? delta 66 zcmeCu=+ofN=jG*M0D{VG4I8=FGHICWmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtI%!=xt&0F$~ETmS$7 diff --git a/vllm/__pycache__/sequence.cpython-310.pyc b/vllm/__pycache__/sequence.cpython-310.pyc index ca6591b5f54f099a40eaaebb5bd66414fb6b48df..de030385e1eae8834c7dc1b7b6aaab0d983767dc 100644 GIT binary patch delta 7581 zcmaJ_3tZGy_V*6M2n-1F1_u#AWCR5Nz7_LTprS(AYKjQMFak0R!(|{DHN;nGzEA$u zd_VrCv_>|y+gfX-+gfh_Hvg5oO|RAJ?`~_at+s48+xtB~hC%TYpAX;9x#ygF?z!ij zd+z;>=bEnLn$B1s78cS={S7;L=9KZ0A#FsCtInC@tZ`<$EV9bx${tF)d zPNJOTBzh!ivRFo!lFXuMd;bj4O6LBr8hAlBL(Bx+0Qp~~9o$EEzq2w$vk1j8c zr+@D=(pSl;aphe)Es8Sh#WMCv|2|IU8`(jnu(nGo`1E^KV1N zzB5NM?K9IR80K7bMbqckc3L)Qy^4Hb`ZPlo)Z8>DJy&gfP5OsMW^7bkZvssok`OOZ z%d!wqt-u%P9i9V&TSOvjv&Iach87Gr{g?SoBkagW09xVfq_iO|q1|H8i-y^v==mWF zV!D?QSFKx3qfLY2Xi8?3*hX_RC*8EwX3gsH%xopRlg%yg5g#G0eEw}Knv}7jW2)DOVT9vyq zs8lgj6)*Ip3@ZxKx2qA=k4+{T+t&z@wv8t07<(j`4_KE*bX){&7)M&Y{SvBfLag(~ zubccNhS30y5-<9=8hQg%C+{rh1tBURbxv1Vt*u37L6;#L)ENrMn;iUGMVbR<%O;wY zHz37tlM}%SgH8D&)KG4l^HhWLJewCPQo024DX6e3F`ar~JkCAqEM1?l+345R4$L_^ zc1Kmz6H3i%wAV{ZS&hS0R#Vw|oX*pTiFbtk4n|&9pz6GXS|`Q{ZSDnneBvZk^VcSR zl5t9j)palqs?Pwp*Zdk>gVwBG1NVUE`XsAJ;goTbe+8}wfU;8-IPM2LE2ad9fy_q* zc=gqm#%g)Ko5~xQvz-o4-4up=bjDe}!F#<(#dngCr*p+<{_ZB-UBiWgM%`sie;U&_ z09fl`P${s}y|rFqV-M4tcP-S6ZG;*d3jvv{Q^UsV6-Ib2gc zoj2X1Qw2FuQ>~sh zwx=p*PE!RrMN@ryTCoga& z82}$DG$nZ!5DEwZoCBcD1Y87gX$=6y<-^6Xsn;Ym=8ST#xZiRr zILI76ZpnYfym5f{0Ph1n0C2zZET6qY7(c@JV}P44`P|~UiOd@Up1DiP`}_obuHO~K ztW-&9#GXQW>2;w2p+cvN7V-)neV(hus|<0ol*}96XsL7BYaCT&PK&hEHOePw<-9!6 zLBE}MBM2c@r@fBO-B+3kbvYYQ1SkgFt-u^D{|fqV09IR_Gv4shG;^G@_);$V>PQM7*HH zzgFU}gA@^B2%?utCdB;!d!7A&C;07!zocX@z}~+U;ZCPlN=!6op}D6IXJJJ10pxki zxlT_moX}I13s>9FIf^eWjOc3G^7no#sO-04tA3peihKt;f1qzmZ*BgQ z77f-8cE}B-_JO9hcF{=jk$U+=(;pWN?9V|Akl(>#R{{Il^GB#-Piom1n=6&`y+tXg zdgdzXO?OvD(IjhnP^9{7(%;Yva#&xF;Tc7+HVc3PmqAMPEh9_r@r|Qssx40ZKb6?7 z1fv4I!XZ~s{^B79wjK)Wp7o0jBIZj>84Jh)WCNUZv}!^m`}8%&BNf0g`nqblfeXb= zP1Tv|>3yhrVno-QRYqa+=mHt)HJVWK8}TJqwv(>bOp9PkY?B*`ne@>jkj|F0~G zxj7u(0E^wO^$v9hm)z9+`0!|L1>`1F#@pm=JRHLf7DcVC%876jF4p6&amLFKa8Daa z4aG5}YZ~2p8oc9xGk_)l8lrp&a29}@=(e}(4G8$u^OdbfK=>;-7*q(r2nYuZg))~y zG=?#N1TkJA=aIh-P--#^l0Ja`fE2($KpKD#2nRs>F1Sje%`b?nd^i53xlV|`((I+n z#TEW&u+Ya#M;Iz#^*id{k~V?AGRzqBTOte;`c9;^l`_ttIV-xc1mb!{c%N3oueOD znGGEnXH(YdRguprQuW~xu*v(%q!(Am8#Y2iyJnWtKUPA7uTa~XN!@f_ z?V28PL6P4>=MVJxn*44$Kl*i0AU|q4mbDHe0>XP&9(dOdHT+wN-I>@IrLCJDF$UtX z0QTBVE7pB8$*jiSz#5lLJ#d(P80I;?h^4kS&K|7$zCR{lmQH;J9pF}Sm|lMHVgzTA zUt=F>E*1wx)9Ht%h@!VuP@->VT0GzFOP`9lR2sj-fpw0nC z!pTtpPEI0toR87qEys{gpa0Fur)oT;d7_U()Ea*j%Sk8;F`PbKKSwuQ&>Jl#PsxVo zgt$asQ3B;|w8srrx~f-C!IY_hOISeb02emyNMC{BWC&J)x>?T`ygO;_rfpG2l!Dh# zU$Mkyb!lfLAIqCDJ4LS^sLD4yQ1wB;xd?hR335w@Vq{~~QXyJ}v3fMXz0*=W7 zOy-QSS7I8?+?t@9#zCRgTbGG{a!lg4StB_nIyn`-Gp$ zniuOH8Qsl`cOS`!VK0ihykK3Q16ezY4AUT*MQuCcZ@az;Q!U63N?GM6P_G_IDm!{v zq?OF|9es4^bxPtoG*>=iBAH@fHkv4Yya`W1Z;JUhsy5wqyx`g-*Pd{L82 zy}gE(mDz0$6?~i}t%Sw?vHJ$$79kV=;6MGEgny4N$)vYTbJS zR^;xDD_uPTZQBo-4OQ@{opKJ%61AQchx+Q2wJk>mi3)n=NKK**Qa(6!psE4&0N*_} z^JvjcKf3ybAxo6rI|yOhkqbvfK3ie&AvnUO@SChRz-n`xO^kzs+WuL@5#@dHkIPO-VNS)C8>$No)@-K}Cw7;!RvDOF z47?B*Ll}G=4gs&=fBifF0SAps#eZk9e+`(?2&e%xbJ5u8x%R2T?)jFM$U@wE|WuF!z!7gI)^oVyzZXZoo3Y z&zkTCTJ81fw{^DEd8hI2IE7jC?%rUrj<%l~7#gAr`AH}A!tk{_ff_oZ>8(@gtsMUh ztisv3B?;^j|02bi_<6rLsdkw1Z<5^(sXyL01+fv4k#UA-^?#f} zR{Ae>`^+R3(y!B7MHNl%(N{Fk;vR4GbSS39C?nNh(gvu)K%`uX_A*+SF;;k~E#p9z zRSg89ea#++-CgaFm>1~cYw|c9vX&|{-_8U<>tR`>v)=2Ii!r#8W@jgh6=cs^Y^u=% zjddyXm#jHSYtbF9z#?R=7AbBlR(~7aR&r(A#VWd#Z4pc9yX<_imhyUDH1T39sj)7Z zqIxYeH-n31gKI6LgT4A2=0wnY2m8>cy>iodYfM<7SQdkXo8%leY#9~zo|?81<3_m# z<4k0i=p|0{wudb}CZrQ2EgF`SAzEp6&VA7jLxECE$8!cGY*rnUP^@B5-SkmTbzf)= zm~0-8!&NPpV4S@JkEn&&AU8Gk*_kLIV;gSTW?t^Zv`rAOw+xa=H_3P9&h9K{CEC#V zzA0h{_31k@yc6Z~V0_@mb$tU_+pz%0p~Isg(}Ph`jwjMK+|d$^~+ZKU)%4p znFqHiNuURfF6faik>7F#pk6`9=RZWy{3q_J5g9y#S<^!-?H8?jyyZDF^vOK{okV-7 zcR{oHcHf*Wn0L#rkUl~Ch8Jd-cB$@)96FJkPVU0oTbRqj%(I0VVi#R1boInB(uQ!h zV);N9uTLG|V~B56{~ALZQY(wz?>}i6j`Tqp^n+wF(K;N?#1Pn96}>W7k1P&?5-j`vaR>*dM%bKBOEwj$#tJ1%NyG zx&;C@CmtW8^D{}ht__;Ucdpsqkw||j?iOh9aa!0 z;VoGRIKm~eiq;JJQ8bq_As3)h`Uej#j;6*DJ#$WjmZl&Od%w-uEyWdaOCk+v9`oUy-zo$Xo0$|owv~m=LYMmPcud}kP^z!8STG=*? z>eGqlAcN}epo%F)X>UL>T!Au#HF8>ODw;zy^_eNdI#byZOr^CYk)~mq+PmZqR6ZhF zE1DxTb@QF5d{i_Q%~6{ARmrH%2Jq3+R5ZtGYIW&|&Qy+^rlL7PQ(q}9*AC*tuaC#r zsT%|n>Gi2A6=;Yv#tDNVMaU~$39pp5n$pS? zDUjf`HF%u$u3D?dCT$H~d6HIDjuNNn=atu^;b2t-Ty$>E0?K(HIbGhXMl31vBlVa3 z7yulnF<0?4Gy2WER-_z5`y)^>8@3+MP3Q(_%>D5T&-$%a* z-srS{sdlJ7@Pweg_eQ6g&Oz6AG;sd3&dYLE>SfVavS_@M8PtbCawl28mCeH7|9Ax~P;QXGxSTH8OLyyXZQ#7jTE`6?JZz$S3nzpX$ zZo^ePh?42$>KJ;psz*6`awH+y}{LN+hDn9{xTJyzlmI<(m6evQ3>hJ-uL}{|X zfB|3xM6%q!dZABb@j2mp@Ed5D1r5Q6wCQmCB9X z8|gYNw*N7e+2vrD0g&x7hGtg3YGz4=?)P^Th`%V$B-3KY%Q48hfN;q*G@+)z#G2#% zvPON~eF6FiK!3mhKqIx)j!t4*zCs`63kK0=wW~~=7&zpG>YaYDZfxROP;jfr6l_|b z{~L9w>Xn*W|8wyLXLBQ6sV_}rZLF6|iKdnDA1V&bY|NmqmK0ikgbC_W4(mMwWAHKyxfy)bKhxzj{Xwe4ggcaou9C$Q5KL+9O7lD>vb$gNP)w)0bPpvPkPGQ^xGdee)Z z?80_%J0|FzY{3{?2a7{WzGNl2jk_lGh8;NoPW&jIA252{9{sX|I|3%@XmBr8k7y`k zJ;C(m6}8{QT)s$-5p&E#WN{V5|~g0Tcq_0lb?5SZyF6 z0b@mI9YyO&02fBRfQ5E9=OtN`++qwE)mNsR4~G6~x!mlG9?X&GuLyx?ucOggZS&dm zbyujy?vq%lOkblX^-?rADw%e)#>5R$B3(iT3$m4^B`i{eKO@FJP?8lr>GS2Obh$M) zv15NaWEbcktrinsngc0+eQVM$)I3#@?}k3!RDb%#`gGGatf!M=HT`w{qML4%+isn& zu;@ivy3F9TWKe`JN}xf{iXS+{2y- z*2#}HW}3c-szO%P>%nP>BS0Am;BDw4x%I*K#uccsKo|8poq7SW=rERHufxN7!yHen z68cOTgINak{nUo~M{T}Hy0Gbwi5yveu<_ldS9$uOiKZu%QcHo#o)*p&&Kb^>a57b4 zT~3!wv^be~-A~c&0pJLyqjkrOg5W$L7Ql~!Vc5cO0LL>UVw7rf4DZ3`%n>NdPc{>2ie5Z{6E(4F)Dav>vTnnIT6{rghtPrW{d(fXTgRvBU1uC#*ypGl9lz z&y0r>Rb>}I&3r!13GFeoe*4AXa|P2UMk?V3TD+r=m`v{;OhFBfn1~tEV8U>;`YXVd zjP_()Kd~iBR-$LVvtxWWD3Yb%bMUkgSyR=(I7Q+&cXULgdT*<@g)v>osU2RTmPb}b z{#{LHCnY=-L)km$Cb5$YawarF*x{dpJB!)OZ2D&B&7q38fJveoI*z$~$)+060|GnpB(Fn`Z16D*Wvw0ckaovb;KNzd=;ZYb}t#sBr5u7*OF zS}!1$1jJJH+iL|hAWHg4^*7aOMRdBU@fAa;e1CU(Yp;5??M*YYF?`tWCHLO$X=4>7 zbQ6cw+)t10T^)ZfWWn3Dg8J<%G`*`dujs`J8}{XP{%sXAg2m>)_QjiafSw6@l+)o- zjz@}RQ`G(}ZO0tY*%h2on_=^xX!?F>Mh3`vTAQjQ3COT*5VHkYP`T^C_+FJ@JOEe# z;2#Hd9-^ynv)R;qAlopT{pW8#kSf$GIK1a-&S$9D5A{3f<41>Q&Bbg^eFvyP7gS?( zKJ&5KK{kix9vt4;4_HBGLmq5uW7Tj*O1ayu{&ip$f3^*@TElJ`pU9zMm+|c~ zP&&69&J%VzeYifO1~fh=F0|?a9zf`xEIl$SX)Tt3*VS+EVPWhN#d{MDY(4zjBVr0` zVe#YOvns2i1dMi@PqKQq>duW_;gD{x)mgv95h|K2WK-M}ceKc8GQ|1E9L*Agp-x?P zu4>0}br#?t*$!9<2%jr_E&L0Xq|=rsiw1>v(Xnc1C0+!EOD}*`tn`2U` zi2cfY!X{)R0P2*7x!yKmfSK*|#Ib!gW-Y`Zrvop<>A)A`PzZR1@UyA~n_!3W<1Bo) zv3(LVe1OG(W%~YTptJuu(a@lynb00>F!4fm%06B$1i6k66IbbpEj2uY*jXds?oQcp4Z55>f;tx-3$X)09FE4 z0r*RJHCk%`SE029t+jx43M^gaaJPC_)4F0_Z9L@%)3U7xiHt#8%0N9;0L+P;y^$yZ^?*|ZB-Lfic5Cbrm0?f$n^xp?SIo|r`^&g55@ zf;>|}z*OOrP3oOdiIFP66~Ko8-Z;Bp0+yZ%;ETB&t=Rw@fR7CC#fdI&ayd-wPUTNu F{$HxGiS_^h diff --git a/vllm/__pycache__/tracing.cpython-310.pyc b/vllm/__pycache__/tracing.cpython-310.pyc index b4dd2a92feece7097ffe654585ee96b84546bb92..0914d51351cfb170c5dde0f3f9e8267b06f5f08d 100644 GIT binary patch delta 62 zcmaE)bWe#ppO=@50SFA&?%T*+%&cOpUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrSy0Z}9Gcuzh zI?8g{k--skUS<#n+HnO@aXpTXj>3%pY;L2&sOUVGaqy_`e$@#u@4fTRd2sUet-IB& zs#{gJ{+FJzJpGi#5lTtvpTPenJ@DiS#}|V}PMR1EgeQi5;i9NpHW|^PX@R!pz@$LO zM8B_LVt7-uITVbINp}n3qOF5>hziQd=wvL2rY9##BVt5Pus6A!Vi~25N|4onRTLVV z8A~1Vo=92CZKp+6fW4O7o^(-3gEIA$bfTLNzdhk;=MP}jNBY{hwvL|WA0bEs{j6VZhxDx zP|A>$*C8OQ+w1LhzAbNNwjZvR!nY+Z*Q9}v<0>hd-WCk|f)}9GOt$>;-hkKTe>f2C zoEFnkTq5fsuc4L0wuyE0&ai9jKFD~ulsmjY)X<#a_h;zPQ4@vvmNx-vRJdVEDcCnd ziD0MVkZqtk7@Ub$51JXS6xkNkLqWYaQm=C2qt6R&%kPGPO3w1y}fOw z2MUY2S3@yV&gLIE2QU{<2T(bZ%9Lqq2!;G|1DMwXW&jL86JR4C02l}e0U7}jz~uqN zhZ+V?4R143B*$imH53|AVOf(vD?8I;zaBAPaMq@e8o}8&ZPX9Ot1;XLtF3_B0k<+> zTKUIi54HvLP{YQEyaSmN`^Ts}k-q{8Hn|1LR~-BZTux+~JmyVJ$>I~giiVG!o2JGK z6?qpxZH$7OnamIg36W$b>EjdL(A{VQm>7q=cXUEnGqAcfTv4ajeM?3aG zz5}pVW%SzCCwC;vOaXZd{?bmkP$8cfg5h?F_fc17w*n&2cvj;z7`Y2?gRO)Hq?p z@a^CpVQ?k;BD%ZX?en`E{DxEOQ|*}$7Cn?*^s^Yzs z0d!ySHgO_0b>bKyPSX04T(O%aXB{N8)y~b|uj_CAIxpp!7ta zucVlqR3gL^d>Rd<$0rwBPRAvGpBxlV$F9F-ruQ|k1ym(R|BgA)Ti z$d>?RfEVfcsfFU@*oCQg2(g0NrcD>m(}U9t?N^Y#LfNHV_CGSoqkJWHcWJG4uu40N zv_k$GBo?`eY_l4=;{umM8r)S-?`SrH@>OX48d_;)lEGPQNO#mwG0E4NZQ5FlO%Z8< z+HV1B*If23e+QjJU(^UhaIw^~*MLKO*ynm=VkZ`;(e=r>2q>xpryMiToVhGJ$QmqXIGm~~N87Z>p z@g*HOKWB>`VJ3Q`o5F^(pW5&882Z>wl}jh5Wy2r`kPCQ#?pnG;6vTeJbh;3a(!h%R ze6@@7A;k2WiEX}Mw3LG=1ZxB>uV~T6f_ymkWW^Yf`w=UB$bbCr?K3@A(-!e{8B*C7 zlUTmAQKe^+e1sLGGE^f&FJ__<2uC-`;c!>b*P}XxooUhu#yG%uzyv@MARY*)lkiy# zY7G5i`7Chqgovr~b2EA3Cs$B~v$6H+}rcv6;-Th{Paeo5cSU-|pTRA8T z^C~}P;7q%cBSPM#CVzjxu<9 zmCsTvXyBf7np>NZg6ZQfDxg|S?%MSJl}rxiqk!wK8*A@z{1Os1M-P*8b>3JQxCRH@ zoqB+)7`aJz`~4vgpDx~b&qr7v4k@_$z9D6-Y^M5xzNpXb?=|Qx;%3!t9t^Q7xzQKA zA}puZ>qhb={Z-xO(eWffCP(Bvgn`iHwE$Skd4R<<>Cn*WaxT+@IO<4$7TXgtEvZ&} ze=bhJ=MB*h0sHx6oXKs|8g_f*Il3(N$(nJZ6nWy*Oe<>v!tsm!A$Dcj8r%GS`7V>Z zonS3104l?mQPsM2!)my_hFVDoLjj!+ z=I|!d!gt9kmN=9ChyOm0O3vj-SXUccRzr|Y!>*en>S)7t2defXK5ING_)>Ay@;a#H zN)B=<*TBov;tMvh+U1m&tI=UGgS{@_i_J*oB!GZ43Ji*$8)K;HoamK{XLIoEdT<# z4Qd_!pk4zTsm(J>1n8uvL<_Q|CxPBsow?JyR|~^Whz@y6MQiN5_k_rUJr*%&@G>I{ zu3F}ebhPo-DFc{k+QRN=v#A-KyxI|YhK+dHl&#h4ld}E48*XUI5((7Vw3cu8*PAki zMxmgp0-Nf^#a%W;T=Z?zaM4cr%~QmUTnpsI!p(`6Y3jxwsBZif^XFIUtE%+s^4cZw z)7B18+c5z<01pFp0$SYVW_j!wdq8LC2 z{WBaLaEKAf)AY7~pY2X=)1UWd)1E*Ezffo5 zOuMc}41c4pgKBIGdUTz0>^}7JGeDV&ir#G>r5#86LrUqW>hs#rQCAS3Y1ZPS1BK63 z!!B1%daI)}_p+9JkiGDXD%CP5{DO))3;AhN-FaF}Ky`Gms0-z72=8`k?aI>B?R}QEca7BQA@b7WT{*lb z&UaOdv#~KZoV95&Xs@8px_@7Q(qaYQc8Q))TQJIHe$Z=l#t&Cj8l9w%Z_0`f`7Aj$ zj~9>8w9W0}x!Cc|l@?ylZ+__E7oUD}o$Dct%^_7xFg0y>Xv!Cu?MjNc8x4Lv@lE?V zVnPwa6`%S_qD~(5+J2O|PP=@LE%>3*88w0tA6Las(tum?L_MF(LoJ-vi*C7b>^3+# z1-;}*)E)JC0tSDU^2!0=!;O55g{=JXEqP;}0$C2`Nv1k%ToP34&g}X!<7PHAZIxVtn2DSfo)+G9 z74*{XT>cdE!EPtN$kO)wH0AH;?o$R1y@Hn;UrzT$$dx5Z0jIV1Yl%8f z)VX02;SdJo?U`}yd3KB)76Z_pe7Dh5iuAiL0f1h5%^S&)w* z5#xvV&uQ-dd&EQZ_Wq%n55fqin#;ijp{KbxUiiL10}d?Zy}a(gRB@EH9nkrm_UVB& zj?r*63NVaT9vsp)dHqV$qMKr7%zKsNvv^_5#s-i@ZZl#YNp3OLR%SDs)rQ_E!& me{Bgyt5w3N<41l5C3Tu$w@S5@v61A*fKLDyW0MYLTK@~OjaR_{ delta 6222 zcmb7IdwkTzwP$uWKQ`F}0wg4aB#=Oa1rkCKf$+$KcL_;=7+`t)vf2G5S+dz(W_Lpp z?kzgYGrzOXTV8tJ;s~asB=zCH&XeDJ-0}Iq(UZnU!*aYo=yChU`+be$L!FV9 zU|?d=gyQjGU&JU3xjn7!W+NOMF~}{1N!@8XMHOYFcQAfGJy%rIiS#LsMeI>72Gr5L zB^j~A!S9Qd72I}OWEI#eXw&{dViEPr)a@>2^e~^q&`jE%IgouE&8*SDmP_exnZube zc*w0;V3>}!V7sA5g1Qm#_E_W2R#W$oDq+wYL&|8No<;>(O=1n5FG#2RvUIHxe%5es zX_PfIN%*K>sLTMwwbO=L-iN*dv#xv9xx2A;iUn3nngBK zQ}!3xDyF1*w?AskkuoUdD%e@wUN3jqkyD-32EPj!c;rf^#a*)ae9kc8+m&0PV!k!^ z!T`vf7SmExELX#9DJ>edL%8Vo!zS9-LdN5z%;9-rDU}X?D7^tXDp<^{+yq#v=5-w< z=It+4BG{>pWjm-224})QjoXzXqX9h_=p8Lj0~Tj3{Uz^?-0#7_CL8!C-WR$t6Fh#y zEqi;rje7D6H`YTjQ_g_mOh6f689-%2Kc-AuV=(BKI+$)iDWD0^0%!#U00RIaKr#+I4S!VjNm+*Sa93e1{mB4xC?MM z;C2Q~EC0CcfoPi^Y+M_b+hXSnibZY>gf@8x6dM4_cssaA*P>Cs)|4zh>2;Jnx-3}EP$^yw2$X2RabChRu5-L564$Zk3^x?Sw1bmu0qi}pEhavXr&F2H_H zku-Y8nJtdcSI(T#`krTUmz$CadWP`M@cyK(+2y(`c>h4Hjwv1 zbd*}gED=lSCu7En`{=@$N#cIW8T*z4&P;1ZC@K%p*JCF;4nsK}2$he^6F;EFaU+KB z1or_3S2BBdx4V6Qccb5MYFAYs92XMDXmH^x4um5gg=#TX7Y!y$(NH^bf#>>%R8X{B zoZvOep+iM`#1pXz<3|Y*qZP&3PIO_~JW;RP)xXUhh`RlHm^Yp7_WR{A_(b;DkS-9W}CKFqcbcmP%{B)=Uj6w--b>CpYUyA`6lFV0e%DcE#P+y&J_7N|J*G9 z0M0uA)$Q*=y~|(d1ne_CbulHusu9?3OA5%lw1L6!Nl)osh(97i^yM&#PUsGj8nMDZNToKhQNN+3c zoIi*LRE`!2RMV0}%PI@mu)ESN`o=C)uEC7YojoDn4qg85<8;U~{NqZjuc}(4*VZhl zlb>>1entmo56^j!Nz>*FGzH}s;QpO~XWt6zf6!aAb&*21%n6If=-8ZWi&fCi=j7w( z(wr)7Ae7GVNRJQ0$V^KxZ1%-2mBE07WBCxgSy?A>UaiO=*SrH6>O^XY^E2UK2%wgd z<`;`Bnl`^y8wy4?k8-5Qp_B914?WJ>J;F@zMmj@=v#&Y<)RvPwY5sze)La-00}KcJ zi0)c2UlhcCwP30cPgBam++4Mv^C85vnh8-~ATosmy9umOv|wSYHV)*e*pC;E64`%Y zr3?Jef9Id;v6{B9ugj3izJ#t+Eof4CnJ7=Qf>efTRBB5n7;T|QryL1)1y_4iN3b(h z7J^X(7!N20OaR0K0TqMK5>R95_@e1z8-28BgP0yOs!xdYiQwk}ZU)=}m`u*v!i^Z$ z4e_V}V_wW;!*8@<>#H%SIH$nudVnfJ2mL=|gNv!~FFIWPTaC0%-Q)JO7<#zH9WrDo z#2k5TzL-YIi}yIn!FZTs^av`e%%m3=XAQwD%fB*kzFp52As?nM7ng_%8ooP?W-j?U z>jmglz`-$4_XCaqj`H!BNr9!MqEacJS?aT4=IB2%hD?|9p`z*$q2`l&sRB#QZ8<0f z6`*jJrSTCVtC{G^p~dwXw6|_c?MVpLT%Kael_8BVAEhC~-Kw{7y(ByJaKs%6E1#~k zHh0HWHlN~LSVj!*4QDxS(zUlfC}vY?eHvFb1@*hrW^=f%zwIfs5xKa#KW zPwO|0if0tkJ}fH{3j&q50AMNS0u~B7S~7U5oW+fSJcw`-%k6zKE&Z(aq~rv}=k3!M z;raOhEn_{?8ghH%8C@OwXxSJs1zF|POe<>vLb3t9JjGzznxcFueZVAdK3K~dfZ7k$ zv~b0WVfEae%loMsd`z&J6ym$3cSOtR+=>slG&$zVuYsnTQCCuv47TZfeup|u3tvFX zSmI3lKmMMSf;IhJcj*UE!62N9z+9vS?pSn7D?5tA!9z?EMk zFHEa1(9CMrHi=xpVlEa}!bA;g6{ux2Yt`L zO*5g%C&LjZpIN*oJgw5eG+KEbrJKbZPXofS@d@EuNvKZ&1gqOI+Zp&aT7Y{)m4*+QdG^LdtZ2;8Xb-c^$YHWJ2wc0r#UhE8_KeP^_js6TVi1ztQ9UI{JdDuKl z@A&ug10>p3!Vl?3+VZqcu!&x4o2KoB+P+w7ASklY%||>Dy?2yNq9TxA0WQ;_U{=|+ za@aM%YlNhs&U?Ley<0Yi)m_IW^*(lJ_WPDNEDxZUz4Uo-U9KVzbGyf?bmcut#=y1T z0oojzTe^~aH0}JALOnrL@h%BkyP;*1@tDEb54aaljwp|ibzKoZeoEGz6YJ@Vb$Pj% zP%~NQCygiA7V`P|dfE-mM*t7dBzd!TKg@ShkQ4pk-WxbE_L)o++QX2XAxorQJaSb+ z?U4$HS}?U%57G;fD$x_`A1xMIe0pe3`>>m%3^?Y$kqe(u>u1vem4<3J$u7kom zL)SSkkD-?nfN}(NoZf9O&|+v`q{Q_#SG}%TU!Qkv{`s7`2<7WTuTV{TbN!U;Yg+P2 z_QJEORF(6m$k~xEPGT^zhK?SQfwJzhy|B;|3^e(gFIx%=FN+ym#|-aE6Q^iW*XUH0 z=MC__9WmWaZCyh&RaU%6+qy>PuZ9RGFJHKcy6*A2!(m;&VPBr5H@a#QRZ#O-jo$O7 z$I3T6WYbQ=UkzQ__;xu8qiVj36Fk9aAi{5zfY<1VAMmQoJH@Kz0DjB4y}XbJRd3?O zy!wLsIrZH%mS2SvH?@nGW5+gCS$O%s-0Tq#(aJ6LuBR~#j_W(twBhwEUuCu{G3;(K zlwSJ_G73dxyFRe+H^0Ab8&PE8uKy<5A4_Mc);ZU2s~ zJl+E{IJqw1Cw}+1lGIV42i$FjX>E7=IZe%LZpsmH1>k)u+x2*!nq76msFP4VoD$+a z{s~4V4WO}(k3lM{i!_f4#6@bO8nKhkP^0*S^LVDFw(?H$?w+dcf%i|Dn@K;}{Ym-|DzP|p5>(p%B<9~rown*sXzXEK!ys*3#|SY2T- z?IFo2DEZZ7;2Y{j`5AL}u>UYVrQst|k|il2NwaAEgpx_sfvWATy&s9x`J>Jm%iKD- z8GWBN?R*r6+%nwzb>K~eayPo21!^9sw*lXviMvuh$y7o7ef(Xtp8;$IVEW{bp{TBa z$7u3_qs32go6Abnuti+maarlI20{_}81!&1x*S~DdRidl68=@{dvF0i))ya~Bp#&O z59<6py>M`uV+?#d0V8O^p^^MqFK{SlP>O9~Q0AD2J6@Wk_2}^-}0V#m~fPsJvKo%f}!KKyl z{^#$(>anYeXZ0eU4h8k>s{mCAm_@7a$=p~E5(T+*0h$3QvZX4WHU2JXa2RL~2!9NF1f|Zvb_i ZTmYr^_C-*i06qnLhBsEm{S}9;{|lY3g@6D6 diff --git a/vllm/__pycache__/version.cpython-310.pyc b/vllm/__pycache__/version.cpython-310.pyc index de6fe1d0894e09dc15a2d9173a7293c6e43ec19b..42f846be885642d77121f9b13d62bf15bb6f9dbb 100644 GIT binary patch delta 59 zcmcc2c%G3vpO=@50SFA&?wiP6sbZ{Ol3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEq%hIsge;Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrE QFQ_cZ$j{r%%+$yS06*Rn&Hw-a delta 66 zcmZorY*FOS=jG*M0D{VG4I8;HFlxBzmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtJi&)CQZ0F_o1-2eap diff --git a/vllm/adapter_commons/__pycache__/request.cpython-310.pyc b/vllm/adapter_commons/__pycache__/request.cpython-310.pyc index 46b7e60dce37c9fea87cdff8d32879ee698f96ac..c5beddc2851796a64104cf25c96fffd281854118 100644 GIT binary patch delta 62 zcmdnaxtWtYpO=@50SFA&?%T+n%BbS3Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr*D$wSKPNLu Qzo4=tBR_BRSH`C-0Ak%0mjD0& delta 66 zcmcb{dyAJlpO=@50SGF$HEiTQ#Hit?Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5BjZyR0JcyTrvLx| diff --git a/vllm/assets/__pycache__/__init__.cpython-310.pyc b/vllm/assets/__pycache__/__init__.cpython-310.pyc index 6f5c7c64d266bbc573f6611905711c999a36b01f..6d8da66521d1babab7d2b2e4f99fd5b69d9686f0 100644 GIT binary patch delta 59 zcmbQkID?TppO=@50SFA&?wiPMqhhUJl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEogI7Xb1j66gQ` delta 63 zcmbQiIERrtpO=@50SGF$HB98T(XiJqEiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNUI3jjV!6ZilC diff --git a/vllm/assets/__pycache__/audio.cpython-310.pyc b/vllm/assets/__pycache__/audio.cpython-310.pyc index 4a4f7a8da17b37b934d14befdb8e1549b9c6396f..f0638ff696d3c3ee124fb33cd694cf8940d43183 100644 GIT binary patch delta 62 zcmeys`G%7_pO=@50SFA&?%T-S!lYuMUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrz>% delta 66 zcmZqVYUSe2=jG*M0D{VG4I8;xm^7^QON)#2bMliDbM$jElk^KJOEU8FjP(o+^ouh~ UQgsUwld}`kQ;RnnGo51s0AINjQ2+n{ diff --git a/vllm/assets/__pycache__/image.cpython-310.pyc b/vllm/assets/__pycache__/image.cpython-310.pyc index 644befd731b43d81a1c868912e217d61e7f2d894..7abde64fa33e6f531c52ab6bfa8ce0dd2cd1e864 100644 GIT binary patch delta 260 zcmbQnd6bhkpO=@50SFA&?#syD$lJ%rSUhJueokhRenDkPMtVx`G*8729$SZWwkm{VAKnSvQKStoB`igMur zniHbQ7{ybbnwg$aQXHS3ms6?9TEq$zF9O+I#0Mm9v6kc)C1>1X$;nSlDG~q)gB$=M zgeTiFD=_j+j$=+&7XgWi0*NTLkkq{5{GuXpxH@DVZxfqrpjNvdu^Vsdt3dTQ}xSEdB^A|9X?P3Fnxn4*k%K}^;nRv=XbGQNl( zNZevA$uCOIxW$r_pO{i42oeU_0wF{u=P)ZUa!u}KPFEKNiHZSE PFQ_cZ$j_U6mC+0U8%Yz$ delta 65 zcmZo?>1N^1=jG*M0D{VG4I8-^F={yJmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Tr0NzVCTAz6rxs7X$Y=%tYCII! diff --git a/vllm/attention/__pycache__/layer.cpython-310.pyc b/vllm/attention/__pycache__/layer.cpython-310.pyc index 29f52c1ddbb9fdf745ba0e00aff90ab561945780..38235bbc2d9527658056d59aff8bc439524f035b 100644 GIT binary patch delta 62 zcmZ1>xkQpXpO=@50SFA&?%T-i#I9nkUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr~Oe~uZv2EvMl$cy4aJ;@msF|UttA?$FA&W7asVEmn3+FM` zu+_4G#e{)kjV1gGL{iumG8WgBa4z6VVPD9|$N*9o%mC(d)UYjNf{DOQx(wFE3Dh+g ztcnY&OSG0P&#Z>2L@Y}ji0dWNn93N7)`699BPmg>VNPKzWh^>c!@NK;g=Zm<1y;ig zR>QeKDuoY8HD3)&3cnabia<7V(PgkYL4+*KNfQ{0xT<7R1X6@@q;q9zIT;yhI3pIw zE@Y_Xs$r<%0y^UhSgUXi1Jpl2w}vy+umv+fNEU_?xe1JwK#d>>Rx5(ACK9Z&987A8 zPF^XradWfqTP8;N$%SHtn_r5FF)}WjBw@bUS|XT zII|>Gw;(Y&J25@Ac=KWAA56?_Ol+I?v2EvM)S6r-aJ;^Tt%M)2vADg2a{*Th$3l=kpt@iNFrTxA zZ6Om(1a8tDur4m3u4Q0V+(2FRAZ=o`YmL32Wl`#g=!6R z3S%i_(YYGt1yU)z3xO=K8a}WZ&IQsb{79<#YFJVP#28Wpvzd$TfYk{hWMNL4z*t`- zTqT<#m?E4blPg=x$;eQ{xj=3qLoHVgLk$+nfhLi{$n2)|`wRG4feR>*#fwV)_7uVnLL zF)>EQRg-s#n=^AUacuq|9>OFp&d9(}%mYj$Obu+p9L!A29E@VjMM0CJrMww^Coh+J a$`~~HK8M8QrP9^h)l7^)_@9kY;6DIM$f&IV diff --git a/vllm/attention/backends/__pycache__/__init__.cpython-310.pyc b/vllm/attention/backends/__pycache__/__init__.cpython-310.pyc index 19f3f5445f40b17f9c19a2fc8e9cdfa95d9af77f..c61e24b2a2e74050917e32f81af3f0bd3a064909 100644 GIT binary patch delta 59 zcmZ3%xP*~ApO=@50SFA&?wiPMqvEb#l3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEohz5&-#g6Bqyh delta 63 zcmZ3&xPp;8pO=@50SGF$HB98T(eTzUEiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNTd2>?ba6es`y diff --git a/vllm/attention/backends/__pycache__/abstract.cpython-310.pyc b/vllm/attention/backends/__pycache__/abstract.cpython-310.pyc index bb167591f89ab5315bf285b888124f82a27f5062..ecf40f5f231d03460830a417a0846a814c926b00 100644 GIT binary patch delta 80 zcmez1^va1lpO=@50SFA&?%T+Hj7h~^za+OnzaX*D$wSKPNLu izo4=tBR_BRPo{IcJRCq>Yz#b1eE-=PH(wQ)EdT%~;u)g= delta 86 zcmaFm^udWcpO=@50SGF$HEiTQ#-!n`Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> nlB!#fn4F!Mo?5*5E7Lh%K9E*61}-M1e|(H=|2Ll(m@NPR$DS8FBbz47_Qy7k-L;##Z$i|w?Mxjvp}~bu_!&YMAtmGG$YqAw_HCb zGfBUovLquvZ}STF4oO}v9)bT%j7$woU%2=LHrpy5=3(@i%&4c!!okSFxY$gDEc~)8rQ4QWgP5CYH_reW$Si00aUe(EtDd delta 132 zcmeBO$~bi?BX>S8FBbz4RBmh7$X&{=;j3R-T%@0qpPZPZpOcxSUrU9>pMz<$ ko}Rc6GaD1vW)BBbUPhM5b-tx+Jd7;=nOHY}_npQ90A_b8FkHKDBllD`6;J(=+yecA%mUq##G>@n5?%A$(u`cg+;aV# z%q0DS%94!yyv--rX6Q3UO-?kkWZ_^GV%)sIte%mXkBM)yl0~l&Q=ZA@jb6Li02dA) AIRF3v delta 103 zcmaF1i1E!LM(%uGUM>b8sNB}Dk$WnehOd5UaglybesW@teokhRenDkPMt+{Lo}qz$ zab`)XZb4#lc4B&J@#Z6JGxQl_CdZmtvavBT{TE`|Jj<+}k(q}{V6%)xuMkt=<;|;*_Cjr=#M-|utZjX~A7DpWhd=z8`YXXn~ za0Yx4d=eA@WD#oweHDBakO6WdlZO^R0W7n}7K8=@{s5Cr9Wn$C0Sp0?g&j-*2(!{1 FGzO<#F5dtE delta 159 zcmV;Q0AT?^RaA9L>VP|D?v(f{X5CPm-IE&?Cjr@$LlxKrkO6UMlN}aE9S3|A zWCm*jkO6Q9d=Y#S6aZuqYXp52d=-!ZawL<17C!+kv%waG1_A&9lSdsg1`GiL{|o|? NeH}~z3bV=`GzI`SFgXAK diff --git a/vllm/attention/backends/__pycache__/openvino.cpython-310.pyc b/vllm/attention/backends/__pycache__/openvino.cpython-310.pyc index 2b35a080619468fd2c708de30dae1f66614ca242..c57a295b2a9d2c23fff8a48862cef672f793ef05 100644 GIT binary patch delta 62 zcmZ1>zeJuppO=@50SFA&?%T+Hmr2E4za+OnzaX*D$wSKPNLu Qzo4=tBR_Am0P_qU08_0LNB{r; delta 66 zcmZ1?ze1inpO=@50SGF$HEiU*%cSA0Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(_hj|7M0H%Z$SO5S3 diff --git a/vllm/attention/backends/__pycache__/pallas.cpython-310.pyc b/vllm/attention/backends/__pycache__/pallas.cpython-310.pyc index 08e0554a84b195e4cb71b8a41433267d8b8e6d00..8d92265b6c3370d01d3222713bb5cd99e7641378 100644 GIT binary patch delta 62 zcmca+dC8JHpO=@50SFA&?%T-yjY-8-za+OnzaX*D$wSKPNLu Qzo4=tBR_AmCi7ZJ0D4{(DgXcg delta 66 zcmca)dCihLpO=@50SGF$HEiVm#-!n?Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(Fm3gfs0MF4DIsgCw diff --git a/vllm/attention/backends/__pycache__/placeholder_attn.cpython-310.pyc b/vllm/attention/backends/__pycache__/placeholder_attn.cpython-310.pyc index 5ce3aa730bf91232c8fe44b8149b749bfd9c03e1..3a982f1df732508891ad219837057f52c639010c 100644 GIT binary patch delta 62 zcmZp3Y;xqz=jG*M00P6c`!;gBGpqRPm*f`c7i1RbmLwLXr*D$wSKPNLu izo4=tBR_BRKbF%9%p6P{o6o2| mlB!#fn4F!Mo?5*57t3h{W;Q0S%_mf!@&Flpn>QGxa{vIBUmM&2 diff --git a/vllm/attention/backends/__pycache__/torch_sdpa.cpython-310.pyc b/vllm/attention/backends/__pycache__/torch_sdpa.cpython-310.pyc index d0524c213c8127df26b3865c6f8de45b3fae29ea..2647e0a560cbe33a81071dbf7e924133ca4e9925 100644 GIT binary patch delta 112 zcmZ3KGbe{TpO=@50SFA&?wiQHQ!Y=Gg&|d{GK!G_1XCDOxN<~tC8H!686p|-*f&1X zXIAmlFUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>EFQ_cZ$j{qs$?{%}al&Lx?NAmz MMmEOHE!y+A0F~As_5c6? delta 118 zcmbP}vnYotCTsb1Sl2MY343P|li5nm3 zGi&(jmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>}r0NzVCTAz6rxtHEWqGg0IBBw~ Sb|@PUBh!C2rpbpeY3rDgn#T4n-MbJ1;NE15%Q_aPv}{ zT4k)3YKv$+{-_JLj&;U`^EUn(b?J0m_+!RJy7C`zMrYKG&UnA~QEX8bpE>uObHDf8 zb8a4A$3KhL7#>gc1LCjuqc1S zs&6wkO7HFNXQS4SyQiIOjQ06DT8|^?ao{n5vU|bcSo)ZOp>pR8{|~03|waf6ld9)N@t~`>@71!^HKm!F znn@Q-{v^a?jZs*Tfl2iP>V_&aLm;P3!rbi&_vR+jcC*4sT( z8ti7+7eVMLU>=YS!jZAMVnJ7vTHY*jJ*6&kEx*Jyq$GeOFhO_xA@>5zI8`;4V_OzjAzybR8=*IwLTtqP zqRGKnl)h>n7W})prCH8Uc4ZH;B^qH((Zel2h0h98VX|WrikDwN%jnfjy?zu z`($V33%HEXy7haomj&XmrS6NcUIMNNh&!#*SlgjJad>2cZ0S`jU!luw1GeBg)>3f8 z`lijp#*jb9pN9MYWGl-RNh4oU`K!o4@_)ts`+IEh4TS9zXny~vY|^T2zvyU@4<22f z5uX)IKjt>YNDa=j^nT}F_eE@r((TSOLoXv*k1p#ubeZ3M0E*L|t!#)qV#j;CMp|f% zZCF2t_Bo>OK=Cc$ZGjoZWtV@y`_`7ERFkFekleH;4}R#Fz^<(h-6L7SUx&VI%l*3i zCIUOOZqSjgg*7=6uLvt_LQHH;STjmJ=h#pHOaMPd?f~R3@OfA-0Ox`0K!rfrDLzfy zh2?9&8vp^Uws1r delta 1669 zcmZvdT}&KR6vw@@%TRVf7Pqia78XKbnSQW^Qj`jzr7bMAMQKq9woHd*fep(H+!-QN zltxt43jH`nB{9aB_)v`xW|Jm0G4a8NrWz9;>cjZvqwz%_H1S36|4zHKr2Fv8x%b@j zzvrBL=k7NbzPk{#N=gEciQm%AOJ4{7^ff0F3pP(=t(1{XWHaN5xg}@XG7q-29!S_3 zC%u2pNX-~iX**ZvANMhrRtuA?HTPp-BV!%(*N%T!JN;hN8EqAkyhA`M;ZMSj15W{+ z)DzfXUAdnEcNjZLo5hC&hZ@4U--=;EujWs8*un*`JaMekR&l(Qz$INjW3+*}5 z1yhRd6_ys_1DJRQI0eLjFfasQ=g}g^nn{~_Hf@R|Zil*5nOP$?r<$^z>0LSP=r>pAo7PjtoU_0)=9H#*>C5hvLqwty)=An| z{Yzp@m>QD@(x;X3C3t28T>s=kHp>rVYyn<_sWlp7^E4DK4`wl&0cL4FTCK{9bWzs$ zd32JEP;pIv4fNb1T~B2V8`VMOeo`ay_O8~1SsZs`SZtr~`vb=&TW?^War(A)S8S`z zURU9ft(LcTn*Odm6~+0uC5Gde`fS=UaACB7S6q_DV)YHnhQrdh3pL zuXkzw8hsY)4#}eAX|Ez;O{T2W)v~C}NN)KCJZ}PT35e>}sH=W&`PKs2y0@|5U0Sa1 z@I==zmZIyjXLsxW?M28iABE>p$~)YGlr^`c^9`(cw0>E`0Z)G&YrIW_{w+3;3+}$C zRLeV#b`Odd1_wQ=I%(6kI5+9jrdstCgeB?wrgQ8as*hL4wmKliwq2sj^iq6=D? z*D3uUA@&2{LxDlf?%{|-1^gQHWdk18<(qJ9 z)4EP=`zKdq|4W5iV}0UyE(vQ;3v(L*4zK{=!{Z7dzqS=vuLCaw?*Rn@u1~x>+>hZ^ zfPnXb%fJ=jI*?C=zDxuZzDNx%&$30bTh6F$@Xyc>Ez7F>z@DbliDpgiBlm8CKmS+2 QyD-FS!Fzy3@eX|aKVBtv&Hw-a diff --git a/vllm/attention/backends/__pycache__/xformers.cpython-310.pyc b/vllm/attention/backends/__pycache__/xformers.cpython-310.pyc index 19ce1069d8bdfcfeafdc6d459d8214f0b775d7b1..e6bb8877515f81adcf73783b73e07017e73dd54d 100644 GIT binary patch delta 123 zcmcaKiSfiFM(%uGUM>b8FkHKDBllz$6?grT+yecA%mUq##G>@n5?%A$(u`cg+;aV# z%q0DS%94!yyv@g0SOmlyfV#MtSQxpO*qFJP_!zku`55__g(iO#5uGH;wn@~SNyq_N M30Qiww>Y~I05q{1y#N3J delta 126 zcmX>xiSg1TM(%uGUM>b8sNB}Dk$WR_pO=@50SFA&?wiPMqvE7rl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEohz1OWDD69fPN delta 63 zcmbQwxR{YUpO=@50SGF$HB98T(Qwl*EiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNTd0sund6chje diff --git a/vllm/attention/ops/__pycache__/ipex_attn.cpython-310.pyc b/vllm/attention/ops/__pycache__/ipex_attn.cpython-310.pyc index bb52c4940b56f43c447fe2d8d5a707e7b4740275..34922a6ee7c20e8948133d03df3c55e42ad9a25e 100644 GIT binary patch delta 62 zcmca3dqb8xpO=@50SFA&?%T-yjY-8>za+OnzaX*D$wSKPNLu Qzo4=tBR_AmCi7-)0B^<=^Z)<= delta 66 zcmca1dq UlB!#fn4F!Mo?5(Fm3cEa0K|b71ONa4 diff --git a/vllm/attention/ops/__pycache__/paged_attn.cpython-310.pyc b/vllm/attention/ops/__pycache__/paged_attn.cpython-310.pyc index ddc8a86322ba9a27a0c3c1f3d6ee89d62431faf5..5fe7b1e37fa432dafc584e8f5cafb7a52b745dd8 100644 GIT binary patch delta 90 zcmeyS@j-(-pO=@50SFA&?%T+%#iZh*Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS sUre?HiW> diff --git a/vllm/attention/ops/__pycache__/prefix_prefill.cpython-310.pyc b/vllm/attention/ops/__pycache__/prefix_prefill.cpython-310.pyc index bb82b227e276412b7b2dab2964aaf32bfe175136..b31f3a18b07380e0572d63d51231df04fa8fb62a 100644 GIT binary patch delta 78 zcmcZRdnuMXpO=@50SGF$HEiS#=GE}gFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` pN!2Y#OwLYBPc7cu#2YThxN7n(ZAC6FMyCI4K+M6k`M>r_CIIxc9Vq|+ diff --git a/vllm/attention/ops/__pycache__/triton_flash_attention.cpython-310.pyc b/vllm/attention/ops/__pycache__/triton_flash_attention.cpython-310.pyc index 33c30d579e77ec7d9c687b795edb911ffba47b50..f8bd2f51275a0b25ff5aee7fcca8d9b702d9ad46 100644 GIT binary patch delta 69 zcmbOlI5ChrpO=@50SFA&?%T-yltm>#za+OnzaX*D$wSKPNLu Xzo4=tBR_Ak1gi{F9^+;y#cFl{__P)5 delta 73 zcmbOjI5m(vpO=@50SGF$HEiU5%AygXUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> blB!#fn4F!Mo?5(EgjI&Auy(VUVl_JeS34JX diff --git a/vllm/attention/ops/blocksparse_attention/__pycache__/__init__.cpython-310.pyc b/vllm/attention/ops/blocksparse_attention/__pycache__/__init__.cpython-310.pyc index ec2a31a7434398f1c59f987feea94220cd97c3cc..4231da05daffc0602b56bfedffabdd4baf767da0 100644 GIT binary patch delta 59 zcmdnVxRsGRpO=@50SFA&?wiPMqY|NCl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEohz3jhP&6I=iQ delta 63 zcmdnWxRa4PpO=@50SGF$HB98T(TLG6EiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNU|1prY}6l?$h diff --git a/vllm/attention/ops/blocksparse_attention/__pycache__/blocksparse_attention_kernel.cpython-310.pyc b/vllm/attention/ops/blocksparse_attention/__pycache__/blocksparse_attention_kernel.cpython-310.pyc index 71fa12dd917320cc2a0c9e45bcf4e832b0de48ba..45bec7c65b57a8046d34358f51045ea27bc9d678 100644 GIT binary patch delta 153 zcmaECeA}2ipO=@50SFA&?%T+%!z7a@Tf?w`C53SzV+|vO&Som=tzoWZ$rIQd%p}XK zlA~XeTcBT%S)f~zSd^YxqHCU8nvrXmTdtpznWSG(S(1^Tw|NHZG8V=elkK_Uneyy6 zFW|~&WRCO$i*ne$g!D|{}vYjqzfz2 delta 165 zcmca@{MeW~pO=@50SGF$HEiV8VUj7FTf?w`C53SzV+|vO&Som=tzoWZDV)1Gm`Rpd zqd>p3xJW-IKRGc+KPNLuzo4=tBR|hr&(J`>II|>Gw;(Y&J25@Ac=Ht2Wh{(yCR=mG zGZp4dF5ptxe1OZFkzKJyVgh3k<75FIEtUz4g^oam%H#wdMMk~NO*~~xoNSCNj9iRj Mj9i-;`EPLn08djdV*mgE diff --git a/vllm/attention/ops/blocksparse_attention/__pycache__/interface.cpython-310.pyc b/vllm/attention/ops/blocksparse_attention/__pycache__/interface.cpython-310.pyc index e01d62472321f02a16e844e44096b800e9591b97..825470f062ff6ece722f72c07d922c5869c2b6c7 100644 GIT binary patch delta 86 zcmZ2tInRnj24q$iz>44F|sgj780Ap1^{^l8HoS@ delta 91 zcmbPdxx|t?pO=@50SGF$HEiTAV%3P%FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` uN!2Y#OwLYBPc5FjkTr&xgOOts+cSPftI5wr71?+gnf|jdZRQc1#0CHeMH`L) diff --git a/vllm/attention/ops/blocksparse_attention/__pycache__/utils.cpython-310.pyc b/vllm/attention/ops/blocksparse_attention/__pycache__/utils.cpython-310.pyc index 306f34687d3fe37e23de0238ed84a28204a1d14e..3f9fde49c9bb4d82e2438c125f2248d0877bf9b6 100644 GIT binary patch delta 62 zcmX?XvfqR|pO=@50SFA&?%T+Ho>?VSza+OnzaX*D$wSKPNLu Qzo4=tBR_956N{r50BMU9PXGV_ delta 66 zcmdmQa@d4BpO=@50SGF$HEiTQ&#V!tUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5AG4zv0KwxHUH||9 diff --git a/vllm/attention/ops/paged_attn.py b/vllm/attention/ops/paged_attn.py index 1741dd1..c90e8dd 100644 --- a/vllm/attention/ops/paged_attn.py +++ b/vllm/attention/ops/paged_attn.py @@ -4,7 +4,10 @@ from typing import List, Optional, Tuple import torch from vllm import _custom_ops as ops -from vllm.attention.ops.prefix_prefill import context_attention_fwd +from vllm.triton_utils import HAS_TRITON + +if HAS_TRITON: + from vllm.attention.ops.prefix_prefill import context_attention_fwd # Should be the same as PARTITION_SIZE in `paged_attention_v2_launcher`. _PARTITION_SIZE = 512 diff --git a/vllm/attention/ops/prefix_prefill.py b/vllm/attention/ops/prefix_prefill.py index 9a39e2b..a2a649c 100644 --- a/vllm/attention/ops/prefix_prefill.py +++ b/vllm/attention/ops/prefix_prefill.py @@ -808,8 +808,6 @@ if triton.__version__ >= "2.1.0": ) return - import time - ts_beg = time.time() _fwd_kernel[grid]( q, k, @@ -860,6 +858,4 @@ if triton.__version__ >= "2.1.0": num_warps=NUM_WARPS, num_stages=1, ) - elapsed = time.time() - ts_beg - #print(f'{elapsed}: {BLOCK=}, {Lk=}, {Lk_padded=}, {BLOCK=}, {sliding_window=}, {NUM_WARPS=}') return diff --git a/vllm/attention/selector.py b/vllm/attention/selector.py index d1a0bd2..ae90e03 100644 --- a/vllm/attention/selector.py +++ b/vllm/attention/selector.py @@ -204,9 +204,6 @@ def which_attn_to_use( if selected_backend != _Backend.PALLAS: logger.info("Cannot use %s backend on TPU.", selected_backend) return _Backend.PALLAS - - if selected_backend == _Backend.FLASH_ATTN: - print("selected_backend == _Backend.FLASH_ATTN") if is_hip(): # AMD GPUs. diff --git a/vllm/compilation/__pycache__/__init__.cpython-310.pyc b/vllm/compilation/__pycache__/__init__.cpython-310.pyc index 004a0887615015f1eccfcf3f84e90e809067dd1e..8f5fb174fd9d28bdf8caf5281e96aa7e5f8ff27f 100644 GIT binary patch delta 59 zcmZ3;IG2$-pO=@50SFA&?wiPMqvD`nl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEohz2mtjj68r!F delta 63 zcmbQsxR8-MpO=@50SGF$HB98T(Qwf(EiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNTd1OP#j6bt|W diff --git a/vllm/compilation/__pycache__/backends.cpython-310.pyc b/vllm/compilation/__pycache__/backends.cpython-310.pyc index 1b80e5836bf81ff36fbda5043e567182eb279cb0..3cdd64f25009c68e06e082ef0a37b33d0d745d52 100644 GIT binary patch delta 77 zcmcbnenFi(pO=@50SFA&?%T*M%c0_+Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS gUrTXEa{~Z1pc-2M diff --git a/vllm/compilation/__pycache__/compile_context.cpython-310.pyc b/vllm/compilation/__pycache__/compile_context.cpython-310.pyc index dc22671e4788dbd00ffcb9764367104639a525c7..237dede535d9ef8b7d59c70702638b11761a9496 100644 GIT binary patch delta 62 zcmZo?Yi8rl=jG*M00P6c`!;ejF{-%hm*f`c7i1RbmLwLXrYiHxm=jG*M0D{VG4I8_ig0f$ExC_Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr*D$wSKPNLu Yzo4=tBR_Am2HPJdraZ>YYMftK0sqhz{r~^~ delta 74 zcmbOxH%pE?pO=@50SGF$HEiVm%Btb4Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> clB!#fn4F!Mo?5(Fh3yX$Q=!IYCC)Fb09*MOGynhq diff --git a/vllm/core/__pycache__/__init__.cpython-310.pyc b/vllm/core/__pycache__/__init__.cpython-310.pyc index 9f6eb9f54e6e1c4a5e0700e9d9758ea7c4aee753..41f568833782bb5d1ea2f7ad1340efed190e8b50 100644 GIT binary patch delta 59 zcmbQmIE|4zpO=@50SFA&?wiPMqhhIFl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEogI8vyX@65s#; delta 63 zcmbQnIE#@xpO=@50SGF$HB98T(XiDoEiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNUI4FEj)6Yu~4 diff --git a/vllm/core/__pycache__/block_manager_v1.cpython-310.pyc b/vllm/core/__pycache__/block_manager_v1.cpython-310.pyc index 8c402a8d92d8a07a478f3022641f8f599978a21e..8c4fe9ec89c0a8f5797e329a7c268d8e7f79fc45 100644 GIT binary patch delta 121 zcmdlwhjHy3M(%uGUM>b8FkHKDBX=9Cilcr>Zh?M5W`S-=Vo`c(iLQBWX-2MLZn=I= zW|DqEWl2VU-sYXG0!l(kKwVs{Y)m|iJd9jG$j7+(uKH09AtRtT8yirRNrZ`wi4RC` S-e&Ngib8sNB}Dk-Lpm!&SeuxJW-IKRGc+KPNLuzo4=tBR|hr&(J`> zII|>Gw;(Y&J25@Ac=J|P0VNR?piVAUHYOfM9!4%k4o0T`d`z3Ks~_bMF#*c3u>r-I bM3_MGO#gY9H?K2z&&ABaF0^@pb*~TrB!nQ^ diff --git a/vllm/core/__pycache__/block_manager_v2.cpython-310.pyc b/vllm/core/__pycache__/block_manager_v2.cpython-310.pyc index dd98dec979891e845fd118842fe23fe13f1c2db2..7d29f4e038fcfb90e01505b86e1fec18249f468c 100644 GIT binary patch delta 62 zcmbPS)?db*&&$ij00f3>_if~k=TmXiFUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E QFQ_cZ$j{q6iLX%y0AKVJ>Hq)$ delta 66 zcmeA#n_R}7&&$ij00foW8a8sr^J%#1mlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtJS<7?Cb0J8fP`Tzg` diff --git a/vllm/core/__pycache__/evictor_v1.cpython-310.pyc b/vllm/core/__pycache__/evictor_v1.cpython-310.pyc index c3ea008442750765187d9d35a03a4d5413b2841a..2caaca764921766ff886aa674f7834c6d26a89ac 100644 GIT binary patch delta 70 zcmX@5a7=+apO=@50SFA&?%T+Hmr=!9za+OnzaX*D$wSKPNLu Yzo4=tBR_Am08;}eQy%B$N!&YF01xLD>Hq)$ delta 74 zcmX@6a7uwYpO=@50SGF$HEiU*%cx clB!#fn4F!Mo?5(_hpB;+sZeioANLLx0Br>r9smFU diff --git a/vllm/core/__pycache__/evictor_v2.cpython-310.pyc b/vllm/core/__pycache__/evictor_v2.cpython-310.pyc index 6f0fe90e23b6d7725256dd9bd1b1780b96a2d4e6..d0da42db3466c8381c2f562423030a7efc921cce 100644 GIT binary patch delta 70 zcmcbqepQ`2pO=@50SFA&?%T+Hg;B*?za+OnzaX*D$wSKPNLu Yzo4=tBR_95JJU2CraYd_^ZBe;0U5v+vj6}9 delta 74 zcmcbrep8)0pO=@50SGF$HEiU*!l+@dUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> clB!#fn4F!Mo?5(_nQ0miQ=!@B*?d;40C$KN>;M1& diff --git a/vllm/core/__pycache__/interfaces.cpython-310.pyc b/vllm/core/__pycache__/interfaces.cpython-310.pyc index 444f4a8e3b5301acd492bbec6c7f40456634c9f6..7fed706c1da60d0ceb4ec9e86dd9d669e3837ce9 100644 GIT binary patch delta 62 zcmdn1x>J=qpO=@50SFA&?%T-yh)Km-za+OnzaX*D$wSKPNLu Qzo4=tBR_AmDDw(_0AHpQj{pDw delta 66 zcmdm~x>uDupO=@50SGF$HEiU5#H3-bUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(Fka-0^0JAw2p8x;= diff --git a/vllm/core/__pycache__/placeholder_block_space_manager.cpython-310.pyc b/vllm/core/__pycache__/placeholder_block_space_manager.cpython-310.pyc index 34b1c478da56c9d03f49faa69d6af4f9af7cad46..923858d68061d4f3a4c8cdc7f7d624f0cee555ec 100644 GIT binary patch delta 62 zcmeyX_*0QPpO=@50SFA&?%T+Hnnfi*za+OnzaX*D$wSKPNLu Qzo4=tBR_BRKbHU80Dx8&L;wH) delta 66 zcmeyV_*aoTpO=@50SGF$HEiTQ&7u*aUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*57t4Qc0M*GCQ~&?~ diff --git a/vllm/core/__pycache__/scheduler.cpython-310.pyc b/vllm/core/__pycache__/scheduler.cpython-310.pyc index ac0dc4050f7b5bbf49952a5987d041b6ab6f290a..0f0d191743a487abf12241d567d2537d659604f4 100644 GIT binary patch delta 809 zcmYLHK}^$781Dbpb*0-_Hw1+-=Kw(?WbR;O8_@tU1e6OyC8CMI6zE);-GE5mP=SLn z!C;<7V@&MgMME%XxtI_S9!!iTLcExGP!lgE1`p~^3jUoK+ob)!|NY?2O6#NicMc=p&nXsw9^Gs#piHJob5^l5`kQo|LjXTx} zSvF|`M~DN2b%9KT*p;&F?C91K<9Jz91yS9`&Aq2Zc*pXMOK^hChXd|}`ilM_I1K`ddqnz%g4r(N1V% zqfx)J=b!C4(0YtqRJX!1YiW)GVUx{%UIGWO`_1(TSDK#_b&=g@Ss`khake!qz-^|t zxAHPb7UN61ohRx6Bi~ue!z1SFsR-va`7*~5W-yaP3i&jVAEqtg6&1!SX&F{Zv2EmDbK Y92#FPBC2dyE?;+9#IL+@Yp&7y2ZDU+I{*Lx delta 786 zcmXw1O=uHQ5Z-y&-E22$vx)sn)0&22Y*3p95!$3gY7bH&m!_vQf-xy=H=$`ZsnYra z{h=U;wEDz?2iXXo3PQW;LBxZ2Dg`AT+lxP-pkfamyx2HN+r7-p_r95L-nY-#An!Mb zC0k!FbNJ1@T-dZs2;E`-Y+mzcvdKiopP9PupP4I6W~a~h1bY4XslxcVnM5+3m>AC+ z4~2O}v0|sl5h4TmCxTcpPBv%TNG@Qk_Fj`(}g zTcK99Ic0KkdP}K_w5rZDudT3O{Z2Sw=HMCMCNerxCPZr)B{w+Ci0-N4B>*lZ6m8U^ zy<%fQmt_xUbfx%N$Zxa7pfifKeu^qJ9u)1=uKhv8OBE`VNYOzZh0|(xnrOdio!)lH zn--{ioKsu=FYX+}9v8JzQ;BGI*pFZUysRS>fnk;ox$9%c8?J#CGuA`80B=~|V93i8 zi8w?N_==Sfu<{ZR%q4Od9VU!;!qx}R0?*zJz9qR`cKgx?3`T6IUxY{O!SImSfGn9e zc84uI$*maQBVHc1m~F&s4pR{&!)##Wqiqq_3{zX7S#8DZ=&U{JhE+BY?YLZ~lG;{O zC`r|!EzhoSOMoW1YSoLQ%Bhv9k^(dtBU%hvxnQPbxyDr6(}GrJdbF$S69v^xWol2! zcS-(BO|v#v+dt~xXJ4Zpi-HPv)q&e7Oc`wf8|xmu+JXD#o2aP!sJZ$>P(fIRsw(m# z#*@*DX4qz*$0F!PZ`|V&@!}1H9LPe|u&Ql{pn;^q8k%_UBT#}W}>g%kTDB-LIlM$QVkxbGF$?)BLT}N_m*D$wSKPNLu Qzo4=tBR_AmI#;_U0DTD+CjbBd delta 66 zcmZ3LzAl|RpO=@50SGF$HEiVm!l~h=Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(FnX6qB0MfJ;Hvj+t diff --git a/vllm/core/block/__pycache__/common.cpython-310.pyc b/vllm/core/block/__pycache__/common.cpython-310.pyc index 5ac6490a780699b020ac7ebd9fdaada6c4d5796f..61171accf208778a1fd0efda2a185feb02d06a31 100644 GIT binary patch delta 62 zcmeCn?8@ZM=jG*M00P6c`!;gBF{#+*D$wSKPNLu Qzo4=tBR_Am4iA$70Eadd UlB!#fn4F!Mo?5(FgNMlg0Nu3}^#A|> diff --git a/vllm/core/block/__pycache__/interfaces.cpython-310.pyc b/vllm/core/block/__pycache__/interfaces.cpython-310.pyc index 5b72ccfc9e91d0f84456d8f6cb70e5ab55fd12b5..209e865396714efa17c12a64dcaf83f4e741b85b 100644 GIT binary patch delta 62 zcmcZ^ay5iIpO=@50SFA&?%T+Hl1ar;za+OnzaX*D$wSKPNLu Qzo4=tBR_BRAEsD!0D{XE#Q*>R delta 66 zcmcZ_ax;WGpO=@50SGF$HEiTQ$)w?`Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*52UDy%0N834)c^nh diff --git a/vllm/core/block/__pycache__/naive_block.cpython-310.pyc b/vllm/core/block/__pycache__/naive_block.cpython-310.pyc index 859d45abe505be2c8625a7a5daa051762a99cb90..b6ab38de37619ff9908459c61e2e922cda385654 100644 GIT binary patch delta 62 zcmcancBPCvpO=@50SFA&?%T+HoI}M)za+OnzaX*D$wSKPNLu Qzo4=tBR_BRFOE1P0Fx^g8~^|S delta 66 zcmcaocB70tpO=@50SGF$HEiTQ&Y|I^Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*58%LZG0O{rzEC2ui diff --git a/vllm/core/block/__pycache__/prefix_caching_block.cpython-310.pyc b/vllm/core/block/__pycache__/prefix_caching_block.cpython-310.pyc index ccc5f07350722665b8124c92c293d72f2e56e8cd..ef023112acba34c1dc517d1d4868b4408c4879d1 100644 GIT binary patch delta 98 zcmZp<&iLmVBX>S8FBbz47_Qy7k-L&v#aq85w?Mxjvp}~bu_!&YMAtmGG$YqAw_HCb zGfBUovLquvZ}S@F>DCe=KwT`{9E<`iT#Q_dEQ~DwIhdFlSQsZ?kd)h8YtOC&0Nd0X An*aa+ delta 108 zcmex!jj`oABX>S8FBbz4RBmh7$X&^-;jdp>T%@0qpPZPZpOcxSUrYpiUNU4n_eM4o0T`TudxLlIb4@3sVCNW0m>jM0uIb IrS|MP03QY(^8f$< diff --git a/vllm/core/block/__pycache__/utils.cpython-310.pyc b/vllm/core/block/__pycache__/utils.cpython-310.pyc index c5f938659f53a697276efbb5b7fb2bd05fb28f00..bf15d4d89cb0cb686f3460d8a840fc25e3ea8f30 100644 GIT binary patch delta 62 zcmeys^M;2zpO=@50SFA&?%T*M#H?bYUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrz%3pO=@50SFA&?wiQnqT--ml3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEq&482}^76es`y delta 63 zcmaFK_?D47pO=@50SGF$HB97g(Qwf(EiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuOg93;=VU6*vF@ diff --git a/vllm/distributed/__pycache__/communication_op.cpython-310.pyc b/vllm/distributed/__pycache__/communication_op.cpython-310.pyc index d3c14b3d6fcc702777d2ec84a969402b89fba9c7..52ccfdc211b24fef223dda2f64ac0c7a34f9c911 100644 GIT binary patch delta 142 zcmZqWZsg|9=jG*M00P6c`!;g#U{vwYFUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E zFQ_cZ$j{sSnsGKGW7On!=0HZl$v2s&>j?o(C=vz{Aj2R8H;5$$B&313m<>p9F|#o8 aF&2qUp2uR#C^GpDi!+-bSkYuv)&u~x$RS?< delta 146 zcmZqVZsq3A=jG*M0D{VG4I8<4FlzYdmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} zr0NzVCTAz6rxtI1&N!Qq@z&&K=0HZF$yb@D>j?u*DG~t@AOj%;H;5$;B&313m<>p9 eF|#o8F&2qWp2cFzC_4EDi!+-LSkYuf)&u~7CnDnj diff --git a/vllm/distributed/__pycache__/parallel_state.cpython-310.pyc b/vllm/distributed/__pycache__/parallel_state.cpython-310.pyc index d3779a13962bcfc92211f81514e3c8775a0a1b8e..f696dc6c037f430b9170ffa1a5a545a7b380d44d 100644 GIT binary patch delta 130 zcmezUjPdg`M(%uGUM>b8FkHKDBX>E6ikp5(Zh?M5W`S-=Vo`c(iLQBWX-2MLZn=I= zW|DqEWl2VU-sV*tk0hBnnAkS=D}9t@^qbu1V9p}ID8RURpM#8&iXPB7E>1Q^mj7%_ cEQ~<-pM{BsnF-8dVq*En@}GlcQ*yNc0E=)W+yDRo delta 139 zcmezTjPds~M(%uGUM>b8sNB}Dk-MBj!%M%kxJW-IKRGc+KPNLuzo4=tBR|hr&(J`> zII|>Gw;(Y&J25@Ac=IxjN0Q8JOdOlLl|ITc228GXFlXaqWcn|_w0VbvjFOrG&`>T; kHb$2JY)mYSK=_}9iG!KtKNE-tBLA`c<6zzVBdJ;d02YNP-T(jq diff --git a/vllm/distributed/__pycache__/utils.cpython-310.pyc b/vllm/distributed/__pycache__/utils.cpython-310.pyc index 424b3ac9edaac135100b2c2ec1afc6abe7f331c6..c4fac5b03978519367c446f8895585a7379a041b 100644 GIT binary patch delta 62 zcmbOuHbaa%pO=@50SFA&?%T+{j8Vl_za+OnzaX*D$wSKPNLu Qzo4=tBR_BRO-5%<06_H=O8@`> delta 66 zcmbOsHb;y*pO=@50SGF$HEiTw#;D<_Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5Dx)(e0FoRPTL1t6 diff --git a/vllm/distributed/device_communicators/__pycache__/__init__.cpython-310.pyc b/vllm/distributed/device_communicators/__pycache__/__init__.cpython-310.pyc index 58d43096a89571bcff2c0ec977ff767873803216..2619583b2e1c7c4eb825d60fadb4846d5e0fd30d 100644 GIT binary patch delta 59 zcmdnSxQUTFpO=@50SFA&?wiPMqY|oLl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEohz9RLCf6HovE delta 63 zcmdnQxQ&rJpO=@50SGF$HB98T(TLP9EiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNU|4ggPD6kq@V diff --git a/vllm/distributed/device_communicators/__pycache__/cuda_wrapper.cpython-310.pyc b/vllm/distributed/device_communicators/__pycache__/cuda_wrapper.cpython-310.pyc index f0c42255df0df528a1f113a63e08d5e6012d88f3..b88d48c347efb91ca3df0d029f54cc07fff088c7 100644 GIT binary patch delta 428 zcmZ3dwMvUSpO=@50SFA&?%T+n!=w_aUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUrID-f`5Wxp0_(3d?Y!`^(KDn5$LlSP{E!L#UqSQ1^ zW{ANalSTMF8GRp6FfOjNCoKj$wKoOy(Sw82eVm&%&^fyya$OV9e10iw`1lG#H9Z{;-N)i+M delta 65 zcmccOaKnK+pO=@50SGF$HEiToW!6a2FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` TN!2Y#OwLYBPc2>?!Ym5_o8c7; diff --git a/vllm/distributed/device_communicators/__pycache__/custom_all_reduce_utils.cpython-310.pyc b/vllm/distributed/device_communicators/__pycache__/custom_all_reduce_utils.cpython-310.pyc index e215e78509374015c962a68cd6aee1151fc5772d..44034d54cb45ad081f002fab76e49fe98a4b3cbd 100644 GIT binary patch delta 103 zcmZ2zGS`GVpO=@50SFA&?%T+nz|54#xH*?Oj!`8=za+OnzaX z*D$wSKPNLuzo4=tBR_BRXO=cbkdA7$xdMz)lO@H^Fy?N4CZ5m8m^(R4(upx=@=VDN E0Bpq}bpQYW delta 107 zcmbPhve1M(pO=@50SGF$HEiTgU}h?e-<-=F$EcB^Us_zGpOc@Qn4_PQnWSG(S(1^T zXRK#vpkJI>lB!#fn4F!Mo?5*5Jxd!SQ(@NTa<;hwjJGC>il1T3+x$p8pOG*D$wSKPNLu Qzo4=tBR_BRXAU+F0DGJjH2?qr delta 66 zcmeyW_*0QPpO=@50SGF$HEiTQz@ZVYUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5JqH^H0MOqSMF0Q* diff --git a/vllm/distributed/device_communicators/__pycache__/pynccl_wrapper.cpython-310.pyc b/vllm/distributed/device_communicators/__pycache__/pynccl_wrapper.cpython-310.pyc index 19d5c14d28bf309a4e3ea0298693c78d10b0bcb2..0563cd488969be41e11a2e52f656ed6153548796 100644 GIT binary patch delta 62 zcmZ2uyuz3}pO=@50SFA&?%T*M#H13fUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr`p>`0mX5 zj6>@Pnj*C&3LuSCq44{KH>#$mN<2m4trahoklO0r`Y%*SNGVdgvzAh+e)xEHW_M=y zJ9F!W2Zg8;jkX5(Fa2bDDYF$l+%=k2T&t{<&GKGXV@1Q=d&sITS!t`Ll+2t`zU(eJ zwpZ?22RM$e-#iqF1tSm&1z!jMY5&_h);%x58gBOaa2KonNqM6lSnhrpaeMTZM?nba zZ`7qb0X=-LX;so&h22(fyA!wY|}2X_v!d7#>P&) z-H_HPi-WgQiP#1=e*?a}K}nlg4~6FNd1`g$Iye2WVOK4KX|BPUUqZkZ33N>x~iHk3K!PWCO?LYZE&ZsDe~53b{LWkeD39p~O`I9Dwc45pe+W2}V` zqUAT~&=7~;hlx}l{EP?pJv~On{Yb^tTr+PO{G-?ZtI2|NM6^Muyek*`h5}*2cc`SN hVFp=xT%s;8hWFDOfH=8-xl@dU7>*2uviNwv@h^CwCE5T0 delta 1164 zcmYL|U2F_d6vy|D?QFN*U8>sJU8^6_t|@l92%#0!cRkShUUW@orn=kh%(^qHA6E1M zMHR{MAjDVV5y2!P9`GjKMB-)Qx=S=I;b4hEhkqsNytX{ zF>`q+AXNMb2wt!7OZXl7<+NAt6-gd0hg||-M&fl7MNhW+R=}>&e76PS(aMXJ*F4t+ zcphnN_ZL0sI!$Dpt)U&ZBSo<|jb)S<{l!YHVycXJqxSS$bF@n4jq(bf9UdtF(da7w zSh=m{SITm$GZ0OYNH-gXu1C}&>JXiX9(XsWgB*ZxY&EHX{jsdri|zz;H&nxiScrUu zFR?i3b!z60kft%QRP`rWDMe`)+v)n!X+s}Qrzy`%!TtLB$N?;|A8`<|15t_C37_g4 zx9mo94}!rGS)b(1rq0t@;@nilqCQakTT#}(#KJV40D$?NGZTe0~3hvCKv#?Xw zH>^-2V;rU{u*5cKZQe?9eE-?z5LxS7X?{jh28&6d($FUE%Of@*+7U|;To;O#g|HD^ zi~?G`JpLKUR~qstdWYdbe3m$ZW}F}TJ{}~t^ErMIn>;2pOMKq#xPc#6i`FOtHK2ot z((v#~>L529v9*@8a1q8ZR%CF?a;BnLrHm|k`H$NNoeSoRCveRL^7}OXNI@^?_u%}3 z@j5Q~I7Ux0NJ6RW6THi13#-TrXY;~)glY9{Q6qT+vlAD@Gq^hkcN4MNbIg28*m4q+ z%V-UTy5VEuc+UhgUB7M=hIFdfI_1N4VO(WM)$~!;t*Tgd+U(1+>yyr9ESqLZJhS)*GZ!<<EFQ_cZ$j>v@Gc?dI z&MZmQEl5nxPE1cN-dxG@B~RlPBLf2$6AvR73kM_9e-0+5e@x6wj4X^S|5^Sci%sq= o{=v+~%rUv6#8QNVk?TJbBij!q4yGSGTpU2fJWQJ}mlSaW0CGnus{jB1 diff --git a/vllm/engine/__pycache__/async_llm_engine.cpython-310.pyc b/vllm/engine/__pycache__/async_llm_engine.cpython-310.pyc index 9d8f931700a9e7cb883614fa704366b3a15faf7f..ecb32f47c91cbab6b6b42511f196b759dd94a9cc 100644 GIT binary patch delta 1080 zcmZvaU2KbC6vubob=}q~E!wVhm2Jk#)~@@oO?=H3!7lPn9uee#f7r*?^|D5NX^E`Q{CWKcL zfi(8H++=+oil^kLbQLbu;Ci|nF=t1}Xfv`JqNbZlvlu_-k z#qbz2%gZ!6(BvvNmsjM&27Ftyl*dAzqN_dS06&g<*MVPo?fsGm3-P({hPfDWa@Z<9 z?Jri7vMJ|w$3Teb6~R9V{M5_6U0}tE?oV1HmD|x4@Nm05Frs&m@s3WFVK%_@B^0Y& zOp3230pL=e2HOD4XbhztHM~$bQee`+e9#J7;HwD&Xnq%HXM+)x+o3CS3RdtAPJvmm zcgO~%czEanpKW3mt}EF1%34Zm*fJWqhK4l|)I+(<%5@e7SQB|OZdHokd2J)sNM&>D zs7^N!iN%>16yp-B$B5(rC#EFV&I+|5@1HFcW67wt!3-M5m`#RNC5kr$YoDNhTr^@Mst3r1zpUdg53kYMp> zLY9Kzklfdw&67jYK8dZvX}Joj(Vi@YT3nm-LX&bfIjsjb9yw}uZJ{QeG~+Je9^pQr zni4Y}rd4@z^aH?Fyf$2J-u9n@4tzg+3%29Mk#_Ln$B{wZ4qo+D!&`NsDOH5haVJk) zIzFh|$rIoHC7QX}m5SQ@vTW2*}vB}shm_MC=u^MKk>T7-0v90xfU1AAg%xc{* zIl|m=B_o!|#}YS!xO6kSAPtF#a3K*{T!;wXr;9{JFMfUA^PKmb^PcwAkm22s!4l5Q zG^fZ<=g8@MmPS*N$K9a`cWXGPw7Oec0`5p>G!$+xD_yqKt+hnel86#Ksx+&be%|!6 zfSz%zINy{(hF?abK3rUsPPP1U`J!aRVA2g`7aWw}0qCoBaxC#z)ZI}SvMmg|rG9wIAeC^0JM0mW{bDyN-c(C;cYr{`75e3wDkSFsja7D&@Y+hzPeu zqMARTM1!G3T2#@FYGMPwkCw<4XLsaL1+VDvQneoI_-wJFktmjRT^WCM^KyTeEvFpb zq_x!Q54%1P?c^J0ojJSylTgozvm?~Nm%F#p9)8n(#M~&ez8Ynzz3e@=P6qkh5%WG7 z{Prhk9IkGdD@&$As~?r$z=-V*&Gi8B9q_mI%krkWU|vJtgTq=v_$%`E&0{ zQn)pqFF6pmQGkcyeyOMQEzD8m&B<>F@|wO|r1HnULdj|U+vpHC^%tjykb9UoYrEA9 z?L^0BeYk%vm0IE1fI<8S4ybof89*+M?NC`jHh;UY8fP=}maU^h??SYb3k z*`Tl~F$)Uo5q2o-L(GQ462u%R7oY=Uz(E)RAPA^Hi1a5H$BAa@_Xp}y$;D|`#(o1D C(G`*a diff --git a/vllm/engine/__pycache__/async_timeout.cpython-310.pyc b/vllm/engine/__pycache__/async_timeout.cpython-310.pyc index 941df68391130f70feba32afe1fabc8ffb8bfda2..1f080ed0de8e97e226d05748f308b7223eb2a7ad 100644 GIT binary patch delta 1300 zcmZuxOHUI~6lOZLOqmw@6hx2~V!}XcDJmfHZrG`b(P*eKb(oG)nRX_pw<5+wV`5@t zdEMv_FkzvIA<>=x!R;*Ex-+g#OuXk5ow3l#d^vL--?{fY_x5e>bxyUT(Vi~xE585o zQB`EA%v18T78jmh%LP_<3Qo<*Gac@mEI(6kZPttR?SfU?C^$Q8({Au>c~MI8Px9_c zTGYS^gg%6R1my8S0zXp%PK&pReU+}DgpVRYYX5m~SBl3l=Qx5Y;Hn|>NvWSthZaji z=)`KER>%Rv2!jILP|K<6%+zEz*fgzs;PH5iNbt|0pRp0F`On$?Y$_w1dy=bEs&>VE zRAYNVpu7o8&LQLx{AD#|eJ~@OngnAQ(>fErDf$2=z*&UJ&hUEp#V~Dx_C%r`qWB%Y zlFf)h(F1pRs0aFDe5>bO%wuW~f@jr{*de~_>Xt@)0g}!Q8G6Gots{A7_rI&xqzURf zjg7JbG`Xz{4zI1TPm+Bj$^tjNmCzZWQraC2YYq#E6W8gg6)>B|rde%SrWR;()98G( zSdr!V*w@vJFtsRn9q7Cf8=a0`O!eAC#b-HUv;fQot1!K}Rp!g_zGAuC&@HQ?Gwoo? z*wK|6_O=_uEdQ91ah|`7^Q8;I)Vh7mNod;M3}(?<=F#eu9ercGoOtpyBTOv}w6NY1 zX>Xa;H2@oY#Q)TCBR6Vw({8bL2I)DA6bDMt>FiLdAmSgy+e9&Xq=*y}j}lPCEqlyw zB@@yTe~`R0pAk{*7|=Mp14zoEfPXtI3AY)OPvU9tF?es>E`b-iGvpqE zZ607yf{53uWjmy%BGiDo&sh`*=4RFmug8BGqaBCcyEDV`@PG)-D*G0FRS6GNhJFQb zo&cC^52M=S0SGe*Gr>02?jSU~9~@W_V7lG>DDi#>F98xnDs@o&PTU=Ck@x3&^F(gr~=Ddf>nDb;LPM}eQ%;WB^cIvvV`q$ zX?c|~pS2MG7f|#(j7p9?P~v$gqahv+Y@2vf(*9XKfgvGDk|g#w9*Yw#rV%wqUKxa!bfC2s_ zJJc`IE9*hXY$sfOA$xSk_p9szn8!KKjy|1%b8FkHKDBX2Af1EiFV86?EV%*F%~nf#{Eg$2aeY*zGDh;iR!omOq29v0@!v8@+b zq<9!PK#IYTiHYSu6VN6$MvfmWjFUaOUQ37poxs8b5(HrmpottnJJ=XE2X@aj1ORJ* BH8B7H delta 249 zcmccilj+@0ChmM*UM>b8sNB}Dk-LRc!%@GqxJW-IKRGc+KPNLuzo4=tBR|hr&(J`> zII|>Gw;(Y&J25@Ac=Kk?Ieua`K%HE?Y>XU?O#fM!nEr7vGyP>@*_;?*CCF4*uz7A~ zB0HniXhQn=jG*M00P6c`!;fCv8g!dm*f`c7i1RbmLwLXrXqWo=jG*M0D{VG4I8<$*fd=9ON)#2bMliDbM$jElk^KJOEU8FjP(o+^ouh~ UQgsUwld}`kQ;RpxWGi3;0D>kJ1ONa4 diff --git a/vllm/engine/__pycache__/protocol.cpython-310.pyc b/vllm/engine/__pycache__/protocol.cpython-310.pyc index e01213f1925bcef4f19457a5b2990a66910d2c7f..0e434b6c66a50fd905f9f7e1dd1937cf1056e0cf 100644 GIT binary patch delta 62 zcmcbpa8`jkpO=@50SFA&?%T*M&!S?jUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr*D$wSKPNLu jzo4=tBR_Am8uJ?#J_(>M4gnTM0Y)B1E~d>&9KYBB{OT6> delta 88 zcmbQHFh_wqpO=@50SGF$HEiVm%%tJ3Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> plB!#fn4F!Mo?5(FiTMqSfD}+ChX4zs03#bC+kYzi}AoLM(%uGUM>b8FkHKDBeyQQil=@_Zh?M5W`S-=Vo`c(iLQBWX-2MLZn=I= zW|DqEWl2VU-sS{$ZXu>T)y=t*tUOX;K;29YY%FYyLQFi2T+A$tT#Ot*$nt-4pXv@i zJ^`RShcXMJ03%SAX>*v#CRWC%&74-hm>6$O4sev1yuem?vc7EugtvKt?RsV~(-fjp z5w3HpqbM`uoyn_R+ysiic5?A?F>wi}B1XM(%uGUM>b8sNB}Dkz1Et!&kqwxJW-IKRGc+KPNLuzo4=tBR|hr&(J`> zII|>Gw;(Y&J25@AcykOpw-8g|#?6_MtUNLjKogi6*jU&Yg_w94xtLiPxft0Pnf`My zvHaWIp}K=lKnSRULz#t904UD(pNo03pUEax##@^it$r~v-k#iGt36rWHiGf?<_6p2 z%wPeD$qA0K5PgbB`nnxOnHld+Ug+W`R06h@i;s(ui$j1MOly5%rF n-h9ukpONv_?*h7bj@!sYOUIk15#WP7% diff --git a/vllm/engine/multiprocessing/__pycache__/engine.cpython-310.pyc b/vllm/engine/multiprocessing/__pycache__/engine.cpython-310.pyc index 2ebdd9c276d633fed78ff644ef24ca8fee5f3419..52c558349107bc629f50f4aa7de5c0031abcde7d 100644 GIT binary patch delta 70 zcmaDJ^Eie(pO=@50SFA&?%T-yiATj#za+OnzaX*D$wSKPNLu Yzo4=tBR_AmD(@FwraZpQ($YS{08CaFqW}N^ delta 74 zcmaDH^E`$-pO=@50SGF$HEiVm#G~P>Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> clB!#fn4F!Mo?5(Fk@pKPQ(@X>acLi60Int(3IG5A diff --git a/vllm/engine/output_processor/__pycache__/__init__.cpython-310.pyc b/vllm/engine/output_processor/__pycache__/__init__.cpython-310.pyc index 628012719aebfc0fda8762e1d781f7c93b874df9..d16adb25c09c70ac4491fa1b1c091d6ae355248b 100644 GIT binary patch delta 59 zcmZ3>xRQ}OpO=@50SFA&?wiPMqvE4ql3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEohz4gmar6D$A# delta 63 zcmZ3*D$wSKPNLu Qzo4=tBR_BRH8vGi0C5Hs`v3p{ delta 66 zcmew+{!5%YpO=@50SGF$HEiTw%%%~fUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*55}OJu0L5_@3jhEB diff --git a/vllm/engine/output_processor/__pycache__/multi_step.cpython-310.pyc b/vllm/engine/output_processor/__pycache__/multi_step.cpython-310.pyc index 5ab777190e7cbe56fed41b8cfe276600d61e2488..8dc16c92fd6dc503119de1c3fadf1ddf90ee50f0 100644 GIT binary patch delta 291 zcmZ2)ywaFEpO=@50SFA&?%T+{j7`N)za+OnzaX*D$wSKPNLu zzo4=tBR_BRO}1iA1&}s21|~)>MyCI4jGA0g96;sq#i@nGMFK#nsLgo-%8ZGFoR9&r%qABJg)mx8J}$JJDUWe;fv_4QqwVDB zB1VjMlTV3AG1^alDx%D2GMQ7fR>cgc;TCshaeP{4US@GdYKkULkrc=fuoYGymigpW zqLz#flb?tNGFogl6BA_=wFZfUyif$vU&Ie0EG8$2H#2%~ej;AQ$mljXUNQgxTfRp> delta 287 zcmZ2!yxy2QpO=@50SGF$HEiTw#- zlB!#fn4F!Mo?5*5DqAt95)V)(8v_#~2P4xzCPudZnp{yF>8U00#i@nGMFK#{TbnZk zlo{EqfXpI`$rA;$7%e9M5e(#p2!KRwCku)QGn!A%5ei|no_tVfIa8tQ<}6_~Mn=2I z6Ge<<>_LhcL4+od&}53@D9O)G&5O@WDRP*6UqqSFbTYGOEzp2QQ3;5#)*!_elb48E zGCEGaCmP6Tx!FKWlu^nCBo6XykvWLq2N9MaLK@_R$wlJXj6R$1iB~Z)x=)Uj3;+OK Cen>0; diff --git a/vllm/engine/output_processor/__pycache__/single_step.cpython-310.pyc b/vllm/engine/output_processor/__pycache__/single_step.cpython-310.pyc index c447d33beb1963ac24d9197824b3c32559811f4c..6bbc9431bcdf62c808227584b30322c6d6785c63 100644 GIT binary patch delta 75 zcmca&c)^f6pO=@50SFA&?%T-yhegF-za+OnzaX*D$wSKPNLu dzo4=tBR_AmKC3i8W7KAE5fv6j$H@f}DFB&t7wP~2 delta 79 zcmca$c*T%ApO=@50SGF$HEiVm!=e$aUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> hlB!#fn4F!Mo?5(Fn^l^h@z!Q{5fv6jr^z`IDF6bG8FK&t diff --git a/vllm/engine/output_processor/__pycache__/stop_checker.cpython-310.pyc b/vllm/engine/output_processor/__pycache__/stop_checker.cpython-310.pyc index f26ea791956e13b9deb7f78eff5c9ea9b0d3fd06..c77898239d896b996e14f66215cb8eaf983b3c2a 100644 GIT binary patch delta 82 zcmZ1>zDS%qpO=@50SFA&?%T+1!>kgZUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS jUr~UW^q+-g^D*{2%m8U)7_R^T diff --git a/vllm/engine/output_processor/__pycache__/util.cpython-310.pyc b/vllm/engine/output_processor/__pycache__/util.cpython-310.pyc index 2918745da967f322829a4f9058bd2f33e24c228c..14ba774d0e8d95582e3af360ac19310bebacb184 100644 GIT binary patch delta 62 zcmdnav6+KApO=@50SFA&?%T+%$)w_;Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr_if}(VO4R`FUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E zFQ_cZ$j{q6opm}ZW7KASZdFD`^U0w++Kkqd8+mGgEOeh%Wfm1>|0Wxhrwg3PC delta 305 zcmeyb)~wE*&&$ij00foW8a8sLuxhyJmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} zr0NzVCTAz6rxtIX%sQQw@z!Q-ZdFD`i^+jJ+Ke`nYk6vbHlcpA5uk;s@jTp9_A#-4DO}yx-?J z=V`}_lSR8`w^uC^PxSCi|DV(L(>8Bsq>#%;@|k?Nkm7ymLO7lq?9WAWLy>G|QzZXl zp%Z^4Cr_$$B;pbQuTcIhXYmM}I>pEf$_m*y2B zu`b}E72bqr0{#I2B|_!qM|Q%n78s@ZiluCfCcPWm-V=tBrJFxuMh4+uI6n>-!pwa8 zE+H;wLfs<-I^uQHp@5TK^*I)s{UNdlm#2Oi9reX(NhqNjJ_5%$9Qo$PI{r3P1$YP8 zjd`k@Q1@M-5Buol1{eL_SZU!Hupxnl`TGK5t^nkPyT!ChRVJ6}ODB6Zu9;0c&|2V5 z)5Aeoe9m(}75#RXti0E(?7yorbp>2Zo|^-6hyPc?CZ_iOqHp+4XeRsa5gx9lU`X^z9SwBb0ajK5g zi)sCl4eX@;Qe-z1%XM$GXg?vmB@17Tpi{Ijntyg0wQNHvu4dFextK;xvSaZ1jJ7_- z2hyD5w2Z~cp7iFyfmHUkaR>#z06GD=*(Ze*a`1;>_!5|*Z0qCAry$DJmHT&Gs7ejj zvba^XkX8$P2N|uz&XKzEZ>x+xO=|2xVJO8~tmn;2S7H-vmbSKyvJ3Q2Tf%w~=JT{> z)f4Ozy}9ZI=PV3a;1ckfK*`20((<^=Is?mR)Eek)vvb)4@`^>JsD<|A%U3HH|wi!H<)zfM=lFe+13~tZ&>A9wdqm2sqO!-$7s9+l7b!zMHOO$<|>l7c(2G&X+RFyyZ<7xyMBHkb^%d z9()f)msQcw@@Ji}@)4<4DKD{cDXpz>(X8_0vKQe*Tl{I@WuOSy3lJTy_0fFIZ)_hm z20ZlBibj#Y;P=uhe?mEc5CcG!P_g~uaTwZxJ+w9Gp=tl-l?R17<>=z;?6^937td~i z3t=+5s*HrVlnM29>aOi{{?pYH?g`-uRq)-2-A8}cuBdzkViMR7yeeAuve#&1pg}h6 zOP~#YNI>)&guHkUm>^k}84#;arFE{`gE)hB8)tmgdxNcZtx3C9;Qwo3o@AN2ttX@3 zsb!B9{#U(fnh6H(Oy^sIv6ds?Flz5M@2Tr&tYGd4m9hs4!eo_i=4+q9WC zA?PR_tlz|@>F4@i*b$m<@cG|>SuR8dyeXpqsm384BjuqRY>LXm0al<`xTf;BFk3|f zM(^KMd&1r9l=*fz$&`1H@~%L#dLUyMnOtvbFsr7uK0Vu`apU%-YmcrsL7Unv+7bT*E5Qi5l{*Srw@^Y^hu2hQ`IsTN7KVypN1W0eLZJ zg%n!C*TC=rFh@hN$Cc9%<+YQyNA_32^(;;=m)CN6I-=Z9zsGj53pCR7hf~I%qmlS3 zVKC$M&d*R_j(&*mXP0Q_$}#pil{6>Hzl2%(botGsn&a#;O*D@rF2R!pE(6a9Ou4v> z?|`9Gz^V{$9}-(p^BFzI=U|_q^(`CORhn$}2Kg0Oa5|y8`SXw$smi~RZ@$r@c)vx+ zcL--zNnY>Qa+w_(w_yFA0n5fy!Tid;<8|v{wJh*h#v$cKuWG^Nhkg4V(hx yKMl^3e*}CCd;)w5da#3nxNossaVsUm9YjJ8(S!&ee zYE~V_sL3l>@33hD?J3gO+{ISG1QcQB^bpYjiriv~kB?$Y%}dYBOI^tbl#l0(Wwg=- z%BT+2nbg3X{8e0;M!SGG-vc8bsKF2w@NbG>Au^QE9Ro?{03e%jH3$ O3X^qNBqp=)=>Y)E&rn(b delta 312 zcmZ1{vq^?KpO=@50SGF$HEiTAX4Y`gFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` zN!2Y#OwLYBPc7cOhp{~R7720)QpO!4tiY^izanR%%z8G-WA zoUx2nhCrE>97XIPEhZpB3PhNJ2y+m@1|pb1gawdT$#jb`zQ_{9wVM2iYXYOq)p9 diff --git a/vllm/entrypoints/__pycache__/llm.cpython-310.pyc b/vllm/entrypoints/__pycache__/llm.cpython-310.pyc index 0f22fd2935353382c918106c0b2b43ed0575d8b3..3f0bb4df328dbc41d49e9b029df14d6d927cf7f1 100644 GIT binary patch delta 104 zcmZ2=k#W&QM(%uGUM>b8FkHKDBR8kKinV@8Zh?M5W`S-=Vo`c(iLQBWX-2MLZn=I= zW|DqEWl2VU-ew#5w<1h=Wt+846ciYZCi{d)vhXl+FmBEc(Pd_InmjXH9>U)j{zd=* DuTUSx delta 158 zcmZ2b8sNB}Dk(*Oq!(P9%xJW-IKRGc+KPNLuzo4=tBR|hr&(J`> zII|>Gw;(Y&J25@Ac(aB4TM?$h51Z9Z6ciLpfF^LT3o&vqvVq`#78VX58w9x+nf`My tZB7l*Wma" if model_type == "mllama": return "<|image|>" - if model_type == "qwen2_vl": + if model_type in ("qwen2_vl","qwen2_5_vl"): return "<|vision_start|><|image_pad|><|vision_end|>" if model_type == "molmo": return "" @@ -172,7 +172,7 @@ class BaseMultiModalItemTracker(ABC, Generic[_T]): return "<|reserved_special_token_0|>" raise TypeError(f"Unknown model type: {model_type}") elif modality == "video": - if model_type == "qwen2_vl": + if model_type in ("qwen2_vl","qwen2_5_vl"): return "<|vision_start|><|video_pad|><|vision_end|>" raise TypeError(f"Unknown model type: {model_type}") else: diff --git a/vllm/entrypoints/openai/__pycache__/__init__.cpython-310.pyc b/vllm/entrypoints/openai/__pycache__/__init__.cpython-310.pyc index 84bcaef58ea31333410de4f393541f563cf63e82..d5f09d236f58d8c1a162ded2f8b67024e863202b 100644 GIT binary patch delta 59 zcmZ3%xP*~ApO=@50SFA&?wiPMqvEb#l3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEohz5&-#g6Bqyh delta 63 zcmZ3&xPp;8pO=@50SGF$HB98T(eTzUEiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNTd2>?ba6es`y diff --git a/vllm/entrypoints/openai/__pycache__/api_server.cpython-310.pyc b/vllm/entrypoints/openai/__pycache__/api_server.cpython-310.pyc index 59e7f0556e6526e8f7bfe324c8a18c59130d3a40..6f95699019b7db329e8588e1ba9d3eef00949986 100644 GIT binary patch delta 3319 zcmbVOX-u5Q8Qxi7fra$~%fhY!gE=Kcs`|de#&M{BhV8wArjC_^W&UJEOB#Y`s$!W@5xhq>1{OM3eM0nI^;2Y*NtQ0vkXG%Acja-pO^E9^_t3*D{7X`FHtfs5AmSPl&B3h(*s!=RTXo==FV~r@K zrJ56?On9hA^A$$9sGt>^+l@+5MXNMVGpa=mtAsp zsClNbPBhUb&7DTGSWnk$o@Hzh8|g-|iEh&EY(w25byK2~cIvjv*eSf!tGV0g65X_0 z^OeRf(L;MQ&oOq3UfQd9uF)s@X}{)q#vZYk?$vyiu}|!$`!&xu4hTxA<^{${WQAqtfd3=Z;VMUuvd_OCmA(U}GW1_=6lbgmz+$Qi!z_YP6+%;@w zrL1f=9->A;@$eK@&Kyo%NE@kbFBR?F&U6QJ(|&z><& zQ6rYJo~@mYr-C(bHw1ejRU=ymN+70mgVMyBK?%l`eo)r44WNW#N)IR-*(Ok)jwy|x zJjFJHBDt{;W?L2s+p0$>0Ot#AYMY*I1k9ssJD3f;9RtAJ!CJI;Ona@`+ZOZMSiAO~ z(Mda&lR{lO*-ot=*SZ(N%(XG1#ttWI-8dz~?lF|NIt*iLXk?S|P1lzf(L=8bHWSFkZ&wCpl6 zY-QtY0^D;lQq?4mj*2?*OpP%%R1=zvj0OX0+*=Q8@Xy*OgtRJ%_rKow4kne%yaIyFBJ6y6nsT)Z_jZmlJ$gto13#okSr2 zq>`@dWLnRq$em5jsg3R{_8G8m5qSX~o@9Ai-FJ6bA~>CCRlagNxvT;!%iGVR@LVhe z9yC4ndKr%dCwO4&1eecaObLPw;UdBd2!#k42$x{&Oy}o)@^M;M(0NfM=kz7b1NFp1 zAy`g95+?ANVHy{6a-0ep@VPLBEkMlE8Riv4D)nZLm&~i=TrYV^?aft|IWXnC`bVxi z6W0^93eLv-zQ|;V!`h(sdAY?;oaQR*Y)81HH_0^>$}1w*)ED!rZ7-wzB>+fsQvED1 z`^jkvF!ZrB*VU?3MdZ5LwrYM`tb$Vz5>1O$kc%PC80_jN7qA#p#tH~;)cy*z_h9L6 zpz(^T&3~A22I*M11|7QgG8WzNU8&b^U zdTwFf+e_<97fMRVMRlj701oiolG%8ir3&Ucl~{9+ z%&9GTFp#`G$JEEJFHKp{Fmc z4drhld>7#d>YS&+qQ$q>Tb_gD?ov*9A0Y=+u%bBW0EEDCZBt*a_(|EXF#gvFA0XTZ zfCV7;#7S*xJ*qBOy2&rp?aF-ebM?c@#) zKcHv{kBtQUMl`XnqpiQCw@czjMc!3Et;$nwWEz8}A{xP$fLqwzz*pdmZ4{e6Tm0v;Tx z58G*EcnvMD@GWHL0HX1sU^pT#n_5745mmf++kHK~ vyIMQEExo=S9li1(hAbl7REL_^IA2AI2TtBa&@bdu^>T9|X$ooIA?eLc2)2aAm9aK zta?&yog{^-u_jZ~nVm^8?PMl1X*!)YnWmYfw%a6a^P@N0G--ddoiR<{_pn+!9rwrc zJ>T=Z?|aU9_nhX`?pH<3+MuLYHWsAW~#1P1W2Y(quYKml-rezY~#3Ga+}8$dcJKTiU5z zI;cZ?R*@rfY3_u6SuB>yJesF@qHxN5nlB4zfh?qjT1yhkq>H*Vw}~QIOp7&77A3Nj zmTFE!nJlN}nlBMULp_?OiYi%6t2Iv(HL{kr*XoyaQ77wZz2+HWxon^f znrDhexq`0HJWDjmX4`}BU=HAj42(UG_ht-{4u2ml$C51D1n&L2}%oF4N5SkG=Q>( ztp()(ADuJUx_QFZ>k$gTd4xR*lbs+m1ZJ3R0JDKVh5=xHg>BR;IjFr&+IuACJ;pX` z?~pFqx=CLGNH&XH2l#Fg{*ghRTrOOOxuQlc|#EcY|yQT0YIz@&>k_SFmC3 zT5uT|Ok^W$6xc~#IiFzOrP zAvKsd<%lK?7~B`;-mot;YBa&67LD^U7FAy+9w(dC@ubg5s|wiqZJl6kGPVL59g*9% z5@J4ZDe~`RMab63#gugf!rn{0lMziF;$g3G(C;7i4|zo(5R69NO^YKHJ0O#$NuM$5 z4H|&~9twFG_c3=;tR@!jLfEFhNN*=QRF@-zw5vTC^Q8S^=Gzv`H@ek(nS0CpNP`Fm z5VX?^ENX$Vx&M%{2j#u0H)~t!|AtYgdc*2i>|r?6eb?@TJ2Tf9k!P&cvBC0Z`mur`^@fI@TSqr zTc`&ISw+bnsP3roC5nMF`kBpd$BR4Zs)XG z#xP|@mF8|B&!~~yisUmWJasQ*KG$CSRa8n4k`c}$TtILkq$6BZALbTWzJ~OYN?6)s zJqOes4~yKpw6Ga7+-7429#M-7FfKwy3&v_#i|jH$B{7*o79i%ybn_BoTvo3wZ71hc zLS8$0R(0no%UKLPr|#tCWa1*CiITHnpEo=n913;Mxctq1;dwC!rgMx>L1AgP7Z79U#2MW)t-25Ukuh!Mq$qby@uF^k}v#OT?`|dvSe#BnUL&$D5T3Kw} z4IywQTh-;tcglZ-@gE|5gz#$sm^pGd=GxTy$Lg#nhul^#cnZkR)ek+5ssByU_p{pED9EGOt^M$xqA6I?L#m?+6)wQZg z@=2tmx(hDuYig|KwB2Yb-yr=h zK-AjC$2S^Az%WMD$+~j#2laAYmZuZ__W`K>1T0KpAmASy9x^^bZ#_Z|!td2*b(IBw zLV5?`&j^13h+1%W`vb6#TGguh>eSz%vj(9V;R7{RU+=&fnkQ|Ane0iCFJ$$_C(`CJiPGHjNgvmPu#TzHX<6oFAxw$JHG!2 z;V=T8K7CUeQ^=+f^y1z`HVY7q4+cVE;~A3^giEO69cw&`Fo!UYa8)%mJCnRfuOr-0 d-saM*7m?z5(*MFj&+n=$%`Va!dA+%j{0HU-Zqon& diff --git a/vllm/entrypoints/openai/__pycache__/cli_args.cpython-310.pyc b/vllm/entrypoints/openai/__pycache__/cli_args.cpython-310.pyc index d67a7cd3e55e875273e414d822cc25f52cc5cc39..e8274a598579ca986e60e5e24da4d18b9540502f 100644 GIT binary patch delta 62 zcmeA->o()g=jG*M00P6c`!;ghu&TK0m*f`c7i1RbmLwLXro?=h=jG*M0D{VG4I8;_ST(%$ON)#2bMliDbM$jElk^KJOEU8FjP(o+^ouh~ UQgsUwld}`kQ;Roevn~(?0EtQ!C;$Ke diff --git a/vllm/entrypoints/openai/__pycache__/logits_processors.cpython-310.pyc b/vllm/entrypoints/openai/__pycache__/logits_processors.cpython-310.pyc index f28c2a58f0baf34008d42e99c293613a076262d1..45a3dbe6f67697b744a54132902eca92b0c26d55 100644 GIT binary patch delta 62 zcmaDLaYuqXpO=@50SFA&?%T+HhDjwrza+OnzaX*D$wSKPNLu Qzo4=tBR_BRf2KrE0BqtFRsaA1 delta 66 zcmca3@j!w*pO=@50SGF$HEiTQ!=w?SUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5H&Y@f0Kp*^W&i*H diff --git a/vllm/entrypoints/openai/__pycache__/protocol.cpython-310.pyc b/vllm/entrypoints/openai/__pycache__/protocol.cpython-310.pyc index ddf2de4800ecb68ce2a270867ef4eaebc1f4f08f..a2b1492293e25ae800506d4463142e2f78d407b3 100644 GIT binary patch delta 140 zcmZ4ghH?2DM(%uGUM>b8FkHKDBllc(6?grT+yecA%mUq##G>@n5?%A$(u`cg+;aV# z%q0DS%94!yyv-NbC#gux0P136b8sNB}Dk$Wz?hPQrcaglybesW@teokhRenDkPMt+{Lo}qz$ zab`)XZb4#lc4B&J@#Zt^lT@T;0d=x5axk(mvN7>7vN5tSaWQf+GW};^T3n{X$yAuM WxxzGGKxPS=G65!p!p)3sY6bug${`&9 diff --git a/vllm/entrypoints/openai/__pycache__/run_batch.cpython-310.pyc b/vllm/entrypoints/openai/__pycache__/run_batch.cpython-310.pyc index 69572f50b9764f405791c0253ab82354aef575e3..acb744c7cc3bb2f0b88689f9eb77bc79d07c43ea 100644 GIT binary patch delta 83 zcmca-d&`zPpO=@50SFA&?%T*cjYGvlza+OnzaX*D$wSKPNLu mzo4=tBR_BRNe&lwrabP=`~t@~8KWj&lhkLtwV6%o1`7aj)EmbD delta 87 zcmca*d(W0TpO=@50SGF$HEiUb#-ZV(Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> qlB!#fn4F!Mo?5*5D2EF>Q=!FXZh>Q*jJGCVlGJC6+RP+%g9QNMvK;#W diff --git a/vllm/entrypoints/openai/__pycache__/serving_chat.cpython-310.pyc b/vllm/entrypoints/openai/__pycache__/serving_chat.cpython-310.pyc index c9e2f781c8edbfd7b13edc484152fb28123d38a1..ac60efec61c37a766c3192cc3afe429a9457f9fa 100644 GIT binary patch delta 671 zcmYL`OK1~87{~XUY_@rA8uK6<5u>(}Mw2X|HBpN}r6(106a zJAk*CxzP7sD3O!VChrF?m>W?E!3okEy8=JR%~%cY5)>Z>gJj}ixnzJMEr2G_=)tZD zRD0Y}T%GHZWhUnxEk2hy@tyOC}DbbV8^_r;Vt`#Cy^GnVNcm+h)N%=?IWiW zyJymLT7=$;xTg^`c&f74XYkk`;-=UO*{;4nfCEi1===XY>gi6WbA&tVX-G!U zkd&wrrv5nY3382)5n@h`I+LS@UD<=VIxIkK@)&mw^u2y&%|c@AhXEd*oc zgXB8EI=MZlMjYS=9{4u0xWNrB*bcUQ?medNu#~8MVtSe(!?4UCF-$SMrx+7){(J@JaZayH vmsm6*BMD$<}db6z{CCvnr&5uoYlhVSj zEn4C!5F7+W59S{b%Az2674aepR+6eHRq&=D;-S>WnM8Dl_j%v_zIkt!o%K3AtAk4w zMJGp}<;Sb*u7)deQLgElTvRjZqFl_+%a!G7PAyL)#*fN+zM73!(wRc~YF4+Ny7r1N zLtaWZ1qYxm&s(#B?|Yz3&PQ8<2l%cRS>K`(f(yhRy9Pf1GCP~JFa>)Qi zYJz5`*@K4)NPpB*T#f6woFe|sZkEYfyyWjzy~dC+q6BG-VrOH(^fqC^M})))aXhXdRqJ7c=9A4Kp-3k>=N|2^yr&>fXa zy-wFz?uy5h48I{MQ6)(Id2IJ{X21wAXO21xv&Nuu7;`mfg04+**P(i3m{~W#+(&b) zU((hrB;Q7`Y26wB39v&N6D67bJ_q7=c@_iwZ)9_W8;0NjI9Aav&kG=Q1)BhTZ#k{8 zVGJK%8EaGfN#aTR8 xRSVg&_Kp?aGxR2Ik>`^$(6&ZThHUVeoJ-|k%X*kv0{Ci$Pqz?!AurD4{s10JyCDDo diff --git a/vllm/entrypoints/openai/__pycache__/serving_completion.cpython-310.pyc b/vllm/entrypoints/openai/__pycache__/serving_completion.cpython-310.pyc index 1928b661faf42a24b52c39b2515db6dbc695965b..4fb40e4af8a355e4cdcfb1bfc02e8e3d5fcbe5ba 100644 GIT binary patch delta 830 zcmZXS&1(}u7{)tsv$k2QX^5ryuxdWE0ZXh3DpbUasp3U@NC|}yn>C5aZq~_co3?8G zO4Lwmb&TSn(1RX|D9YYFh<|_{&AmqzL@1&M=h+lL_weJHXWx0}o%fxk(dMX9?(TMV zh;Qim>sQJbIdVGAG$U>lj6s&6Ih73_)Xcm#q)o+3g|l&En&r#772UYcMN-yS&s&GP zC^pk!;2fY@d%Sh2|047y;4&~L&~loUOiqnC=ym?CFR^Af5&o|2R3%#{wbpiO&X>q)nug@cv+(l&q)0H)M{Au$a`YieXCvFyYD+ z_h?uB_d&FdA6I}I0x{2eWiU;SkWU79(2-G5B)y6lqu=qg{kN PvDS925wgrb54`vZU(?Jk delta 839 zcmZXS%WD%s9LGE9W^EH1qok4-)jTQ*qN&z`f*^WH6;HNW2!XIBYZCI((p#S21!frd4UIsHCN0teC$Lt2ES{QXW5Wa4c5MtMdMelrBhFxvB@Y9kP+0 zKE30u#aZMB&|^RrxTr^5ZDHgp^fh1(XmRwcT9xmPTIf7`?~VuSh}lX~J*6rIxm@iD zayqBb2J%&)$tFAj@iOEUmh_w!+mJF_^PK(fR_5@k_A=Iw0}E`?>mhme+#3rt5in2T zs%K5-v~q#oK=dZiW*golDX?i@kbGe^->Nu3gr5Tz=JvNqNq^#hL*}YHF)Em4Y1kA8 zW)T%B8ZpcM`zpGCh3mjAWbWLm4S`cY2e=K~0nDbM3=g_c!@!K;;qMk`5*D$wSKPNLu pzo4=tBR_Am0?T$T#;DCV`1+X{<2Pprond542AWZnFxg6E5diCe9I5~S delta 91 zcmcbic}J5wpO=@50SGF$HEiU5%d8QiUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> tlB!#fn4F!Mo?5(FhGjb!#^ond540h&{kIN3~O5ddb+9x(s_ diff --git a/vllm/entrypoints/openai/__pycache__/serving_engine.cpython-310.pyc b/vllm/entrypoints/openai/__pycache__/serving_engine.cpython-310.pyc index 8920d029d506da864ecbea00c42c9d8a6e483261..f33f7a0d99ca7e6f5a46af6d9aa158e91192f745 100644 GIT binary patch delta 82 zcmaE!{V*D$wSKPNLu izo4=tBR_BR50(f`K9Dvx1|~)>MyCI4jGGhm+SvhMa~Tx? delta 88 zcmaEu{XCmHpO=@50SGF$HEiTQ%AygdUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> plB!#fn4F!Mo?5*53rmEi01r?n8v_#~2P4xzCPudZo1^sF*#QG<8zBGy diff --git a/vllm/entrypoints/openai/__pycache__/serving_tokenization.cpython-310.pyc b/vllm/entrypoints/openai/__pycache__/serving_tokenization.cpython-310.pyc index 258edf8026ddd35dbd47c5574d7e99754b27bd46..73a6915ef8562a09fbb19e51c58224505d797df9 100644 GIT binary patch delta 77 zcmbOuGed?upO=@50SFA&?%T-S!=e(bUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS fUr6Vd`c+HZBeT*D$wSKPNLu Pzo4=tBR_BQGsXY_HVG7P delta 65 zcmdnQvW TlB!#fn4F!Mo?1Nl5n})VhVT`D diff --git a/vllm/entrypoints/openai/tool_parsers/__pycache__/abstract_tool_parser.cpython-310.pyc b/vllm/entrypoints/openai/tool_parsers/__pycache__/abstract_tool_parser.cpython-310.pyc index ae2f3f37f34db68ff9f4afed9f0f222d1476e5ff..77c6782979962b0f399cd83302ea12afe95bf789 100644 GIT binary patch delta 62 zcmX@DcU+G*D$wSKPNLu Qzo4=tBR_BRN9HJD0BuSYQ2+n{ delta 66 zcmX@EcUq4-pO=@50SGF$HEiVG$E=Z}Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5EpwDG0KuIWVE_OC diff --git a/vllm/entrypoints/openai/tool_parsers/__pycache__/hermes_tool_parser.cpython-310.pyc b/vllm/entrypoints/openai/tool_parsers/__pycache__/hermes_tool_parser.cpython-310.pyc index 82faabacf59f852835a9801fc44a58702a06f72f..f621c0262abbbd7a7c72f37e799857b9a847b218 100644 GIT binary patch delta 357 zcmW-dJx;?w5QRP7wY_oH`6EA=gnt@}$fSruO~Vn8ra%I0C6RWB6&V5z6yX9WLZXBN zP(&#xKy+M!BT&N zYL$HSGcVNIAvLi{Eo@~Vr`Bl$H^7MeXmbj<71dt0L-!SqjW8d|2P2eGb;@+JGyi+C z_D+L@;vgQz?c{9SkCJwet_IYhNuY-3L42DGMwg4Z{au8+*`&UIB*4{@ARP&2D!9;| zYniDDcFLLdW`Wt7mOwB8OS0^EYMaX}VfI_UW-fOZ7ma7|cE>&a%O7hT^`n~w_#f~O D(A-aT delta 343 zcmXYru};EJ6o&6kra{ll8m;b%-*>EG*wMlxTx4Uk0;?@s<6RrtO>ZnVKR2pbV zh73sRL6~T!Ul*3lU`9DAY?;MLRJ>Jah!vT`oXlfhF%zrOLr-N>6r_*7%9bd~5|(5c z%Zf8%O;)f1B=p1eG2lj+f7;~sGaM71<<33fPM90(X;bBJN^0)UVs*1dXY{Do8P4cQ zl7$;%yB%D`gFr-`mIy?z9rQ=TZgjc7yH^k5-Z0$hw>lTC^Ds_c*w->VOk=O+GtlO? yW`hHc>7?1B3*%_hSFfZ>N@*%IpmU~K`hWTDUF(c4C1-_4U|WO3bWZZ?f50ESuTi)F diff --git a/vllm/entrypoints/openai/tool_parsers/__pycache__/internlm2_tool_parser.cpython-310.pyc b/vllm/entrypoints/openai/tool_parsers/__pycache__/internlm2_tool_parser.cpython-310.pyc index e4db40f01361388a712a7b21827b5659a2dfe3a8..15c820ddb873622daaf8a0bcd8d4905bdfa2daf6 100644 GIT binary patch delta 163 zcmZouZ&2sX=jG*M00P6c`!;gBFsmf$m*f`c7i1RbmLwLXrYEf7rMSjbq*U&CLtak3D*AIk*B zLhH#%?5g@FYXpl=rZChBgen`d$KurLa2R_Bdm0|5EIJ8A#` diff --git a/vllm/entrypoints/openai/tool_parsers/__pycache__/llama_tool_parser.cpython-310.pyc b/vllm/entrypoints/openai/tool_parsers/__pycache__/llama_tool_parser.cpython-310.pyc index ce23591c1d6ed25f951a88a2a5107cfe305a1df8..dc102bf3f30c111c979a5512bacc610ff0e3ef8d 100644 GIT binary patch delta 437 zcmW+z%}X0m5P$PFyV&|6R_k9mV8NF>;j8A(b5!fSb!TC+FgWQ*7OD*GauFLXA=R44Yf9X&6MRg-_XG@}X4ii7|Phj{grTl5< z1P?Gvsm^Ykr${y-*PQWfNww#a0uA0%~6rsLYoPwKke(6q5(VCdJEjqKSX>7!MyZAQC zK9_rO{}vxbZ{Z0~jd74oN3qh&3z9Dv;jEK3PGRv3l}#2|j=GKIhj{Fs=-x@WnHMYr|_O`$r!=WJE(rL4ibrL@^PC<2~Vsoj9>W5$UW%m?mAK z?V=Q+wdhWwrslt(L`YOfNKsJO>{Q?Hn;A_pe|s0bU=#$5sM`N}IQ)JRtRGNLxFHNQ z!K6g7DJ-|ZwNs}?;O+~;10H@NJWT5|6V}q!d51@zsq!&Tluy#;%v2lqIDJhzrJwmT zS~S)M-4By-SBwUI(G^>p-JSit;b^<}=<#}YvbC2!-02VA_ur+Hd}#h*^rL(mzM`4@ z5?&g+b2*QmN53=gJh?tJ4YP3kOI}7#tz)`-CZEK;hL=UhbmDO`4Yp6RSaIXpj2rSW zuDBbzyCKiwse7vZsa#5q=(l{HbgcLRC4>cxGM7=~%Ch8-O0&#d|H@F&w;k$Ru_ETm Xp!$ZgoL7&ibAS9&{W!m<{iFW@T8V#~ diff --git a/vllm/entrypoints/openai/tool_parsers/__pycache__/utils.cpython-310.pyc b/vllm/entrypoints/openai/tool_parsers/__pycache__/utils.cpython-310.pyc index 6d3370427ca2be533e45bf94b06fd54f65520179..31b9a8141df05d0d2cc864c8c3b9cfef6ca943f2 100644 GIT binary patch delta 62 zcmZ1{zDk@spO=@50SFA&?%T+%&8!lrUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr05+Nvp8x;= delta 66 zcmZ1_zD}GwpO=@50SGF$HEiV8X4VMRFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7aY#T>u^0EWdBuK)l5 diff --git a/vllm/entrypoints/openai/tool_parsers/hermes_tool_parser.py b/vllm/entrypoints/openai/tool_parsers/hermes_tool_parser.py index bcbcda3..f3cc1d9 100644 --- a/vllm/entrypoints/openai/tool_parsers/hermes_tool_parser.py +++ b/vllm/entrypoints/openai/tool_parsers/hermes_tool_parser.py @@ -1,5 +1,5 @@ import json -import re +import regex as re from typing import Dict, List, Sequence, Union import partial_json_parser diff --git a/vllm/entrypoints/openai/tool_parsers/llama_tool_parser.py b/vllm/entrypoints/openai/tool_parsers/llama_tool_parser.py index 3cf34bc..f950ab1 100644 --- a/vllm/entrypoints/openai/tool_parsers/llama_tool_parser.py +++ b/vllm/entrypoints/openai/tool_parsers/llama_tool_parser.py @@ -1,5 +1,5 @@ import json -import re +import regex as re from json import JSONDecodeError, JSONDecoder from typing import Dict, List, Sequence, Union diff --git a/vllm/entrypoints/openai/tool_parsers/mistral_tool_parser.py b/vllm/entrypoints/openai/tool_parsers/mistral_tool_parser.py index c6dc068..b7d5d0a 100644 --- a/vllm/entrypoints/openai/tool_parsers/mistral_tool_parser.py +++ b/vllm/entrypoints/openai/tool_parsers/mistral_tool_parser.py @@ -1,5 +1,5 @@ import json -import re +import regex as re from random import choices from string import ascii_letters, digits from typing import Dict, List, Sequence, Union diff --git a/vllm/envs.py b/vllm/envs.py index 4c9b4ae..3361afb 100644 --- a/vllm/envs.py +++ b/vllm/envs.py @@ -66,6 +66,7 @@ if TYPE_CHECKING: VLLM_SKIP_P2P_CHECK: bool = False VLLM_ALLOW_DEPRECATED_BLOCK_MANAGER_V1: bool = False VLLM_TORCH_COMPILE_LEVEL: int = 0 + VLLM_V0_USE_OUTLINES_CACHE: bool = False def get_default_cache_root(): @@ -430,6 +431,12 @@ environment_variables: Dict[str, Callable[[], Any]] = { "VLLM_ALLOW_DEPRECATED_BLOCK_MANAGER_V1": lambda: os.environ.get("VLLM_ALLOW_DEPRECATED_BLOCK_MANAGER_V1", "0" ) == "1", + + # Whether to turn on the outlines cache for V0 + # This cache is unbounded and on disk, so it's not safe to use in + # an environment with potentially malicious users. + "VLLM_V0_USE_OUTLINES_CACHE": + lambda: os.environ.get("VLLM_V0_USE_OUTLINES_CACHE", "0") == "1", } # end-env-vars-definition diff --git a/vllm/executor/__pycache__/__init__.cpython-310.pyc b/vllm/executor/__pycache__/__init__.cpython-310.pyc index 06de5eaf40730cbada8d45bac9058514238f248a..a4435721563df6af49f9e31c1ddd53d1204119c3 100644 GIT binary patch delta 59 zcmbQoIE#@xpO=@50SFA&?wiPMqhhOHl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEogI9{}@P67T>3 delta 63 zcmbQmIFFG#pO=@50SGF$HB98T(Qwo+EiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNUI4*)-!6aWAK diff --git a/vllm/executor/__pycache__/cpu_executor.cpython-310.pyc b/vllm/executor/__pycache__/cpu_executor.cpython-310.pyc index 0032ddf3b52621deaa1337bdfc62519eb89a7480..6286a080944c7e3af039b6c720b102d7ec1ebed6 100644 GIT binary patch delta 94 zcmX>cu{(l0pO=@50SFA&?%T+{ltaZ)za+OnzaX*D$wSKPNLu rzo4=tBR_BR4UT)fTp~bSJj`5-ER35EiCGA72>|(Aj9@;SrY$o7U?3SW delta 102 zcmdlTaX5lIpO=@50SGF$HEiTw%Aw(^Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> xlB!#fn4F!Mo?5*53dcQO9x>nn28plF5v*n@y$E85tud$4ZwpO=@50SGF$HEiUTWzuldFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7c;!}Np^0DZ+2{Qv*} diff --git a/vllm/executor/__pycache__/multiproc_gpu_executor.cpython-310.pyc b/vllm/executor/__pycache__/multiproc_gpu_executor.cpython-310.pyc index 57a1ff8ef4abdb34f657607ddb336e50371159ce..a9f62cd7459d5d7cc3fc7c2952d3881f7d9f8ee8 100644 GIT binary patch delta 121 zcmeCT@3iO6=jG*M00P6c`!;g#E zFQ_cZ$j{sSfuomMObe)sgOP)gi`VY{y&{?b delta 127 zcmeCQ@3-g9=jG*M0D{VG4I8=la%lMLmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} zr0NzVCTAz6rxtI1!_mtup##*(!N|eL#mvMg!pQcYjfIbq=|30K=6;^7%g5bpYC?b=Dbsc{_tqz(kptdz!a+9tGW8`H#T_!A8c30+k&#(r_OUhi&a zcN-Up770`iNKo}1kdUBN51<}6M1})MrQ*T?PKXQI3ukT!apA_y+kz`B`P+HlH}l@S znR(wYJy=Rw!^4Sv_^W*R-Cpu$_~{qRZr3i`x_!iLK%2Qo7P{U}x6<7$8~U4N`$8F`EslP}0;NUrkI$aroJ%~kw6lxBQiL^=?PN0lVZ@qB!o zKTQ5zIf}xH8il9u3zGy(1T_R-4)RjN@XSEy|2~utDZ*)m*mDG{Je^vTDF_d~oSMuC z_7JTFl*l^6@1=fzNd&z@>k9<5k*~N6y1LnLS$)@n4g+yMR8dny!Qrow^Zz!i@`uW- z^c?>~DJgW*ApgPjrL+9>NCENU$S2Y=|7)Zp)%Y6+KcC-3XFuUKoKF3U$2Y~sQ-$7S7GPj_LQ*wYAVEV%Cs5e;&Sh$J-r+Y@`)Z6xkT0}m3R zMWFF7GJ8{+LL&v9Y3gP>7_H$ZFe>V{=X$_^qM^;-8U5k#e_6muB>luj!|+%Qzyi@w zKhn_+1A93mXG5^TZ)V?CL`apk5Y06LZJke#J-;QYA0tgB5OZ{ZtO)`g!IxJ=5`Nfm zA;@Hhw95n=1nUHY4iDyLng24TD$68O~W<0RMP`srdzkc zYBI-xHC`^vO%7)51O-kLh)c(?UJVzsY4Z09N9FS*Eb<41!qj8OAgK*K+OTdmx(r?= zKQWG{ZWl-MkF@~>KhAor>A6@(#%GIJX^XEGFXpyLifro!^OM1ZKiaGRZSk&@eV630 z-s)*_ll9y>TKB_nonJZh*{n&&y^o+q;5yki2t*Pek|pZ&0a@aa0beX-CE%N-k55ol z6bWB{1PxhANI;BQ5e)%OF*bpN;O}>La9CP6JJ92YC+^(1jjWcuY8c%a!)mwjQKraw zlt9!}A&V*r9}(Olc$wfJf*-A2#a;vh&?UA)th_ExfjMH%5{SN1eSmI?Rlp!XD})d3 I+>>wp12?TsRsaA1 delta 1482 zcmZ8h&u<$=6wZ3>&BmM5>!z_A>@00#~Ti5myrn*}ARrTzTod+*J> zUo+q3?&maTU?AFqzukK`_OfCuh<>G!DUu$8v$wU9a*i~M zJQW`qo<(sPKbJC5d&1I@kQ&i7nC*77gf#UuvP+o=Jc9o)MsS{B1;JN>m@_hrA1L^I zU$Xm8zZ}wq;RVt>PjHdPVwV+i#FMvTV?%;HL2Ch{B%R}(*e|+pTBY?X1n2plo)`~2 zah(YT=eLV`5;|siOjrrDgtSye_Tqt4F_Fzk7^Xb^ zh>QEM|4Suuxx()Z{`Jzcw3P}E2_w&|Rh|+ZglkAZj@anxuFI@OzFlK5LhJ%UrZ*_U zBoP*wg+*kW{I_HK$=8s$8wo5(3EKpl{EMOe316qN1FzYvHLJn+4U}=lm}P8v%mWL^ z8|wVc#1D^NBaxzjvj~24-LyR`58!}ksvoY`Y#SDDYsnB4`8&zCbm6f`9-_Y>R2zKa z_{yeeNH3`r0x?ZTNIFT-K=73%5rQwf41zdp(zOVR1RDegO+T2NW&ZQ=j82mb)JwQZ zaGI;bKZdUFb$=b6my)7gv9bqXHJQ-@r);?{tntTEPmUc-+jHbdw<<`v7prA5jHb$O zq^6YuDRTUqRBG?gF-R8s|J%@Lnhguq$xck@JW9Uec#Liz-R|IC9%>62s8-u5dkpJZ zqh*Md4rM8>MhW@v@pCUC^s6dgO<#~oypv8!>)m_l&!yxo@|0_pc2R9wZDyc!SB9Is zaiVjHp$^_h$b{i0$?p<~C_f}g6!HU-#9?ie{>D$d3Tau95+NlXm4Nti55FHxb2hp& zM-|m2Gz+7kNN7MzW=b>@?w|}i1iJ`+U+|RS)WO?)?Br*ApCDV*c5J&bX*<=b1rQ_S z1cB&>P7)0sd_?du!DWJ@2!15LgMAE!$0c@#SfwByOqeBRi9pN*RS&2LSRizwJVG$X Ia}U4qFD~+BjsO4v diff --git a/vllm/executor/__pycache__/multiproc_xpu_executor.cpython-310.pyc b/vllm/executor/__pycache__/multiproc_xpu_executor.cpython-310.pyc index 4b31776ac05a6eead2cfd3f8a35926dff1d405b5..af0c391250250035ae9881dc8b2b2271e6d9db08 100644 GIT binary patch delta 62 zcmey){h6CPpO=@50SFA&?%T*6&ZOe4Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr1pO=@50SFA&?%T+HfLX;wza+OnzaX*D$wSKPNLu Qzo4=tBR_BRXJ$Qq08tJUr2qf` delta 66 zcmbQMwor{bpO=@50SGF$HEiTQz^vh+Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5J+mG^0HbLYwEzGB diff --git a/vllm/executor/__pycache__/openvino_executor.cpython-310.pyc b/vllm/executor/__pycache__/openvino_executor.cpython-310.pyc index 79fbeb96bf9323c3d83b67cdbe0204f05d9bf83a..43c6b1f28a263d8c5882f6e152d2308a654936e1 100644 GIT binary patch delta 97 zcmaE8dE1gZpO=@50SFA&?%T*cjY-8#za+OnzaX*D$wSKPNLu zzo4=tBR_BRNhW7DJ_DdG9!5T9CPtS3Ow5~QICFWK^7JQni@7o7ac{mX#>WN#uTmTS delta 103 zcmca@`OuO(pO=@50SGF$HEiUb#-!n;Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?5*5D3ddrfDuq94d%YP;&mVZnvo5eVDd6^2GCbx>Y0jbSr#rW6& Da_AmV diff --git a/vllm/executor/__pycache__/ray_gpu_executor.cpython-310.pyc b/vllm/executor/__pycache__/ray_gpu_executor.cpython-310.pyc index 2aaa6fec54a7680ac9360957f4abef0139cb6695..e279213311e4251e15ab63903bdf08858ea6bdb6 100644 GIT binary patch delta 130 zcmaD={ivEdpO=@50SFA&?%T-ygH6R%za+OnzaX*D$wSKPNLu zzo4=tBR_AmHhYhNh!{{88v`4c&<`di4knggT%2tGH=h;X#=^zM$iTqE#KXwNw7FlV gSeh|vGqXhu6XWsC30A6%Y^Q+wicW9twvJ~404<*-U;qFB delta 138 zcmaD<{i>QfpO=@50SGF$HEiVm!KUG zlB!#fn4F!Mo?5(FoxMjuOaiErje(6z=m!%M2NTOL4o;?jY>b*D$wSKPNLu zzo4=tBR_BRI~Fzt#;DC-RfHJXx`CRD@+UXS2v1f}yTsVN`Lmh}BV*KL3k_AquE}v4 X6{0;L6}=z=WK$7XL)Yfl8m>$LsxT+* delta 125 zcmZ1zwjqo=pO=@50SGF$HEiVG&7$F{Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?5*56$_gJVGZUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS ZUrUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS WUrFcN delta 72 zcmaFL`;wPCpO=@50SGF$HEiUrVbbu_FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` aN!2Y#OwLYBPc7cOn#qfq@z&&TtnUFi>KO6> diff --git a/vllm/executor/__pycache__/tpu_executor.cpython-310.pyc b/vllm/executor/__pycache__/tpu_executor.cpython-310.pyc index 02db6b64584566a296857b8d5cbe4122b42b13cf..59a4791e18ae79cdc9d9563880ec080e70a4f71f 100644 GIT binary patch delta 62 zcmbQMHB*Z_pO=@50SFA&?%T*6!m8q^Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrB07zyO0ssI2 delta 66 zcmdley;Yh!pO=@50SGF$HEiUrWz}%iFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7cOhLx2A0Gas}5&!@I diff --git a/vllm/inputs/__pycache__/__init__.cpython-310.pyc b/vllm/inputs/__pycache__/__init__.cpython-310.pyc index 565b6e445aec2651652cba25c7c41d033e9ce53f..1ecbfd4b57076e924c54b03c5fbb65e7b4813e7e 100644 GIT binary patch delta 61 zcmdnav6+KApO=@50SFA&?%T+%&8%XrUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS PUr_if~!&8%XsUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrVeM5us>WDt=C)*PdMhEWA9Ed&xw01+UwAZj>3 htaK2OvDwFPDU(zth^+}CTtP$*h{yvG`IEU#;sJpnMUVgh delta 304 zcmaEo@hXEmpO=@50SGF$HEiUTVAF8aFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` zN!2Y#OwLYBPc7c;&Q{7NA_UaQA<4tY!NkEVz{JJK^q-4q^Er_pLX5XIA6K8u$QZvl zT9c27Hvys$}8>0LNxT(*OVf diff --git a/vllm/inputs/__pycache__/registry.cpython-310.pyc b/vllm/inputs/__pycache__/registry.cpython-310.pyc index c03e8fdab22f1f54adde556bb0b0fa5eb11b811a..8eaef980fbccb0703357a29dcc683e0be6a2872d 100644 GIT binary patch delta 62 zcmezB|Iwd2pO=@50SFA&?%T+{g;m8`za+OnzaX*D$wSKPNLu Qzo4=tBR_BRb5=ej0Eo;LbpQYW delta 66 zcmez9|J9#6pO=@50SGF$HEiVG!m44fUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5F)N=E0N%qEg#Z8m diff --git a/vllm/logging/__pycache__/__init__.cpython-310.pyc b/vllm/logging/__pycache__/__init__.cpython-310.pyc index f37e9d2eee39cd16403ca85b276413343bdaaa50..84691e35306720775fa6a500b67c3328df08aa43 100644 GIT binary patch delta 59 zcmeyu_<@l-pO=@50SFA&?wiQnuVSNLl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEvQ45dbJJ6hr_3 delta 63 zcmeys_=S->pO=@50SGF$HB990*Kp7;EiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuOf~2mp9j6;uEK diff --git a/vllm/logging/__pycache__/formatter.cpython-310.pyc b/vllm/logging/__pycache__/formatter.cpython-310.pyc index afb951e18a9a949ad31d127114f83576d2fa663d..ac687a982c2d9263cf4894ee8acffdcf15095828 100644 GIT binary patch delta 62 zcmey&_MVM9pO=@50SFA&?%T*6!>D4bUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr{70H}Nw?f?J) diff --git a/vllm/lora/__pycache__/__init__.cpython-310.pyc b/vllm/lora/__pycache__/__init__.cpython-310.pyc index 73ac80f035a00ad4108e28137919bab9074af7ad..6a0040c8ba1088d93c3fe3b43df949ad9df13b0f 100644 GIT binary patch delta 59 zcmbQmIE|4zpO=@50SFA&?wiPMqhhIFl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEogI8vyX@65s#; delta 63 zcmbQnIE#@xpO=@50SGF$HB98T(XiDoEiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNUI4FEj)6Yu~4 diff --git a/vllm/lora/__pycache__/fully_sharded_layers.cpython-310.pyc b/vllm/lora/__pycache__/fully_sharded_layers.cpython-310.pyc index 652738e2472e5dd6c047467caf53e7de744e1040..7e13e761607493abb5c4c8b51f44141ec33f64a2 100644 GIT binary patch delta 62 zcmbQ|I?I(ipO=@50SFA&?%T-S$gJY3Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrE08|JSD*ylh delta 66 zcmbQ`I?t6mpO=@50SGF$HEiT=WY+N1FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7cOf%%mj0H#Y8I{*Lx diff --git a/vllm/lora/__pycache__/layers.cpython-310.pyc b/vllm/lora/__pycache__/layers.cpython-310.pyc index bcc2b16f9d13989a3154fa2487957ff926032546..7d1ee4c20c556161cb1ff8d12782414848d2ea52 100644 GIT binary patch delta 97 zcmaFY$@HR=i94T{mx}=i4A<`4$eqrrVy<73TcBT%S)f~zSd^YxqHCU8nvrXmTdtpz xnWSG(S(1^Tw|N%pdm|w&pe{Bx7DfR^E+Az2&&0HOu7$J)GY=Eb=G_U#Dgd(68@K=f delta 103 zcmaFS$@H$1i94T{mx}=iDz`OkEFQ_cZ$j>v@Gc?dI z&MZmQEl5nxPE1cN-aL)`BIZRpO=@50SFA&?%T*M$E;$iUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS ZUr*I6_)@2 delta 75 zcmaE<`BsxVpO=@50SGF$HEiUTW7e?LFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` dN!2Y#OwLYBPc7c;%Ph{!%)!jDIi0PE4*+U!7NYM+soF)Ib(4D<4ENgR*nxy4 zO#-1?SEY~~3Ts&lVRS%wbi+)Psim7*P@tRkl)8E99^EM0w03Q!{ZX|NJKyK9?vKrq zfA{x2&N<)fp8NgBi2Qxr~i2izaC%T{e=HWW%ahi6msRJ{NK} z8CgmeibS_5%Y>TfcEv89NxI$0RtX5VdPuCwdDwGPN zQmHh2iqEK0s*Gx-8f_W+8ly(3F=~}slr#0owMLy%heDQKZ>&?+A-CxbMx)Y5B)XC| z9VAM#CaEnnxku8LY4#aOvmZ1G?RqU+bIeFetI#_&m(aVY>!4X_6LOB0E96|7Bjk1= zyR|$a=TRqZb4x^#vzl(3OX_`5BkT(Y!WB`K4bx~vy)m-Ws5bWb^uVAmJQm#<3dTOQ z{572%;P2UolB}jw!oQS#l^nR@_=xmnMWtQjlsulfK#mY5NA0^TT$RGEJRo-#4CXYyh74a5VF{$CID?dGFHf=!i z=BkS(N#Z_RUhItPEi;MpKwi0PyVt}bV!V{}eKatyR2& zhXT>Dc&Z*^sz0KKq7gO&_Co+iz{!TDKv1Kj{%FV_(AXT$EZyOJ20S{z!>Uml9twrW z*irsOX(5^7FP0wWr~4gbo_Ca87Wi>lIXTAN<((PlU{#j@k>NZKlozKS7Xl?hd!8RF z-%O74J=M9f&&sb6KGp8X-6*Uh!Wu~z#59#ESw+4wN#b$uN%>ns$ENw@s!DR2UtYC^ zT;QLt^5lF&sFyM_LK@ZCX7GE8`&Qre;F2r2PJq|UT7h2xxB@kebw0d|*q#Hq8Q=uK zG}kIVPkROEdVp)O-IawzoVG`H@RPpz-sgo@$r=f3YLxm78dU{R8J-2{u{i*!d)$fD zq@z($?!BQQb$K2fGq$;03HC`5r^UHys@@W#-vYhe{C)~ z#Ybz~?U0o>IT6%S3E!?AAZK{t+T-LYer@e0&jHxT1#lXim&&>1EGCXD#;WVCn|9!^ zyaj$Y0lrw41L7?JjB^3l3j&nXK{Z1Cx;jP~dmFSE=^KK@<-|+D9tZVL_=bkwG|cZZ z$YS^!mX}~d8$re{J_-zDNQ4IB9sX{^a`IFDX~PQnA}FHR|C+|bg#3!X*))=O6tukn zYXEit)BxO!^*0X@+bQ4}Hg5eazuD49ZpEDIn~60lZ08AkhkvDY*CXhIAwmn{W}ODv zC@h9_y_Q6Ue*=m;02t#hfZ@5n1%~I|=IL#lNQ^()cD^1f^;IzS0Za*qTbLRgrtEj1 z$OHH}K$8G(O5%_huWxTngWy;Xz(u$g$gBL>_H*`2p!k7+2ZQ)782Mnwohq0p_I&`H zf2?UHi1*z#1LBVXeuTP|t^v>QLBuP-% zQsh4haepDdTuW+@^jr| zWR}|s9lWlmSKN7rdip%y278-;2k!^Q`#xyT@{fA9Hvaj61N#dw>^j01JKq(CCr#oW zgwU)~y2(WH?z6jaQtX+HZnAXUzV?V(^Pl4wEJ_pytBa+>GGSS;-`@q7vwZ8Omqm>~ z+jOt^J)zj%EnfTo)pOk8I=5{8nz;O?HwU)i9yo8XZ#;uhBea+LL%K#IQHGIVAO0q+ z53+}MGcGe48PTH*GsIl6fLD3bmZNF7A)fVj_!{s}wj4?MA;jf1#a;7TU3{U}O`zS0t+m#EUt(ME5afOD4^hjhlYoWnNF^?I}6_ju6~zg?(RmZ zSa2kdc2ux8#wI!u@-QgYCfST8(=^SrrZH(dP12b@Hf_>0(WcYbu`}&IolfmNXC=vW z5@-1B@BGfW=bn4+#KQS_CmW(4tHqDm5DMmJPQYZQ>Mh?rRxh#+7F&A~A zrW*OIfEKVqTFBhg&5CFd^H2{fro|H&kZLSpUg|||HI}jxT7o>ySjI|eDO*mLvoczS zn$1|j%4s>PpcQDR8$Py@u0)<;RI*ic6|16EteRFcKlQU3T7y2jv6|J=T2@Ev&~_MW zSUsJnMXAngL(CG9q87iw;4yY*bXwa_HBjZ!PpJW}&C=xtKiq_+(b ztyp*N+pI0ow`gAZw^aU>=w5A^?$Fx`OD%@xi5ScLnH@L zZj&BI)U=Pxs^gA1GDEl}>fC1;cZ^%KtmDez!tpH4S!g=!mcKdjw`e?THdo8l)H&s_ zM^g_Mk9*{pigB~1#!QlV#X46hsTF%%#i@D6)B8<6SNw?UBQv2wcbCVXbmu7~DyD4( z;%(0}#R^gHSj|?FK~jiHY!VgVcT&u%ViVsjzOH^-9#vi|-s#PWN0#hYH=P9ggoK23 zFesN7ijF00MwkZ!5hEOp@T1_L0+@!NEOdoNH2q*88V-asJ|mWv?an(65t|^ws_FXZ zV0d(l3o%pXB@^PgvgxEBrol9P2G~ilYsF=9Qkcuj$th7;zS;gP$Xg`%6zM%wUTS+( z8ak2cyqGWVCXb5SJq2-l#Z^Ks!WweBq(3J85vwH1q|Kxfr?~Aqr=FHJpA@H7R+Bk# zZDr4ri&CJOLm?iC28Ot<w93g06Y#bDZW|tpY+Q>Hvn9TAF1|2k#qj@D;|>y&5Vs|!KfZ!dNe3WkmEeC zzQt~^nj$--y`Utg{1MD1=4-C!L*9gC(9naN;|Lsk37c_lb)|ysP1r|*OxFS|ti=pH z!jFg#>RM}m07Fv`1o=p4WSD;orh5XQ2Vg0H2LQ9;S$I%vU*q-S@?d4uKCDLrk=Q^o zEiZ=XbK=CBjZRpWFEv?fH^>i*57+dQr$l}IY1zwP)^GD10oesG2f=rHc{f<@A9*9* z+3>Qm8;{RVA?_N$=fm>Bd>sHwp9OYS0<{eUBYMCHj_I7g1u7Q*s$>cEfF2s&8|6bF z|6J@|*E@tu{yx|f0B#6Nfy>OBCG};0VUL?205|q)z_7Ap!C<~Afu@B8urBm4jio|WLUB&+@{2v8TtGT#PP3-CLDI)Lk9 zS=%=9f?#bI8fQWH20$MG^dn*6!I5E|CqRJS@LvI7YtoXFydZiuwx&aIyc1vnZXdZS z7B66AHqOZF!m_`v4z^e4gf z8o-ZH^KR+){1Hri9n9Pb9Ft@Mdmn;qARbbr`GHv2av!-Y??=Ay-(wLa?E@+XW1KkK zzGvb)FboU8qkln~iIjnG*x+&Sz;gInfGYq{B!2~<0N^!%p8z}sum|7`0C zo)>D@_NG5C2Jnx7)qVz_XZ~1f56Yh418Fs7C<<}k;UC9mx~j-myvpxx4c2`&HHQSr zMq#J1jo3155$^pn5OQ7&ZM!IYo_)_>N0Ef_w6b^e%P+p5uhd^+?Q!a$GGg9-A2#J9-{T$Amc7U*$QN zCohY~dK<|P;h>OL#Essc)qpc$9u1A~$^Xx6maobe+KFjD74P+($--i>oWILKJelv7 zczpW<>v1<6prZe8!0^m`3hWlZS8mfy@%0_+-8Ufy--HvurUCALD&srm z$&+9G7_eW9j{aR_JbtGCS+W+lvjOB40F3~6Nsa--lY&dQ4Q34hWS0NkfDhU6d++}r D4p;Ct diff --git a/vllm/lora/__pycache__/punica.cpython-310.pyc b/vllm/lora/__pycache__/punica.cpython-310.pyc index 1b728151a58c690cfed5aa7366f657e5de7f408d..aeedbe9493a6d132983e7284a864ebae27c916f9 100644 GIT binary patch delta 71 zcmaD`|FWJtpO=@50SFA&?%T+%&!%FoUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS ZUrwaa7YG0V delta 75 zcmaD^|F)hxpO=@50SGF$HEiV8XVb9OFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` dN!2Y#OwLYBPc7aY$5z6_%*8CQ`KpkJE&!(y7!&{i diff --git a/vllm/lora/__pycache__/request.cpython-310.pyc b/vllm/lora/__pycache__/request.cpython-310.pyc index fba3fa25fb46f7dfbc8356f75ebae6fdf1b09766..0d466eefc64f43bf24342ac88e166a6599fd0c31 100644 GIT binary patch delta 62 zcmca9c~z1-pO=@50SFA&?%T-yoJGY#za+OnzaX*D$wSKPNLu Qzo4=tBR_Am6zhI=0BBVd$p8QV delta 66 zcmcaAc~g=*pO=@50SGF$HEiU5&Z1$XUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(FjCDUd0K9k=*#H0l diff --git a/vllm/lora/__pycache__/utils.cpython-310.pyc b/vllm/lora/__pycache__/utils.cpython-310.pyc index cf125f875cbbb815b02f721ceb1900e6425fac00..76b259e1d6f96312169a11b507d43a003c25ba96 100644 GIT binary patch delta 529 zcmYL`&2kb!5XW~nyUQ+NA+Q0me3*nlLU3^@Z!-ou*wH;GFm#9`E~#P-8EJ7GyRoDmr<0r^cj8mI+MHTWaY5Mj@l5HT=B>g zpM1$tP67%fq|mmsw^g3<`rc5RQlNrF6iJbaQlgUauG*3^l?{8UA~D5=eYGuBsv6Fz zn$)RoI8Zy1P$CU##L}duw5TO*Y8x4&kygHTv4GeFphmuliTc~4rZPO$4 zv4;cn(8UoB(LsV18fc=8{aKMR_z19@Sc!$lTzF-LHXm_>^1Bfial$23c?&L=;UP{e zuH2hxfn#26-+1)oZ+yU2r2hu~hdVl27BYV(Zu5bCarvF>Wa`}f>2ubE7J?(l(*J?E}jFxG=TKGdBT>zd=c-P3F- z^K5=GA1==p=U5IW@?j<;`IxDTx7qw^IlFwne(isbqL+&|`rp5M3!LNA`bT{0{05~5 Be~AD9 delta 526 zcmYL`%TgLa6o%){a2dn_2L=#DMJ1r)h1{$x@))VJL(fkz_7O|W!WF5C`;@!92UU5G zJVYKKRe6AP+Emh;{`!3X`8WM*_;VP|qNrf$bN}trlpmv$h0PW_$`O}b@yHXOdU7{Krg6 zT;Pm7bk@jkC%@NeONxT~WH*LC!i8>TeHh?|CL-Q3?zXV<5P$4A-x@(u?#c5dZ)H diff --git a/vllm/lora/models.py b/vllm/lora/models.py index aaadca9..8805d05 100644 --- a/vllm/lora/models.py +++ b/vllm/lora/models.py @@ -2,7 +2,7 @@ import copy import json import math import os -import re +import regex as re from dataclasses import dataclass, field from typing import Any, Callable, Dict, List, Optional, Type @@ -263,7 +263,7 @@ class LoRAModel(AdapterModel): new_embeddings_tensor_path) elif os.path.isfile(new_embeddings_bin_file_path): embeddings = torch.load(new_embeddings_bin_file_path, - map_location=device) + map_location=device, weights_only=True) rank = config["r"] lora_alpha = config["lora_alpha"] diff --git a/vllm/lora/ops/__pycache__/__init__.cpython-310.pyc b/vllm/lora/ops/__pycache__/__init__.cpython-310.pyc index 9ede1991ea6975fa75586088bedd7503a57b82ea..85eb3c184325a8abe767c6100a413cad56d974ca 100644 GIT binary patch delta 59 zcmbQoIE#@xpO=@50SFA&?wiPMqhhOHl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEogI9{}@P67T>3 delta 63 zcmbQmIFFG#pO=@50SGF$HB98T(Qwo+EiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNUI4*)-!6aWAK diff --git a/vllm/lora/ops/__pycache__/bgmv_expand.cpython-310.pyc b/vllm/lora/ops/__pycache__/bgmv_expand.cpython-310.pyc index 217f22f5cec8172f3dcca3f0b4c66e0fade8c049..7e6e3cb3a254dce5684a26e04179fcb14473168d 100644 GIT binary patch delta 62 zcmdlbvrUFOpO=@50SFA&?%T+%#HQk)Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrmdq|c$pO=@50SFA&?%T*M&Zgp~Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr-zO06;kt+5i9m delta 66 zcmX>kdrX!)pO=@50SGF$HEiS-XVdV~FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7c;##X}t0FdMq>Hq)$ diff --git a/vllm/lora/ops/__pycache__/bgmv_shrink.cpython-310.pyc b/vllm/lora/ops/__pycache__/bgmv_shrink.cpython-310.pyc index 0f980911de5c23ab72cb71523c9da80512d4f0aa..3938bb801de3b546c0b7d9a81989c986e7f54f76 100644 GIT binary patch delta 62 zcmZpbYLw#6=jG*M00P6c`!;g#VpVa_FUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E QFQ_cZ$j{sSmQ{is06cmWD*ylh delta 66 zcmZpaYL(*7=jG*M0D{VG4I8<4v1+*JmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtI1$tuAP0F8AOI{*Lx diff --git a/vllm/lora/ops/__pycache__/sgmv_expand.cpython-310.pyc b/vllm/lora/ops/__pycache__/sgmv_expand.cpython-310.pyc index 08cfc9faa3dac57ecc38f90d4908adef37bb1ae9..1e54c33948407a5edca1af3847ab7e3dcd212a6e 100644 GIT binary patch delta 62 zcmdn3vR#EcpO=@50SFA&?%T*ciCx7(za+OnzaX*D$wSKPNLu Qzo4=tBR_BRQT8$}091h#zyJUM delta 66 zcmdn4vRj2apO=@50SGF$HEiUb#IE6@Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5AbS}X0H)*>&;S4c diff --git a/vllm/lora/ops/__pycache__/sgmv_expand_slice.cpython-310.pyc b/vllm/lora/ops/__pycache__/sgmv_expand_slice.cpython-310.pyc index fdc90b3ea4f003f04e3a5262df6ad2551d9560d1..51f1d6a3469ce1be2d6cb99bafdaf8538e278a2c 100644 GIT binary patch delta 62 zcmbQMF;jy(pO=@50SFA&?%T+{jzh&wza+OnzaX*D$wSKPNLu Qzo4=tBR_BRLk=5m08R!JlK=n! delta 66 zcmbQKF;{~-pO=@50SGF$HEiTw$D!e+Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5E{6>_0H7rmqW}N^ diff --git a/vllm/lora/ops/__pycache__/sgmv_shrink.cpython-310.pyc b/vllm/lora/ops/__pycache__/sgmv_shrink.cpython-310.pyc index e7f1bfa8267fa39d50e6ffc9eb02076b92a278b1..00b0ff3e88b5e6d1b149efc72a6cb2647a0f61b9 100644 GIT binary patch delta 62 zcmbQQGFyc^pO=@50SFA&?%T-C$f4q(Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr;M1& diff --git a/vllm/lora/ops/__pycache__/utils.cpython-310.pyc b/vllm/lora/ops/__pycache__/utils.cpython-310.pyc index dd898540548e335b05e5ab5b514d79cca6af4c10..762bb6851e16706e7c1911ee9e09a2af04399136 100644 GIT binary patch delta 62 zcmeyw{f?VEpO=@50SFA&?%T-C%cx?dUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrtbX*D$wSKPNLu Qzo4=tBR_AmER!BP0ADc_8UO$Q delta 66 zcmX>ubXtfzpO=@50SGF$HEiU5#i-$-Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(Fl1Yyp0J7W_DgXcg diff --git a/vllm/model_executor/__pycache__/parameter.cpython-310.pyc b/vllm/model_executor/__pycache__/parameter.cpython-310.pyc index fe4df3781bede569a6089a2936768276e7a22c1b..78a8ef1d70abc3032a5191ed2054243469e12c1e 100644 GIT binary patch delta 171 zcmZq9_@2(4&&$ij00f3>_if~EW>Im`FUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E zFQ_cZ$j{rnjpZD-gbq*_7ZVpF6Ab=m`NzY|!nk>!z!^pvBd9DFBTxksR1Hi;htPdl v0g$z93`~qXj7} zr0NzVCTAz6rxtJC#Bz?CQEzgifG`^uGt*xdmd!H+&M?ZE0L|iJ;$j3rCMG6EF#ON* z52~g?=)SA~4^Ryo0~1KaKPE=D|C@6SxEUGUCRZ97atSc9{AXff`Nzkyd6S_l69DkQ BDu4h0 diff --git a/vllm/model_executor/__pycache__/pooling_metadata.cpython-310.pyc b/vllm/model_executor/__pycache__/pooling_metadata.cpython-310.pyc index 354b163d73ac104bf8e509d11e316d9988d3aad3..c03a4f1c274988316da0ad703cbb28eac8c4c924 100644 GIT binary patch delta 62 zcmaDU^i+sDpO=@50SFA&?%T*chgrp2za+OnzaX*D$wSKPNLu Qzo4=tBR_BRdFENH0A(u`E&u=k delta 66 zcmaDV^iqgBpO=@50SGF$HEiUb!>r-2Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5H1jN00JyRiJ^%m! diff --git a/vllm/model_executor/__pycache__/sampling_metadata.cpython-310.pyc b/vllm/model_executor/__pycache__/sampling_metadata.cpython-310.pyc index c02d2911e80578417a65f46f317b8c4e1936d4e4..d919ff254f24a7595b333dfb5ef90f30698ff04c 100644 GIT binary patch delta 116 zcmaEucr}qbpO=@50SFA&?%T+HlUc<_za+OnzaX*D$wSKPNLu zzo4=tBR_954~vm3HwP2je`h`axiY2{9n^jfP;~Rkq3wcfTRGBp6sV( P#=^tM#kjdkE1V4gBz+$l delta 128 zcmcbb_%M+>pO=@50SGF$HEiU*$*d8eUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?5(_gT+Xen~jO%KNBOP^0&8~`DIT-g%{;g>##s(B(Vd7zAVH9BG d0$Z2$lO delta 66 zcmcb`agT#LpO=@50SGF$HEiToWYlocFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7aYz{tf60FkQ{eEE QFQ_cZ$j{rX&Ya2w07AhN} Ur0NzVCTAz6rxtHkW=>@S0F diff --git a/vllm/model_executor/guided_decoding/__pycache__/guided_fields.cpython-310.pyc b/vllm/model_executor/guided_decoding/__pycache__/guided_fields.cpython-310.pyc index 8db14b7763bfa99979e2b3a6f1a135616c96af14..fbc73927c1ce5b7d369ad63001e3f856f2a4b948 100644 GIT binary patch delta 62 zcmX@kdzhCypO=@50SFA&?%T+1!K4zQUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrV!Z delta 66 zcmcaF^jL^HpO=@50SGF$HEiTIWYNgdFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7b@!1A930HvfA-2eap diff --git a/vllm/model_executor/guided_decoding/__pycache__/outlines_decoding.cpython-310.pyc b/vllm/model_executor/guided_decoding/__pycache__/outlines_decoding.cpython-310.pyc index 8de5d1113e6e08c878d320d8ac61bb36b8e14768..da22e84ae19bbd19a6a5dd77c7766d976daafe87 100644 GIT binary patch delta 288 zcmew_^;?QNpO=@50SFA&?%T+{fk`Dsza+OnzaX*D$wSKPNLu zzo4=tBR_BRW2QUITv6<4r6r|Bsl`!~PqN7fM+pE`#}}36&M(xRrTz3Q@;vh+omSmR6 z6FDR%vvO}$0ZV|js>5W9BtR@MAqirsOuol0%>lAcQ?5vPG9!->zbTM&i>WBJhy|oT fXR;H|40&@9QxQaHf(R`Tp$j4uK!nQVpFC{ zlB!#fn4F!Mo?5*5KGPj$%UkSer6r|Bsl~U1LNba{6H@~6^K)D)Qj<$d@{4YW}5=c)ii7zV6%gfA5kI%`^FSs@N3)>z>-N_r-BV{yzwijsv2~CzFDG*y4L}-Bs z?a68!v5b0~TR18h8TBXs<-8*R5eG?vv?Q}k?&Xk}%*ee}1uOy9stuDZk^r&5gd~Wi zG5Hp^GzZ8&O}Qe~$$z~J^p$|1_%NAJHI}>~9KCIbw z(^QIz)LyAn25|r(UP2<3;6Uyixk5PU?J9{g zj_*XK8`SHJ-?}&NgVOQqdeDmC%|czeP3g-GC)D9*`FhK*1udU4st5igguDL4W--z| zYhAYkKWuqSw{$m%^k7w&Heu7ULFQ9EYy>Tr>OLs-8q-@LL|SvA1_X|HD~y1(U5EKm zI3;xTmzff@Yg6Gn;Poe)j=bh{(`imd7O%5t@~GEpcn7_;Y1gSuH`k*^;ETP9B{H!U zCJw4(OnklV)V>P18aXgGeReZ4!^nyl9|B>Vc0$Jo-nSXgifn2>*&~jm^jr>=sVKP4 z{E%-KG&NP;k3o_arDnC84+Fz>gk9o6>P!VUCwIt4fQmKKv@O>)%^8vD`rt}0YIh=Z zAq*nS02rxdh#zo%1SOpqlEOf|2rv#$h#S(BoSIH1iTXH6a*ugYT+IxNytY9`#XarN z*)o_^)i`fj)M`ei+`My(ah^v-B2L(D$Y+7(ClETz$t|Z%tWUk=P*&UO>8_Dkx#8nz zdP)XpC;c?QCW*TtP1g!T)9mCf^K`_6^i1t2`o4g03?R-(TaQ7HD9@lI5k{Q%qk*gt zE+gIJ?7x9+hDCg4t8-`~D}x(*N6co1$Z@E{205|yC^MbNOrXIeLZ8U@R zZi~%x4y7)j?lc1CS539EI*S5Xme+tX(jlA`&w@$e?TX2DJ8ePNTjImslh%K8nw(aPfAd9b@;?3|$g5ghn0s|$DX2S9 zc!38t3t@Jkt*iC+)^QAmXZcHD%iF`iPa>T~=LCNl=?e%l(at_(J+b(oZvB+6kyoBp zho47l*%mxPancT&>kvs!e<#xa6z40^DvUojkM5myI{9MUPv8mhF4h!PO_D(}lH}*b z!$Lo_^7q0=Dopjpz{g}ol#3H%%NS_|AWlI~;DXvD&txG7xFo(SmdKCdz2dLndbKn$ zjWv+VR|$U;Xz;oAMASZ~8K140l-U7g{E^ryT|6w$CN{9DwvFF@>hTs*a;co%u>3lE z;`vY?p@8p?z@hfWs~IS7qcjj<=yT*Qw=4jx7h!=!v-H zhpPei7!Tz*8r?Ts*PCMgjnGI+%t%4|Z-5VAJe=$})s`58mzS1aH!shaE0^ZY^DE0s zi|6JqnRBP+&dkSMYZmvRC3smi6)tZK9O(A+$O-JsfTUy*wOKEqEtkDSz&1Ptp!I4* iBR%jPCYp-xJW%*IW}6@B2LWoAw5Jdnu0o7tV2o%zk|{(a_P zCeur&6B7LGe)sw2c>O`9MhXumckdC&mTb)#a0m54x2PB0l3sGldfBb$6|vXnRNWzc zNXQAN<__z_LQXn$x1l$Pv>@3jJAGfW(|fW$0$Rq-f|jKtdog_!^qidsJx@nLKMs1q z?gzbJ>^H`!Y7f|hUlF@V8|$)Nvdj0CJ)*y2lVzz{;hzyJMuKDf3EAO^*ss%rP{M)4 zhT!L)PJ7#9ZKr3MPTT3MwYPTt&0hD7*3_xC*YWA=Tc&l}+@Ky$DesW6!xd#pCdc`g z>ZKDUaMv>%)Hk|x$2UCR^eL;rVvy)~oi6BIi?S4dqK=a>UW<=p(zvPmz1y_wu^eBF zx5}?!5XH1@quIx*ps+eZgYU<$Rxm-4C98oHXodk#-?#4iXkKn#0CIH;qx$rCS~M=q7eDHLNd?U0H06Q_*3mJ8R56`HNM|hUMzxH zQx0;5X`5TVAqwc+p^Rm5BNoIg$764T%w`dyBSqQ?13B8*?$~tY@UOl#GAEKgho%=q zfUxkF0S-ve2cpfC*5|Anw9Qg$S% zOK2i^z!Yx4=M?}nNtP9&5*e6~frOJ)zhPqkyo33Qu8DDbD*=IRv?gT#lX zvrVrs26X3f?;--$*Hpu*uHu5A)EadCgx|?sFpt!TAv6R$ zlc@-pF%xAAGT%lu;yo&H0XBN@c_{!*%E?$>LM}dI3)pCxo#kiq4OJwF4IiGJ!%$(z z*?E-Fvl(OaC|^eq#?fJdO62{~;kWrU^43MP5m~*9lIRHDl|Zq2Te}cRjCmC4e;9bo zSNkUxE~9&NPE-`eeF&e2k5SmSDyb_B*Z&v+Xp$iAnmZm2>FnXp{a?#4%~tU-S?14* zCmZjB30npTROmyeyKz8{6jkHbN;UEWUoZUzUi0OXZDd0v(j-g=8O&E+EQMDy*`=Qv zHnn;-Wxw!m%J0pH>xlho%AxT`FFjUKLe_$ewP|)Y=nKyud82ZfEOD!HeMz)hLCffN z-$WlZJSK>H6kZ&k0imKHxXErI2+DA-!zsrm9z3j07Eoxu%9e0v5n+m-uP%@l|DrlQ zp%;4FzSHSaueI*EEpc5%>lwaU;pM{X4)50Q)%ragc3s=rwau>IvBWs)DW92LZ@tG{ z%Diwm@ugwnrsE)r28BZvwN*%h4Qz>% diff --git a/vllm/model_executor/layers/__pycache__/layernorm.cpython-310.pyc b/vllm/model_executor/layers/__pycache__/layernorm.cpython-310.pyc index 0f09c8c1a9811662c40e68b0f5346d2eac333e18..e77cc9c9ee384733f0d75ae61ba3d09040cd2eaf 100644 GIT binary patch delta 62 zcmdm~vQ>pUpO=@50SFA&?%T+{iCM*4za+OnzaX*D$wSKPNLu Qzo4=tBR_BRQ|1sp09sfS;Q#;t delta 66 zcmdn0vQvdSpO=@50SGF$HEiVG#H``3Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5A#(^H0If$A@c;k- diff --git a/vllm/model_executor/layers/__pycache__/linear.cpython-310.pyc b/vllm/model_executor/layers/__pycache__/linear.cpython-310.pyc index be35bf42782f589eb92e40746ce35b018385089e..c1cc88f613aac2fbd57d4ebf0cf2d89873e69eed 100644 GIT binary patch delta 211 zcmX?coAL5(M&5j0UM>b8FkHJYhB<|yl%Ys| z@<$^!HMxgFY28GGW!XAuTn{$Ns>x!uWg;;o47=;)G7`YhvnD|(D7+IJ$J3BrV gkkbLm3Gng&#hLyyF@fZn{;~Y#b8sNB|&v1KE#8moqnera)$eolUJVvc@JW|DqEWl2VUp0S>x zfqrpjNvdu^Vsdt3dTR0JaMnCtjR2tD8m26U6h=vg6sByZVm>&JIh(0Sp@unyp_HLW zV)AbxT~-#qB1VSEM#3J9GMlS~_v=ci0d=$RurLZS3NUgp@-gwTa4|CdXJOtP;P_NP fK@TV^z{>-aVfxR+1X98DkL5QX7hF|vP=ho8lv^-X diff --git a/vllm/model_executor/layers/__pycache__/logits_processor.cpython-310.pyc b/vllm/model_executor/layers/__pycache__/logits_processor.cpython-310.pyc index bf46f27a01aaf8657413a0cae989b586dfd82be2..f996ecf11a7103e0b672aced14bee485c09c6e73 100644 GIT binary patch delta 62 zcmX>qcTkQypO=@50SFA&?%T+Hl|>~;za+OnzaX*D$wSKPNLu Qzo4=tBR_952dga?0ATJEA^-pY delta 66 zcmX>ocT|o$pO=@50SGF$HEiU*%AygbUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(_h1He|0JOOkG5`Po diff --git a/vllm/model_executor/layers/__pycache__/pooler.cpython-310.pyc b/vllm/model_executor/layers/__pycache__/pooler.cpython-310.pyc index a97b7520e0448e7e78d3447684368cea896d95d1..dbb2daee7534940421a0e5b91e5e6fdd1120fff9 100644 GIT binary patch delta 62 zcmbO$JX4rEpO=@50SFA&?%T+{lTpP(za+OnzaX*D$wSKPNLu Qzo4=tBR_BR8^(?707f(v UlB!#fn4F!Mo?5*51>;6`0GGoR^Z)<= diff --git a/vllm/model_executor/layers/__pycache__/rejection_sampler.cpython-310.pyc b/vllm/model_executor/layers/__pycache__/rejection_sampler.cpython-310.pyc index e99e319f5d2dca551bef2c3dde801c8184805613..c6362a4a530cdd7e90c5609f3c8ef229720ca2cd 100644 GIT binary patch delta 62 zcmbOmH#3eqpO=@50SFA&?%T*M&8`xxUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrJJ{Ln zvy-S1RV6qBhlhj^M@|vqfP4dl#04ZI{(ct&YQRU zOZlg=;hE-eME=cx^W(S1$C?OwUuYMEo|YlXaxn1v6$3IMQHgh`=5(5SE@kC#KSGv# z9ITYOZNKC<{n>7n?z!FBa(lbco^S7#TFs4;|DfCOwsV44r~6NUw;P~@4|O>u@F#y+nd zE}BGMt$7j(3)=&92HFPZ5YS02`w{}v5|u%>z2P*%$1cqyZuL==DkyT*80SyoGh(6l zef)QET5XiUB(;%pfPHO~a)^!rYRgklFY?dBQzs`N7XbJO24zXTjy)XOc^UDuz%(B- z<_fSE4EbKik?!33QAd2oD9*t7a3Uen+Nd@v5+W)8Ga{~~BRR}k23`d&OYDna z$Z=||YNz8kp-YsEu5)JepYhiquK?=OPe^4CQI4(DbK)v5r6#lMNWKeLeH3{o^^r*O zL8_2f`5Q>x>F3qVBA3#e6;p6ajG!s@ zh3d0wc7oo(FJX$Bz(qiLUV&O=d(5g_kTMvo`hM$yvMdXxitscO;ZnGZ!0h*nQzZ&d zV`1g+N_t<7?TJT+FUh7%*;=62-JNDFe80ncdU66E`Fz;S<5=byKz$_+?W?k^BJn=( zJa8Y#0(kuiC!#ljwMgVqgr0>w2iyeI?Y;$t%c1uG9EWZJZ%fFRM3rC*0S|yRY6GfV z!cpxJi2HOJL8}j(Jc!-(XtzrBzvO@mxefj>mszi4&eQsbTx8Wv;cS7v?rwEFqAtSs z0IQF~rfKjWxwVOg%*gv!-vjMh_$*Ql^T+vCzO1Vc!zzE8KPB?~U4D5D9ZSm3Hk2}@ gD)$P8>ie|-rA(=&xr^ZAOHXW delta 1579 zcmZ9M%WoT16o-ACWbF7A=i#(*qLQSTWGWITgw~`9Z3=Ca(3U1pA#hQLu|07d#-7O; zyOkqQkXW%`QC*~p1xprLB3ES%3lRUpuwVx(1RGeef%`iX^5{tO&AI2yz2`aeUE#+< z+({;5A$7H%e)3KH^ROs(z6>u3tzW5VNcvrCYcNw>p&0e3YZ&<-JS zBcpLS9oZ1`vK@JR|JYR$c0N-b9vrN9(LCg7U`9dLh>v{09Z!!1QM?TO zMIa~p;sHeuzo+R?d7Boc+jm1;lTZ65FFmv4 zDz>cv*Axzf-)k6U+w?rcIBX7V>oS%8>&$BqUk7*=UQm+WOJ`-a|D3ok7yBnOZ^QTw zaI)xb|EHHwZ9VMwwi@1U%d++?Un9%4%%}f}(9;2|y?44dAANAKN0QZZukTw_Qw; zwcDzZaH>;ajJh^0Vv(F(RL2S2o!rN6>_c|2AB^0+#%n ZTY$tt@km)%E(7p(BA6g;d1LgW{{Rt+I{N?s diff --git a/vllm/model_executor/layers/__pycache__/rotary_embedding.cpython-310.pyc b/vllm/model_executor/layers/__pycache__/rotary_embedding.cpython-310.pyc index 4e5f06b236cd5b0881edc8678e1fc3dfa419d30e..6eecd9e649903f8ff1010add48de1b3532295a8e 100644 GIT binary patch delta 140 zcmbPpoN?N5M(%uGUM>b8FkHKDBX=aTN|1g@Zh?M5W`S-=Vo`c(iLQBWX-2MLZn=I= zW|DqEWl2VU-sT?WOjBkKW}eMIECRWhIT(31`#7(X;^oN6&r2`LFG#(`R9rflIc^Rg p$Y?eOHYN^6mVazalh?<^u)PEd6}{Lj82^BgnS+IC^OuAbOaKAFD+d4o delta 146 zcmbPsoN>-^M(%uGUM>b8sNB}Dkvo!EBTT=vxJW-IKRGc+KPNLuzo4=tBR|hr&(J`> zII|>Gw;(Y&J25@AcykAHrYSQUGvDSf7J*#MY>a%HJ)Bob@iG;c-r~r~&r2`LFG!vI wKX#4)572Zr1~w)(My9_kjBNiWuZ)XfdjS+Idbyc9{sAL18w<F@sU zd0x-kO-;klG+0%e&62}^o_9wFt!A@pQ-v0ZRm8$EwN~0T3GH5W+O$(3;1wtN&a~XI>eEII7?wu?Jl^ezg^n~@CDlHd@znX>dN5)zFgM@ zU*Yd{PB@RI`YO9= zjckl8QiFG63p*#AlChAiDeM@fqXo{c33XL!Vc+7d##Z@DqhA^#tLaPOqj%DO?A#&BtIn#5X4qq$Gc5W!O!?a^A7kG-)NqIDScndN&|oN zZ*dt-cgXWDj%{r)O_RK#Tee-vExSazo$xV7X<>FDX!_Z-X;KFWgP0$vcYaQCJ3(Z5 zlGIsj4?N?%!KL38Pb#c07>t6>{DEo`N))Dq|yk^YFNgU-uS|u4I$s`#d zZ_Z>e87&|IMt0(g9N?}%FcJ)ehX|6sV%I%@o49!QDChX@Vpp2diUwy$iQ^@%Oh3Jz zB1~YuT+&NogekcM?&D>-(|VtBJ>Y0J?~f4_=3-{jWkCGN3^8~3fpLxB?987g;M=6$WC^5$Pfruop9C^R2aq4EO@ z^IABr6I6RKk1bu6Jq^?$`~S&`Yh$N+Cc-d9%yDFFQDv_d)YLsnG#C!C0f-Cwfy?;P6eFVgP7dJh7zr>xJB*Q_%6rqnGPBWcOCboH&6!poT PCCp&NUZ`K|yA1yTD-5Ht delta 1531 zcmaKse@xV69LM?Gef#p`I3j+?M5H8~-01GaA{>H{gUmZvtymT;j{{C*(EWJ6cMz77 zW$T}2n|=Oa){3@P>#u}wfo70orcSL~*6KD}Khz|Pn7Ygm=y^YGT(#A0_uBjUJf9!W z=lSs+xkmf1ku7AmrzOc>|LDN5EhVL-(H%2{yC>A{?{W8ZwYkIn(QTpN-LA6LZlfz2 zaEATu-TuyiVOFGkSwwNuURq|!dPgP@9tlUXXo4O#A9C)s>hD6o$1|(nq6u@b>>g{~ zC@f>ZehG(7D3=dmH~_p43;{0z3`_zCfe(Oj&MeeHd z`3P7k5!a%jaJLxcH!4euRn5CFm8kiz=!1Nvve>5TwZL(li`E^b6XwtBvWfQbd{qH` z%FC(?GfrZ54=PYZ9N>-BTj-4WW_26UDNe2N&}ZCK&E!Knys^ zmfDI;wUQx>RSRG6rrKdTYtGg#wbBvJt$Tqc`1QJ_?!(e0u5GBluTh+U)MMcee>5Oo zLn!uCsK&7(N1FJSr|O#MJ6>NOp(%4;eMFPViaeX?7vAnM=mJlBoci~O`kYsISFQa4 z@<%}J#|V_#Lj&q8kXZN`48y=V9`NSV6u<1P$(@Gb6JQ8XCwPH>^FBa7@!E#R=vUs; zaE>mUy^YH)`eo_j(0RyPXpTKdR{aV>uJXjg8}vUQFPi!z-z1lQ1>FuDl5phR>=r%# z?S|~caD>xZYIBc6J_@KT8=;P|ujTRFi&8e*Be8(!_jLt3y4nMV7&lL~gvj|Pyh?zl zC3ahrl8jfS&{k*`P17|Cr7!3f-I_v{1fp|Eioc-hzmp=f+RnvX@$_KqNncN>Gb}=FhFIWMzmqcf zMgN_5m@;iVRbG0Z@CUmMu?l4rREszGw7*lo0pq;6zU?@zNkRIASL#29D(I4QAJC** znw;FehIh9Va#gF-C2Wh%=}`8?VWJ>npGWMiJksIXnP@$6anEBlnKIU~9)I2I(H5kg5BYPrvd@*TF2udk;-LE-Ua<)=uK;oL*}mVYVFDWO oUcGpso}GG%Q?Ts<@Qy@3pe{Tvuuz9P2ZgnZXMkDrn+a diff --git a/vllm/model_executor/layers/__pycache__/spec_decode_base_sampler.cpython-310.pyc b/vllm/model_executor/layers/__pycache__/spec_decode_base_sampler.cpython-310.pyc index 879c57f616946b2023d8378b271bf92605b058b2..ae776c2dbe72d5c7f02ea2bbff11fec924f911a5 100644 GIT binary patch delta 96 zcmZ2sxyX_`pO=@50SFA&?%T-S#iA0WUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS xUr*ChzF>Xje&`gjhX2W3nSbAD)-6r*u*C5i^^_}7IEhQ0JORs AZvX%Q diff --git a/vllm/model_executor/layers/__pycache__/typical_acceptance_sampler.cpython-310.pyc b/vllm/model_executor/layers/__pycache__/typical_acceptance_sampler.cpython-310.pyc index 6c3ed2008614b7cd1aefa1df2b27ebc95a09bf33..93151545afe866485118316d2e5760d235c460ea 100644 GIT binary patch delta 69 zcmdmHvdM%ypO=@50SFA&?%T-yn?)r?za+OnzaX*D$wSKPNLu Xzo4=tBR_Am9xIOkW7KAA(cdfp1IZS+ delta 73 zcmdmFvdx4$pO=@50SGF$HEiVm&7zT@Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> blB!#fn4F!Mo?5(Fiw%h!8bE|Bh-d^6?LZ=mvlwVXNqlBXMHE+YMq*J) zd~s$~YEkEACcT@?QgtA8>>$D%L?nZVUJ%j0`KzHPE92D3ja%5z|2gSl8sq6D=edr%YaD;mkN?^E-=ZMxYKaD>I-_qtyZcZLLMW delta 238 zcmbPRwy=ylpO=@50SGF$HEiT=VAY7zFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` zN!2Y#OwLYBPc7cOo^^u?W7OsZtz2fqI-mhX^&mnPL^ObiHXsqjSzMA>R1%+=QW3>f zoRL_R5?`EIm0Hv>*-=<{v!LEFW~o|`T6Pd&4kD64L=TAQ+x*ecla+DGWNY&)j6IVD zEbJNkCkI$4OHBaDrhE QFQ_cZ$j{p>$oy3j0917py8r+H delta 66 zcmZp&YO~_b=jG*M0D{VG4I8=dF=-^|mlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtJKW&SD&0H*D$wSKPNLu azo4=tBR_Amh~NPQW*%0y&DRY-a038fuNZs) delta 75 zcmX?HeY~1GpO=@50SGF$HEiU5D4-FkUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> dlB!#fn4F!Mo?5(FK=6P9GZ!nz=F5g3xBIpO=@50SFA&?%T-C#HNv%uIh-SU0~?KFPz(^q+6@HiJ7n E07HWyqyPW_ diff --git a/vllm/model_executor/layers/fused_moe/__pycache__/moe_pallas.cpython-310.pyc b/vllm/model_executor/layers/fused_moe/__pycache__/moe_pallas.cpython-310.pyc index a09e6939c90caa1263f49d09f7073ddc4ae5cb3a..afcf2182b6c7e61dd265caa82037ce8f26f5eae1 100644 GIT binary patch delta 62 zcmX@XcZ82SpO=@50SFA&?%T+{i&Z5|za+OnzaX*D$wSKPNLu Qzo4=tBR_BRTh?es09wuz>;M1& delta 66 zcmX@YcY=>QpO=@50SGF$HEiVG#i|jdUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5C2KSz0Ik^-`~Uy| diff --git a/vllm/model_executor/layers/linear.py b/vllm/model_executor/layers/linear.py index 8ed74ef..789a77e 100644 --- a/vllm/model_executor/layers/linear.py +++ b/vllm/model_executor/layers/linear.py @@ -132,7 +132,7 @@ class UnquantizedLinearMethod(LinearMethodBase): layer: torch.nn.Module, x: torch.Tensor, bias: Optional[torch.Tensor] = None) -> torch.Tensor: - if (x.shape[0] == 16384 or x.shape[0] == 15360): + if (x.shape[0] == 8192 or x.shape[0] == 16384 or x.shape[0] == 15360): if bias is None: return x @ layer.weight.T else: diff --git a/vllm/model_executor/layers/mamba/__pycache__/__init__.cpython-310.pyc b/vllm/model_executor/layers/mamba/__pycache__/__init__.cpython-310.pyc index 888ccc9def7f7ce47820c63166a35c052297b7b1..bff33db5c3da07f304a07729f238a353a13cb81f 100644 GIT binary patch delta 59 zcmdnUxR#MSpO=@50SFA&?wiPMqY|KBl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEohz2>|}@6FdL_ delta 63 zcmZ3>xRH@NpO=@50SGF$HB98T(FoBmEiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNU|1OQAD6ifgB diff --git a/vllm/model_executor/layers/mamba/ops/__pycache__/__init__.cpython-310.pyc b/vllm/model_executor/layers/mamba/ops/__pycache__/__init__.cpython-310.pyc index a095ccb4437067b88b5a368360a0a8f180bff92c..db529d1875dfae4dfafefdd9e6141514567c69a7 100644 GIT binary patch delta 59 zcmdnWxRH@NpO=@50SFA&?wiPMqY|QDl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEohz4FCad6HEXA delta 63 zcmdnUxRsGRpO=@50SGF$HB98T(TLD5EiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNU|1^`a76kGrR diff --git a/vllm/model_executor/layers/mamba/ops/__pycache__/causal_conv1d.cpython-310.pyc b/vllm/model_executor/layers/mamba/ops/__pycache__/causal_conv1d.cpython-310.pyc index 5b34390aab89351d90e29dcff6392055b37d35b1..a8096759a1daf09e389e16f121dca1485fd45a16 100644 GIT binary patch delta 62 zcmaDTepj43pO=@50SFA&?%T+1#-*D$wSKPNLu Qzo4=tBR_952kRGB0C^%6H2?qr delta 66 zcmew%`bU&IpO=@50SGF$HEiU*%AygiUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(_h4l+70M2n1MF0Q* diff --git a/vllm/model_executor/layers/quantization/__pycache__/aqlm.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/aqlm.cpython-310.pyc index 970f5d328314ccfc27206294f2515b69de9baea1..97c6107c026605d390bb7393907871da52025489 100644 GIT binary patch delta 107 zcmdn$w%Cn3pO=@50SFA&?%T-i#;g*oUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUro DW$77Z delta 104 zcmZ4Nw$+V0pO=@50SGF$HEiT|W7Y`QFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` wN!2Y#OwLYBPc7bD%3R0E%*M#J`5Oy+)fmpO=@50SFA&?%T+{g;^y?za+OnzaX*D$wSKPNLu Qzo4=tBR_BRbLNwR09(QpU;qFB delta 66 zcmZ3Zy+NBhpO=@50SGF$HEiVG!mJUdUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5G4n}50ItOrZ~y=R diff --git a/vllm/model_executor/layers/quantization/__pycache__/awq_marlin.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/awq_marlin.cpython-310.pyc index 47ed177fabb2e22aa12a360e5307adbd08352608..bccc8e3f97e40f8c278b851d614667f6399ff07c 100644 GIT binary patch delta 62 zcmdlHu_b~#pO=@50SFA&?%T+{k4+^~za+OnzaX*D$wSKPNLu Qzo4=tBR_BRM>cm=0Cz(beE UlB!#fn4F!Mo?5*5Et|V40L(rXjQ{`u diff --git a/vllm/model_executor/layers/quantization/__pycache__/awq_triton.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/awq_triton.cpython-310.pyc index 7f1d394373f56050a56f36e0c20156721751f03c..35acfdbe64312e4b70095afa6fc0744a6bbc3880 100644 GIT binary patch delta 62 zcmaE8aMyr4pO=@50SFA&?%T+n&#n@wUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr@X&xepO=@50SGF$HEiV0XV-|;FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7a&kA1%Y0KO3xRsaA1 diff --git a/vllm/model_executor/layers/quantization/__pycache__/base_config.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/base_config.cpython-310.pyc index 0759d0c5b1596f31dbf25bec7de93239fa488c7c..39e0f44b233aeef83b6be43f05ea3086c49149a8 100644 GIT binary patch delta 62 zcmX@Adr+43Q&QCCLBd delta 457 zcmaFq^3jDmpO=@50SGF$HEiT|XVHk)FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` zN!2Y#OwLYBPc7bD#*!q+cx&@bQCCLBl+E(uvW#qLKy!-HCkF}%Zw{46WM<0-@pC5c zkq%}om@FV8#aK33TP9loq6{PlRj^EEB3A~Ge+Gz)izYkD#&Yp6G5zCVX8Oy)vU!PY z8KY4yNO>NJ$OjRHAVL~W$beYIKth!f$S46as_Z8(5RjUDPL^%*dIj#ute_wv)ed6%g9tR=WKQ-~*eII{l!;;sNzE(H aFDhaMDa!&8puj51oE*n4zS&68oDl$ySY{Le diff --git a/vllm/model_executor/layers/quantization/__pycache__/deepspeedfp.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/deepspeedfp.cpython-310.pyc index 6213ec26a10933151f67ad788ed98b39834cbd0f..a31daaabac1663c2dd2b97198b2f19bbc66625db 100644 GIT binary patch delta 62 zcmZ2twZMuypO=@50SFA&?%T*+$f6RZUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr{!&&$ij00f3>_ig0nV^)dQFUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E QFQ_cZ$j{sC$b3N<05HW9?f?J) delta 66 zcmeCxo2bW~&&$ij00foW8a8tCF>A!@mlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtIvWxgN`0DyE9{r~^~ diff --git a/vllm/model_executor/layers/quantization/__pycache__/fbgemm_fp8.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/fbgemm_fp8.cpython-310.pyc index ac659f7f26e7c9988900537c3818f5cf79c4d893..54b49c92cbc879247371dc318f49a51bc8ffd248 100644 GIT binary patch delta 62 zcmcboeM_4=pO=@50SFA&?%T*+&7u;iUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrb%FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7cOip4+>0J_K($^ZZW diff --git a/vllm/model_executor/layers/quantization/__pycache__/fp8.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/fp8.cpython-310.pyc index e60b9d0eb0cf80e73c06ee14a264a9416e3c107f..69d150f8ac359a52060ffbe04b77de2470ad3b8b 100644 GIT binary patch delta 78 zcmdm;xHXYGpO=@50SFA&?%T+HhD{|%za+OnzaX*D$wSKPNLu hzo4=tBR_BRf3|%Jj1MO7Q}<`#Vq{|6EUdAD0{{x^8gc*t delta 84 zcmdm*xI2+MpO=@50SGF$HEiTQ!=@3YUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> nlB!#fn4F!Mo?5*5H`_i1#z&KPsr$2WFf#pTV%p5Bv4R5ttoR&! diff --git a/vllm/model_executor/layers/quantization/__pycache__/gguf.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/gguf.cpython-310.pyc index 63e78320cb8a18ce40e6fcccd1e4801f178503ec..72e41daef76b3b8f8619d4694f92ae164d3bfb17 100644 GIT binary patch delta 62 zcmexp_|}j+pO=@50SFA&?%T*M&8!lvUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr*D$wSKPNLu hzo4=tBR_95BkL7@#!Zv2iD nlB!#fn4F!Mo?5*5FUu8v#x0XCiD@PS=9sn5C7wZ53 delta 98 zcmaEy_%e|@pO=@50SGF$HEiULW7CM!FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` vN!2Y#OwLYBPc7cu%eI6|N&%=-fSHRC0y&si7$un57@7XFFm3h}oFxwc#H<FB>ZdGaDn*e)D(I7#~djEauF{ O2NYpp+H57R%LV{b%FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7bD#j;8e0GALIdH?_b diff --git a/vllm/model_executor/layers/quantization/__pycache__/kv_cache.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/kv_cache.cpython-310.pyc index e9a9e8377f2f116ede5e6f28315b04cc290ae323..44e5b4106e4e3c76336208752489270b4e7240ab 100644 GIT binary patch delta 78 zcmZ23vQUIOpO=@50SFA&?%T*M&8!lxUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS gUr*D$wSKPNLu hzo4=tBR_Am6sv{+h delta 84 zcmbPfHs6dppO=@50SGF$HEiU5&Y}^iUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> nlB!#fn4F!Mo?5(Fj8#K`@yKL*QD-(jMyCHPOq<(8C$j$KF07e58Z2$lO delta 66 zcmZ2uu)%;kpO=@50SGF$HEiV8W6_A#FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7aY%W_^A0GBQmeE*D$wSKPNLu Qzo4=tBR_BR8D>Qe0BU>`)Bpeg delta 66 zcmaDU{#KkjpO=@50SGF$HEiUb$*d8tUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*51hXOs0KR_}c diff --git a/vllm/model_executor/layers/quantization/__pycache__/schema.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/schema.cpython-310.pyc index b0cf65f2daa3d970429b8ce3fe0c96372beea51c..e1ee39ce62e7c5b9cbbf30372990eeefd85891e2 100644 GIT binary patch delta 62 zcmZ1_xlEEfpO=@50SFA&?%T-S%%T#iUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrb$FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7cOiRBAB0GY}b1ONa4 diff --git a/vllm/model_executor/layers/quantization/__pycache__/tpu_int8.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/tpu_int8.cpython-310.pyc index 39b843465700f009e44a9b3526bc4365786adcb3..470be3208b864b21fc3a97c74fc6e9e3e1436271 100644 GIT binary patch delta 192 zcmaE@{#>0qpO=@50SFA&?%T+%z^oFkUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUrjVJyu2b- VkVM4fi>$(v4+yhtt`;g_1OWcZHWL5< delta 149 zcmaE^{#u3QiULQtA-^q6TGTeSZV~Tu0g!kl!?82KX_|G#k`cL){ oG-L||i3Uxs7nB4F%oN-#;tLW801~&D^74vULA>zI2}13R02@mxX8-^I diff --git a/vllm/model_executor/layers/quantization/__pycache__/w8a16.cpython-310.pyc b/vllm/model_executor/layers/quantization/__pycache__/w8a16.cpython-310.pyc index cc44e16af4cae0b2732c873a92042ba1c07da477..9a134f3a804bebfb9aae757aa318493f79598283 100644 GIT binary patch delta 62 zcmZ23zgV6-pO=@50SFA&?%T+{he;(wza+OnzaX*D$wSKPNLu Qzo4=tBR_BRd!`*c08>>JFaQ7m delta 66 zcmZ21zg(U>pO=@50SGF$HEiVG!=w?RUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5HPa3r0HxFxKmY&$ diff --git a/vllm/model_executor/layers/quantization/compressed_tensors/__pycache__/__init__.cpython-310.pyc b/vllm/model_executor/layers/quantization/compressed_tensors/__pycache__/__init__.cpython-310.pyc index 6452a2063e1a5d581157af175a33091acb32f81b..a5510838be166de8d784807ca728a2da036e2035 100644 GIT binary patch delta 59 zcmX@jc$|?tpO=@50SFA&?wiPMqmrdxl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEof-1^^D$6QlqD delta 63 zcmX@kc$$$rpO=@50SGF$HB98T(a6&;EiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNSi0{~qj6tn;U diff --git a/vllm/model_executor/layers/quantization/compressed_tensors/__pycache__/compressed_tensors.cpython-310.pyc b/vllm/model_executor/layers/quantization/compressed_tensors/__pycache__/compressed_tensors.cpython-310.pyc index d9325ccef2fa085adcbacb0c00249f62961eb4b7..db6f166eabf1cb1d0e99f12352b4bf585ec18f17 100644 GIT binary patch delta 94 zcmZoq{GY&`&&$ij00f3>_ig01VN)s5FUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E qFQ_cZ$j{rH&*mW_l?Bwr!^+3V#mL0S0)}jV`B*@_%~z#1i2?vFYZ&|h delta 102 zcmeyL(4NSh&&$ij00foW8a8s} xr0NzVCTAz6rxtI{X7dn{%LD4*D$wSKPNLu zzo4=tBR_95FY_^02_>K|HWnU6CPudZJWL>xkC_k1+x(VeCZCQPSXPLcgOP`ki;)8e knHX9AvoW&)NiHT9peT^f$nuxvf0f4MLM?^OSH!tQ0cO7<>i_@% delta 132 zcmcZ>c`uSXpO=@50SGF$HEiU*#iUWAUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?5(_lld5{lnPKM8w(F36C>My9wrdU#|-5CXJXp?oMR>*qsHV$acLnA dCZ>NZAaO<(MwY)Uf2%YmE6OTtJ|oU03II0}Bvt?b diff --git a/vllm/model_executor/layers/quantization/compressed_tensors/__pycache__/utils.cpython-310.pyc b/vllm/model_executor/layers/quantization/compressed_tensors/__pycache__/utils.cpython-310.pyc index 1e28ce3ff13c4872ff78d4f69ac525deb5a39227..408ed02015aa62fbc58b68a9767c716eefffb319 100644 GIT binary patch delta 466 zcmY+ByG{Z@6ozNn`;7&b%W_9W1r6CySyS2B*iB)gIm0E{kqud+Hd44R;9J<(NMq$A z*x48pYv01dLI_SX=Y0SFpEJpP4}J#r)V2+Rr~mRketWVza{&mXf)p32C=jg0K;kl$ zxk44LQk82|<2uz7O$rQdQj=TM;x@GtCI@NmP$#LCAj7jXE09wHDrhkQjfsyU&0(*D zfxW?8BofUdF~N$-9IQ1eAhIEiru3Q=kvNb+l3^x}DM6OGkYnCZ0vGbJM9WZM8gt78 zicC%JrK&&)JX9;Fx={Y7RG^AVb(5Rdn6qVZhZ@wOftH%ygd=Ee4cK8GE>G5>YZvxn znbx75JZVKG*oOnmHa6KqR986ExZ0x2mLCzqA86koN6&m*idZ)!oxxcPBZ6x|Noye$^10Go6f*-EP`k9@z{NPaq3e71Y|A=naa|pUeq>Ph5+fB|Miz-02XLetnMz{1{Q zJ`$B?kR-v5$Q0})$|7>WMU%TEIV36Yka*0(F?mQcAAA;cRLDR!QfUEl%wT?zK%VLG zJy&%Ipnz%-RUeA~loFItDXntT3Uk*ie#e9=Y@nr_sKFs@t_|2?0WOc%p=%p9)%)SY=sx6wc8iC+cM}dL jBByO#a{A_if~kWl?F>FUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E QFQ_cZ$j{q6fu)ce098yBlmGw# delta 66 zcmew>->ATy&&$ij00foW8a8srvS@VbmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtJSVJYMW0I2O1qyPW_ diff --git a/vllm/model_executor/layers/quantization/compressed_tensors/schemes/__pycache__/compressed_tensors_w8a16_fp8.cpython-310.pyc b/vllm/model_executor/layers/quantization/compressed_tensors/schemes/__pycache__/compressed_tensors_w8a16_fp8.cpython-310.pyc index 2f1b90c2e39dc64f6e9abe987e6ce73fbd8fc3b5..a286914bd5f52b5d09ca0a94cc30955de7665600 100644 GIT binary patch delta 62 zcmew){Z5)YpO=@50SFA&?%T-yo=K%mza+OnzaX*D$wSKPNLu Qzo4=tBR_Am67vNv0D|@vZ2$lO delta 66 zcmaDS{YjcTpO=@50SGF$HEiU5&!o|%Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(Fj`;!?0NFtneEd)A+v08`2skpKVy diff --git a/vllm/model_executor/layers/quantization/compressed_tensors/schemes/__pycache__/compressed_tensors_wNa16.cpython-310.pyc b/vllm/model_executor/layers/quantization/compressed_tensors/schemes/__pycache__/compressed_tensors_wNa16.cpython-310.pyc index 7fea9854ab034e1c39f835bff88a964c08e07431..c84fb933bbbb38959b65f73bf6f3016e574438d9 100644 GIT binary patch delta 62 zcmbQOJYAVPpO=@50SFA&?%T+n!>ZDxUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrpO=@50SGF$HEiTgVA9CcFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7cu&!oc%0G&1!DgXcg diff --git a/vllm/model_executor/layers/quantization/kernels/__pycache__/__init__.cpython-310.pyc b/vllm/model_executor/layers/quantization/kernels/__pycache__/__init__.cpython-310.pyc index 72e7450d3dcb93f1b94311f5fe7ac4042f2f1783..f2827fc5e6677dbd06aec539d64f8d8ab686ef21 100644 GIT binary patch delta 62 zcmbOz)GNfD&&$ij00f3>_ig09%%&2rUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr*D$wSKPNLu zzo4=tBR_BRKc;qOE)}3IHf9k<7RJpJ*;cSB$$ zlB!#fn4F!Mo?5*57gIYkj~Y-X8?z82(|;DG&E0G(Sf%7ZB8+TIe2fB&96)hCW+5g4 NAT7YO*_+3e1pu2D9b*6h diff --git a/vllm/model_executor/layers/quantization/kernels/__pycache__/marlin.cpython-310.pyc b/vllm/model_executor/layers/quantization/kernels/__pycache__/marlin.cpython-310.pyc index 478759a6a96db93ad2df87f33cd0cfb6210f90e5..b226a8ec60cbb29e3caf55429c966c36b270e5ae 100644 GIT binary patch delta 62 zcmeyW@KJ#~pO=@50SFA&?%T-C!>kgkUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrJTUz}Nz Rs#}nloSm4ST0HS~AOK?C6-WR8 diff --git a/vllm/model_executor/layers/quantization/utils/__pycache__/layer_utils.cpython-310.pyc b/vllm/model_executor/layers/quantization/utils/__pycache__/layer_utils.cpython-310.pyc index 9c7dfc0ee9f7874c2997fec9ded5f1052e3803f9..7a710e9dd5ad6ec6d584db3cec9f3c111e88e07c 100644 GIT binary patch delta 79 zcmbQqF`0uqpO=@50SFA&?%T+nUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS gUrp diff --git a/vllm/model_executor/layers/quantization/utils/__pycache__/machete_utils.cpython-310.pyc b/vllm/model_executor/layers/quantization/utils/__pycache__/machete_utils.cpython-310.pyc index 9ec857a38016271e8275b0285f05cba73705a3dd..1d2369644c0f6fd34c8249000cd44b518955cfb1 100644 GIT binary patch delta 62 zcmaFBd54obpO=@50SFA&?%T-S&Zv^4Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr)gpO=@50SGF$HEiUTX4Od5FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` rN!2Y#OwLYBPc7c;#VW%tz{SY)pNWZsk%^J*Kg)lPf1AsAz6%2Y#ylIp diff --git a/vllm/model_executor/layers/quantization/utils/__pycache__/marlin_utils_fp8.cpython-310.pyc b/vllm/model_executor/layers/quantization/utils/__pycache__/marlin_utils_fp8.cpython-310.pyc index cc9b2e80dd3bc6c16b0ebe3cb7f3526f5a532839..fbd93ab7ac0b44e997b0e74c24dc6e490924118f 100644 GIT binary patch delta 62 zcmeAaYZc?p=jG*M00P6c`!;fKW>iVlFUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E QFQ_cZ$j{sSj8T~r06>2fM*si- delta 66 zcmZn_>lEY8=jG*M0D{VG4I8;PGiqe&mlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtI1#Hh>(0FmMqR{#J2 diff --git a/vllm/model_executor/layers/quantization/utils/__pycache__/marlin_utils_test.cpython-310.pyc b/vllm/model_executor/layers/quantization/utils/__pycache__/marlin_utils_test.cpython-310.pyc index f8cb1bc3d0f0990ccfb201328b86d3ce8a51b9ee..c5929a46f3e0499b299431f8303efb1f1708bb5f 100644 GIT binary patch delta 62 zcmX@9a8!XipO=@50SFA&?%T-i$*hv5Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr*D$wSKPNLu Qzo4=tBR_BRE9OoW0Fc@iAOHXW delta 66 zcmaDK@Hv1xpO=@50SGF$HEiVG&a9EEUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*58FQx!0Oy4lFaQ7m diff --git a/vllm/model_executor/layers/quantization/utils/__pycache__/marlin_utils_test_qqq.cpython-310.pyc b/vllm/model_executor/layers/quantization/utils/__pycache__/marlin_utils_test_qqq.cpython-310.pyc index 119fea028c553a5b73710e09306516ffdc135baa..3bf1f4bcc32e5cc9282821d9a203376ea4e07eb5 100644 GIT binary patch delta 70 zcmZ1{y-J!ppO=@50SFA&?%T+Hl}RN_za+OnzaX*D$wSKPNLu Zzo4=tBR_952lHNLrab=5$Jw5<0RRZu7iRzf delta 74 zcmZ1_y-u1tpO=@50SGF$HEiU*%A}E}Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> clB!#fn4F!Mo?5(_g?TSCQ(^t)!)(vl0B2Dc<^TWy diff --git a/vllm/model_executor/layers/quantization/utils/__pycache__/quant_utils.cpython-310.pyc b/vllm/model_executor/layers/quantization/utils/__pycache__/quant_utils.cpython-310.pyc index 076fe518375830e5a348ccfbf689932a65646592..53790651171c5ed02d263d3890256f6464823141 100644 GIT binary patch delta 86 zcmbQ`J;j?lpO=@50SFA&?%T+n$D)#;Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS pUr8PWg% delta 118 zcmbQ@J^jV2JpO=@50SGF$HEiV8W7bI4FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` mN!2Y#OwLYBPc7aY%dE=Dm^QhY$DNIfk?B7V)8=zL^H~5~!x~or diff --git a/vllm/model_executor/model_loader/__pycache__/__init__.cpython-310.pyc b/vllm/model_executor/model_loader/__pycache__/__init__.cpython-310.pyc index 3a5a9b42154e36a30e60f893b454092a568a772a..93f94a4a5f99f3a5ebb4dbee7bd5f6de26f8060d 100644 GIT binary patch delta 62 zcmaFFagT#LpO=@50SFA&?%T+{ib*9vza+OnzaX*D$wSKPNLu Qzo4=tBR_BRU8Yt>0AMy15&!@I delta 66 zcmcb|@rZ*vpO=@50SGF$HEiTw#iS9UUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5CQ~aT0JD7-A^-pY diff --git a/vllm/model_executor/model_loader/__pycache__/loader.cpython-310.pyc b/vllm/model_executor/model_loader/__pycache__/loader.cpython-310.pyc index 82e3897b88b6f1d0b59f63a321f2f3148c6e2f52..50280b702ca75fa6b87e462e56d73603722ca724 100644 GIT binary patch delta 160 zcmccF&UCSzi94T{mx}=i4A<`4$ZgD};-_DdTcBT%S)f~zSd^YxqHCU8nvrXmTdtpz znWSG(S(1^Tw>ga~SC}b}ar0H#S;~BQ+%-Hk9N7#-WsD4Ytea~c{R9Q%fF|-VvavET zvM{pzXJeXtH)tAA!{pLnGmyTu!MFJsT_$%XS+cPF=VID?BB_fFBp#Caod-nwmi6!g E06ar5wEzGB delta 168 zcmccE&UCY#i94T{mx}=iDz`OkEFQ_cZ$j>v@Gc?dI z&MZmQEl5nxPE1cN-kijhE6h~bz4@Z-EM>mJ>KdLJj%dlpoeu6>@KvQ`b z*;ttvSs0oAGyP{{o_sxM8dIVCtO}3Y%TadUyeHnl@7a diff --git a/vllm/model_executor/model_loader/__pycache__/neuron.cpython-310.pyc b/vllm/model_executor/model_loader/__pycache__/neuron.cpython-310.pyc index c6314a97c84174fe95f53a46dccd521bdeab2d4a..4d66454ab4e12be7b9d1b06726ea9592a9418deb 100644 GIT binary patch delta 62 zcmexp_120zpO=@50SFA&?%T-ylvTw~za+OnzaX*D$wSKPNLu Qzo4=tBR_Am1Y4vy0EN{Q`2YX_ delta 66 zcmaEB_0ftupO=@50SGF$HEiU5%Bm5hUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(Fge_7W0NfN72><{9 diff --git a/vllm/model_executor/model_loader/__pycache__/openvino.cpython-310.pyc b/vllm/model_executor/model_loader/__pycache__/openvino.cpython-310.pyc index d2e597f798b98432bc2258974860043039f453ab..f256d7f1734bf7e055f35a72e328490d876bbe28 100644 GIT binary patch delta 86 zcmdmCu*rZspO=@50SFA&?%T+{n^`45za+OnzaX*D$wSKPNLu ozo4=tBR_BRJ7!i^AwHlkHU=g}4n{6UrvEJe*%&voa~kpk0Br*o{{R30 delta 92 zcmdmFu)}~mpO=@50SGF$HEiVG&8!ikUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> ulB!#fn4F!Mo?5*56*DWVhyYM08v_#~8za*{E@q~`ER1abH#2e?@&f=8CmIU? diff --git a/vllm/model_executor/model_loader/__pycache__/tensorizer.cpython-310.pyc b/vllm/model_executor/model_loader/__pycache__/tensorizer.cpython-310.pyc index 3bd15bbc7d68017d1b29b367f0b12b8611cade97..8993fb11f841fad4f86863c079edfeb70d2851ab 100644 GIT binary patch delta 702 zcmYk4OHWf_5Qe|+aC(K-wm>iRCbX0msHI9R;tdsp3s=TS97v32PPzCEG))B|nl8%T zVEqN`ttKZfb>Uk701FfUg)4E+rwh+w&NJ`4Gw)fPZ+qYO0=t2LU+`0X|7G*!IB>7v zLV;4b!Od?&N%DY43g!XjB_H@So9ehT+My7HbSqUD!fbJ=FhwAuHMbh35g7S5AEhWn zHG5Qy;t;0tL5{g2Fre}@36tDN zC>&1lCj`|L6`@EaDA6=b(+te$wR38g%23uEQWvNK6`F%NszQ~uFh-694lj$YTsPn% zTv`=7QBzp+2cM*XniPkA>#|kra>}ZB?4;G!YMmX|U)Y!XVng7_iG;e9wHDZR#qz8O z9K|S~jdl%I7BOZmV%&;sUu~F}z_B9}u4z{iQ|wA<*LB`XV}|=o*MJ+C#T4%hSwW5u zZ{KVf2@Xfu7)XdlFJO3AmN14Q6PV+pw=wU8{1@lONi6W>j&BNQv1ldrti(HR zoW_|W7cATB#xI$FP-#=M(%fp6+fQ2?R=ZrM7n@Y2{fgRpR%srzH+OgJSLP$nkYAe8 zklr)%w<+x(gU{ok4F5yH0l#!6=9$;9*Yb^!Jnem*e=Ym=QjHAR@Ad1&!4GU~-FM2z w-p~5Gyvgd#D6!Fq|F5EDaKf)bXYj4rr148zjdE=F(^MkU9^7*?Qy9(Z^>4&x*y zc*lvtlk-Z0EvqmA7nYRmw5IrzN1vDiRi@NUf6A{mXw8yxKU`ORP~DFFy${);vaayX zw+t@&jz3MV8DC#ec#5ZKYPzA4GRrgmEYJFht+_Rgck$eb2A6!jLbh(6CtF_HE>m9M z4&_cmg)6*==c&o^ZCW4Sy82R0EnMRno+j}+&FSX@H0K5{hI9Yhpz}dKM3tMZB|gf_ zeooe0>e2ZyA32G@t>&`&i@Eo_$9pwT?5wT`Pi#K)c8~TqcD5%g6XV|A=Dt6+yR!Od zW!>NNf-|SD`9`ZoV+K>tHC1KCxp7u^gQsSp`P*8|cJ$J>inW-`WEwftbEBnsx40H( z5PYdVVW-WxDOA~M@NT+ny(epJF$^DqAJeZ29|>J{$DOa$LlMJJ3&R10W-t>|t*D$wSKPNLu lzo4=tBR_AmJkx1L0Y0EEJ|+%kE*36E4n{V{&HtF=838^E7eoL6 delta 92 zcmcc0b(f1fpO=@50SGF$HEiU5!>AFcUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> ulB!#fn4F!Mo?5(Fn&~v7h!9XG9}@>N7Yhd?(|`5IIJ diff --git a/vllm/model_executor/model_loader/__pycache__/weight_utils.cpython-310.pyc b/vllm/model_executor/model_loader/__pycache__/weight_utils.cpython-310.pyc index ccaa569aa708400c35c828f161e9411097257e22..a2a2667be164d90be245841a983671584ed21604 100644 GIT binary patch delta 520 zcmY+A&ubG=5XaxV{h7_?S1E}-q`G3atZrCh#exV5D(FE$8if|5qO|qNz#nAA! z2dkh$4*H-Mscb+HD;{L=;z9HxdhrkNpr;DnJd03Yyg9?bFwA`Ue&+WMY(0gvpGp}> zMETXbx>J9h&S*y}9&H6)&j4ErP)@u-YU0xUbC^}1sk;Px8n=i7x_>g5Ta-m z7$QJ0kp@zTiOleAw3cO}<7KmOP$B3Zocngp5S3SzD8bYrtZ&y)s8NGSL}jvxXp(3HS>T)vbpdZOo#;d&iGjqk z_O%JWC*VdoFN$f=I5Ym?UgVqhF?hsx?IJ|{lRX1(`5*hz^!NYv4T_=yOAg^CzAo-N zA4pQbXZm;f`=fUJczO;CvLB9vA>di}cy2Pp!huf^Q*;VM_!)@th(La!185vW8OY9KQA9lEu)d)>7#zKhDj zhgbv$K@fEVU-HSg5cH-m_U0cD;$M(ruf44AI)?)v&Vlp!v9<$$x52E(Vo@S$_50hU z%f)Y|rQMiuR~pN1wO%Y#-D-Kk^;UzWdTr$P-8*ih9F+22q4>P8SZaj#wG(+T4uk}x z0-P{lv_+egNu0hU%N7?1T_ZUpGxCuRkOyQ=Ybum zS*`|~_$QH7X_t0Q2?vvx)K7(d*PKXSju5GPQ(ukYcxGaSx2t_-KxNr7{n7R5yR=|Jt3kl*WBF` zNsqt}q?t!>hGQ8U4#P_39Tg&fXS0;n2!2l4IDIp2*-a`aRFRj=6hSeYv-_{Vk;G1K ZM>>MSPcl^`py8+70$$|y#1G7S&OdmWefa None: - loaded = torch.load(pt_filename, map_location="cpu") + loaded = torch.load(pt_filename, map_location="cpu", weights_only=True) if "state_dict" in loaded: loaded = loaded["state_dict"] shared = _shared_pointers(loaded) @@ -373,7 +373,7 @@ def np_cache_weights_iterator( disable=not enable_tqdm, bar_format=_BAR_FORMAT, ): - state = torch.load(bin_file, map_location="cpu") + state = torch.load(bin_file, map_location="cpu", weights_only=True) for name, param in state.items(): param_path = os.path.join(np_folder, name) with open(param_path, "wb") as f: @@ -422,7 +422,7 @@ def pt_weights_iterator( disable=not enable_tqdm, bar_format=_BAR_FORMAT, ): - state = torch.load(bin_file, map_location="cpu") + state = torch.load(bin_file, map_location="cpu", weights_only=True) for name, param in state.items(): yield name, param del state diff --git a/vllm/model_executor/models/__pycache__/__init__.cpython-310.pyc b/vllm/model_executor/models/__pycache__/__init__.cpython-310.pyc index 5ef0ec36f4ca51a5b5d5c333573c6e9b5ae4fc91..d17d8c800ccd8a5607c0faddce4393cc54246270 100644 GIT binary patch delta 61 zcmdnMx`vfIpO=@50SFA&?%T+1&7|U`Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS PUrz delta 65 zcmZ3(x`CBDpO=@50SGF$HEiUzX43G}FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` TN!2Y#OwLYBPc5FD#pDD4YiJa3 diff --git a/vllm/model_executor/models/__pycache__/arctic.cpython-310.pyc b/vllm/model_executor/models/__pycache__/arctic.cpython-310.pyc index 7eac1099b60eea1283578247f57ba917a3e06c97..3dd3e7cba6d2c1da99dc0c987a5d381ed043fc13 100644 GIT binary patch delta 772 zcmaKqO-NKx6vyYh8OM3^<^u|w3`R$N%`navW1+cHNTWpw6>Y*2V+KE%k2kLwBe<`k zX;+|j%xo}nOv}Vk>}dsoK@bEjT)Al4RNztwp`AqcBte997eCJZpZ_`M-pgH4<`pSz zw_6Q-MN4bT(o&^-GLlUy5oJILWqZ}WcsA6M%=IUu$*YmXz~zW?E!&??>E9|Bs-Ub7 zySs#1RY8xrf2)77xgxiGY*zAqNL!9)cVFGQwPMFZo z`ZmEn!L#LxWI7g4sE@J3AA~8)_|Kc3avg8V2k?u3uxjs)J&kR3i`?d~{NLQSjRn^- z9bt*Ard?|%2`i`sF2O3U2U_>N_$#@(n>-ZEz;*p@FbMX!Zb1_@D-${l7sL2Ibm2zo z3N!MJ+-=k(&8FFzjfq2`Ze%_(aZ2PnsmM#R5)+vrFQ{L+Zee1zL31$2piOf!Cvz|> zv*(Rq07L2&Gx2V|f4c2tw)g5b0;*BWY~yU$<4x6bhc&jp2we5@X_leiQD*GVY_5m& zt#GSgF4Dc`F&K@(YaET9g9Y4-Zd94TAy_~F8(29lVCInt*PGm&TTREL2UONU?{g4~ zUKu}oocPIGE!UI&l2Ai`fE#Zfj#4mv%*7E=W delta 744 zcmaKpUr1AN6vub&w(IWh_L4JSw5?p~baQT#%%=&pp2{AimuZdVh7GT7_ihTp9Yhlf zqFNnovqHE2m$Mpo859K4W4_jdfe%S8V~UgV4;fs75+wgI;S%8qVTSM& z{jG5*VzD&|1vIsVpr8%3eFJNORo9K<$yi)c7O>ythD98AoqTSJu4Q0hDfHT>Awx3BtFv9?>>@0MXkyW)0(b!nK(3R$zt z9oL=p;;JXylLtAd>REVrSf3TMmaJ8^sKOK|pXD`GC9Xx%lQo;AV(r=5M(fR-Y diff --git a/vllm/model_executor/models/__pycache__/baichuan.cpython-310.pyc b/vllm/model_executor/models/__pycache__/baichuan.cpython-310.pyc index 7318751ec25db4ef7d067de7a72da4bcfa4d639b..b43274eb98f896016456dfc377611de768f2b3b0 100644 GIT binary patch delta 725 zcmaiyO=uHQ6oq}GiI6l}V$;db)JaH4GPEUT6}l)Yn1cUyTe^uRZ30bZ7?Z{}X_dDA zgVkJ#X={-pSgW=mvs17sbn9N@Mi*|SOP9VgQE(wRi;u&(=W_3RZ?;F?kJwd*!?urq z@y!o!?aS8CnOHHe#k8E(Urg!anPPt;U&`j=`EqO`cR8j_6|-u=_-Ji*u$J-Q$ai*Z ziZ|<%z%)?iP^@|q`U;Q+GQb#6p*5dqymPGyY?emdTIY4RR{=9wp}nJBwCA2-*Qnq* zYoA4B2)JSFdM+?Wg=UmZvwaIl27ctjkLYJ&Ry8%PWPb9 zb?!s`9$fR4*$mkvl~rk4O0ufal#+r}Lu3%BaevG;%&;o|Luc2qPl-UtYgY!^c-mSn5#A@9!Rq#ss{#~PyQ+{A>A;( z1$voKkm*qHqVpjvhRlBbB=jRvgIP95pMrzpDvS~!A<@wu@s#>PlWf&^9vWrdWmG-D z3LpR$;02xQ?qQ3R2$wjUwl3NUKjX(wMe3YCBj?#V4Mm691~sAzCr{YS9}Uef>1%Yr z4EIn%@jG8}lfUV4)J_1eDW@c@>yU3~xZ8bri_2Yp4t*2emhnaTA#~zB^hIF9bm?>7 F*e`>}xk&&3 delta 721 zcmaix%}*0y5XPO=E(zPlQfd0NwQWkuZWJnMV!{CxW4)Nvc+*BDYg?dprFFM0v;`5w zFAmjqlp>P!B!Y_3Y+_6_%0Um_H5#Hvul^0bQ!w#h;vRmP_nGINnVt7d{C!-=S}g55 z*jIXW^`)@HOR;c4*TQNxp{QXseIcAH0)oVLhEs_2iU9Mj1)z#wUKm3~^(A z&rh&UumW0vP$Cp@+U|q0(X_wjUx3ksjNhC!7{`mQ6T%b;#|hKMhARe^ zGK*#IkJ00CpP6OKrb$!AMpD`}a?TO1GsMkleMnXG{1D4#w7sO?V2}kZO7Sg1f^eHK zOqeHZk5ToE!zA)z7Aja2qfjy4icwCik!65TVc0ZX$|h5)<|bhVy}oXk#i*~3zsUrd z$3UkWYB<>Gz~{c0{huwd!+$JPCwtrf2E(S^fp!0!<36=Ry0dHRPHW}{_5_l!i1k3f zZQ-xvBDovJkH9|QE>B>4@TBbyNkE>R+91VuF%ukx8T=d^a4eIMCy3-QZ?$-cQdbd{ zjb_(ba6h1|i?BrC2qwZKJm2AkDn>#D#zSo)ehf9(3eI&eY%fBP4#El^l}^Db-jig; zcaj$#<9DgQv}dHP8(-yL RoR!{1s}fdQDt_5N{2L!dxq1Kq diff --git a/vllm/model_executor/models/__pycache__/bart.cpython-310.pyc b/vllm/model_executor/models/__pycache__/bart.cpython-310.pyc index 4c44deb85ac74bcd372ab008719bc8d23183a52e..363f805070215d477f8ba0b47d44006e6245eb95 100644 GIT binary patch delta 100 zcmbQWlySmRM(%uGUM>b8FkHKDBX=^3ikp5(Zh?M5W`S-=Vo`c(iLQBWX-2MLZn=I= yW|DqEWl2VU-sWj6Up(XrfV%jYco;dDSeRHCd6>AE_<(EA~A delta 110 zcmbQRlyTNlM(%uGUM>b8sNB}Dkvo}1!%M%kxJW-IKRGc+KPNLuzo4=tBR|hr&(J`> zII|>Gw;(Y&J25@Ac=IHdFCHpoK%IO{Jd7MnEKDqnJWO0nd_XoEBh!C2CZ>OE%uIi| LST-;5eZv9(=G+~l diff --git a/vllm/model_executor/models/__pycache__/blip.cpython-310.pyc b/vllm/model_executor/models/__pycache__/blip.cpython-310.pyc index d540977c33bccb288f3dd6346baa7772172a16b9..f27531a72967d9867906554bc920c72efae95695 100644 GIT binary patch delta 470 zcmX|-O)ErE7{@)=yyTk6gd{I9=FLshM2dwSSy3n@B?gxnb7$`D%<&p!=XIER!eB^E zS*Tg)ZmcY9d;o0jQno&U#CaMyi(k+Aopb)3{&{IvN8BRpwD zjJOfzQMRb^a8GhMmh4QfMzr{B#8~GsJ!Q7q^*XT3Y~u!a4#Z=&OUMuo&4%U&39|Uo za_2cFgM?v17Bj6G_lX!48yg~XiXm?ij_}PJ5S;PUVpUrKj?rxU5X|`&Ub9>IelJbR=K987{!#b6EqDH_6P%neH`-#M8ul^x%yNHrJPNXzaZqz(SQO{stPxQ z{l06VCLM`sgXv2aB*e{6fobP!01&@%4!vFvP delta 456 zcmZ1wu`Gf+pO=@50SGF$HEiU5%c9|>Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?5(FhBaS|F=}&=Ad#t)l@-@A_D;U2s0t)^%gRm`QJTfrH+j9%6CgQ7IgPPx z@^58Dqh6rmTkNTM$@wX%MYou9QuB&H#z4%@2C>{gL({Zv$eMwF-=7n%wb z&}1%(1&PlD5wkb@s%kPa6{b(FP;*wE3lxfC%Z@K7%FnvRm6vsWQ{8V-rL0J&i#YKr_A!NZpl5rFfL^4gFW_r3U@=Kw8d0AATOjAh< zQ0HiB(@QHu#ZZ4yKFh~w_>ZGzWxur4F*9ehnx>g%>W}XCu9d^IGyB=I-}Ct0bMN`x zo(|g8LDo=QT06yUhAEhjEcNSAeJA=lSbv^TN%M z1)-pkt~JDxX|%`NXjD)piz*-_v16d9hW#`UF^(kkShN>lFJ+N3@zdE6lZizaVw?k4BRae>~$s?TT?}9EFz#Lv5jOZeu z*VX$Xx_4odE}F$k-fPdIHp8?(NuypwmIHW3!flOKcoo7cT;&+6t%kXVTO7q&C(LDh z(9uiFIGk1$w^Rx{21O5G8J|f@u`xnatN-=8p8ra#p11)XH0ZX7cGw-jMxbB(TB#M1 z)L)ZEOE$-k&fs06AJo<(b}g5<9JGp4oE5an@HxwAM4QyzBv#?aVp_&|L>nJSzd)~Z z=a@?Bp#gTxysQ4C-x#9L6cdj@DO)K2z}W!l6OTrS$o_Kfk8KBt5I8Mn2U zkrBt9F^Ln^_(f+RELC%;-`A{*U`Pb|55Z=*2kXIkp*mfNx4HYi!@2LE&>*o+{)l%0 zH7@T#y}O|Iq2684#>_t2#&cbHlAW#^+RoQplc_*3^n}?;{V-ET1hBRfr7R&)LjAI8Ot~5^{8^VfUND)5aJ14x(=UwIG?+ z8AHccSmZub6=u>oUQ+0!^Sq^SKb_#}31yO-CR`qV0#&|7#k+UXMWd}KiOT*xNcUi& zV!lD(NeNTamxO)6y6703g8Vu1W1=fEA$$d#G_E}Ga|~VOvy)S;UqZPA^zrYLGd$A_&HEMGL?9S5Z delta 1763 zcmZ9Mdr;I>6vw>_{CMn8qAn|s1p;FEslXy34dbXFWlV#HPBYFrwJq>d(cS&Q-CYt& zA%#*BwT|dCNsT2DqLTdt?J@ZnAN*m86Fpe1vCPyNALC5Z^k?^b7aNM1{c!I0+;i@^ z_jm3c=wgFi%&f=9$4wD`&BJX+&G(~npDzgdd4Wf-b$bdt^)&?z&4IPLuPDFJQQ)r+ zXn76p+V$==n%}S~>*AQx*gDn1QoSMpuLgVq{SkaQ?3VyPxznc`7ZdiGl-DudNWK}r zu@?Nps&5F9F9u{Fir_l%0?+`+>f{2-D8`&dXXZrug-O*3NeMgvQ3HZN6UvUO z6Xs7CzDi|D8R1eM-y(!d5SxK5D8lGT(iwY=;!{e@El}lFJ7`%-MRJ=Mho;s00vh*f zb@lFm=4uRTyjesZPRV5**t2mjrGlkyLZl6NML;!&vvfk(Mpd>f<7smWHVbir(; zVcSq-t1!utoUfVdJWazYTjk zuv_kbhcJto7pajb%FXunRSkzc2prQeYp@167&SLoY+^qE%VM_RxbY zJKIav>>@$5k1PAH6>lOUo|j=>IUti&!jiopTLTRdiuJggHSW{7_y4`I7w%}ySF6`) zoPQu&@#K@ec^?X0)VLGLJ_2MXeGGM?#sg3%YJ4YWgzYD%y+E+jzJm4AFZTJYk5Y2a zn?J?8USNRk=2o&JG*5kw4N|LG^Hd+?Q~_tgYOZ@-0e!vZbJglWU%)Tckx`#v&QaiV zV2~`cR5o@%-q(bEGj??8i zX%@NK7mucfS2M_z=VK?0#=M;-^J)0ffB`Z)^4TX;>adH`tZ_84(=_fFRW86eLW70r zY{a-+Xk%=E?#;EbokmpA5)(T_RmC}Mlmf*W>AVU-n)maxGYI}cK%ID{ zel#|hB(jQsKcX7VuRASAh%ka6wM|abb!pEg!~fl)iAL`3juB0^_t~;nhrREA&{c?iDvwb9wYN_2Sb{ zeoAl1TYHmME~?4-9dVj~xV17+@w>eZ9_>-UAMl3*Zqc8M$aWjq6_4&lch7}aq6pR< zI#AX!bp)mZCT-MXO^j~=5kL&^EpP{~1Up6N%DdSq zW7Xo@Z0$GDaSY)s#jx%Qgp?}1F6hyC36yn!d_&t{Z2{T=+)utA*aP$dM}T91T=WF2 PlQi(mda<(g+1>vDq|@K4 diff --git a/vllm/model_executor/models/__pycache__/bloom.cpython-310.pyc b/vllm/model_executor/models/__pycache__/bloom.cpython-310.pyc index 81e0e5e6fd120810005dc7b7145f6a347c76c64a..e2bdd4b197f3e05418e7be44d6a6411ddccee410 100644 GIT binary patch delta 487 zcmY+-J5Rz;6bEo`BPD>uM~X#2z-UYuYQrLN(@1Pc*mRO8L8-L#XwEL}!2zNIxJVQ+8_Np?2)f}9H(nxtT3$1N*)fiDyd8h&iz+0Yc) z##%@Y!^Dn9*G$n8HP!q#_dApx+jsg2ch~k~n9#jF7rvnnAv}Pmy?;+R2u`psvVs~| zjLZxjbu}BmP5U{*5abh=1FNpe6p}Kt+ OZxN&fc^yxWul@k~1$`X= delta 500 zcmY+5OJp-<(x_GBAoCzge>t_g~o z6cs^{cZ6c4lu-+j@YJNB%OxpP6q7kIE$K#_OoAq+rwsSIOEQ)*7W_(!@eq(sT?;NSU%>m-U1q z>ZJtj<}^3v`;>r1o5%VPSwt$x5^@AVE=zK7!>J?-tZR;BjkxQD&=-aucjCp4S;;3d zl9z~cU9aPY?(6IBTkaIY6CCaR z8;xOb4rb35X@KOJ893`|Hh!DNqbJ0WCcJw?b8FkHKDBexQVino4AZh?M5W`S-=Vo`c(iLQBWX-2MLZn=I= zW|DqEWl2VU-sVt_2xG=6lh;|hvvDzUG4e4^{%|^TgyNW|118 Zxg3l<96XF1j7*FiOhA%(GiSOnI{-65Ab$V= delta 157 zcmdmVhjGsxM(%uGUM>b8sNB}Dkz0vF!(YF&xJW-IKRGc+KPNLuzo4=tBR|hr&(J`> zII|>Gw;(Y&J25@Acyk~}gfZic$*Zj0H8~iW{&O%f{o`Y1YT#gEV`O9GW8`Aw0Fg{g yj1b86mxGOEvzSexI#c1|&7H|f%wlywYdIKsICy|cnHWJDnf^1eZ2q5S%nkr{rX~ac diff --git a/vllm/model_executor/models/__pycache__/chatglm.cpython-310.pyc b/vllm/model_executor/models/__pycache__/chatglm.cpython-310.pyc index dadaa4559f3273135c85ac652e45bc8f3d00d834..5a0e6b04dcf78f61098474e214df0a319c56e8eb 100644 GIT binary patch delta 693 zcmajZJxo(k6bEomD=oHGi3zbNqyZ6q#I`iF7%0YWehemRTwGorwbF*Zw%$HPCKDDN zbm5?*NQ|S2<_#u@P_4>GDo_#wRKTbxMmIG&IN<&3fN}8+znpu||D1Q%dg*5`Inyqe zV}twxcSr6!ZT9*jenZdrGl`7X&_rj<@b1^o$Mt~T?N25;{Fxpjo=%yq_O_i=GL5=5 zs(d7e#RwPzqabHqslQ|mJw#mvT;MtwmXx-hO{BD>n$&t?B9#`pc#PH{c*gB}$Eu&m zQYjOcaWe+S!E-Rd9;MPbiSiD3$_JGPl;`WMA;$+ zP#**HV14BRjp^!*u!j8s!Iw>wyhi0mFjwnv-fu(IT3XkMUHRC;2E^H^DR7 z)jAe@B0{N#pGV~d7z5A2xIi-V0mQdJAD95Q!BYxI_gI1EC7Bg;$vMvKe>Pkd&9F6b zIuea5sZ>nM@`7Hw^BrT;RB7A8O5|`|W)n2%`q{g*OcsYE3!lQ`89~{QOY@`1rojzx z7#sl+@KPYH{(HYeD7*nnE8ik5fi6MVswTxJji{+iPmb?HrH;0GhS&^^NOsZ!7FzJs zvm$Ns?q@~)nD>Ce^d5)j=#FoPsK55LIB>nP=}b)Rj_3F*BxWrciN}-^yb-gL)Zq85 zpF?;7Tm;xcnQa@0`#abEdqG6Vj^xy$J>7fz6+=@gwF}F8ebTs>%`57g3HH zX{ydn>Gmz_J};X>i&ymP?NtN&PM3Cb_Cq&zoMla4(Qtropa#?m%EoMt^D12nG_qN` jA2`Kkb!V_-WMx{|+sx*vDdaR2FkPgsP(sWMhem$`@5kLB diff --git a/vllm/model_executor/models/__pycache__/clip.cpython-310.pyc b/vllm/model_executor/models/__pycache__/clip.cpython-310.pyc index 7dccad739906e6696394d06ea2746996ada39268..8d371d89e5393bc5238b606e4cd88fb285ee8d4a 100644 GIT binary patch delta 614 zcmXAm&ubGw6vv&-PqP~hiZp6tp!s2vx>7tomc1ZnVIi=-**Zt1Un&9bb8{mQ^a)=7aoxa@bvUK;w7TzjN&^2Sp$9QLu3_|bwmlV2Ju8U z{E9ELUV0yu4fvcGkrk*WQ=HvokF3H}>JR5($|}4-%QA;6SyV4K)dgy{s6kgy3h3rs zOVg?AY3e4$q;wtn=^T&!k^Vig!3BOx1@+g6H;8wzbMb+H6VD|0H5rF5`RH=&9O*+d zGtJpe#^6(Cz;n!IE6Nu7g7hv%-a|+T6S2hMN_I`9TDh&)t2IXZu$N7UMRDuCp4i;--A|{21i`Z=%W=rKkBW8~*>RAHkL%lQHbespxgCd;OsU!6zI@{u4wJ zLV`pD0+;i*$R@P&l`}(bp#s9k;d*SI?kmh>Vq^djMJ5BMsQe{l3F3v4h<{J}hygq; G{QL*VnzwQQ delta 563 zcmX|-PiPZC6vmxNvs-r)Y5hZK+NRbtHJf&`4SJAx=)sdcc<>+^EM-kL*{y3fnH>p{ zMhYIqSbesI(is0G#T21sQPGQd6%U>l4}xdGd%!wl!8!bx_sz%q-n=jQZ+Y1XhowX8 z)ZVS^$#O6;uibWuW;;3E)@qbXfRRrGTEnCna*c!OVWhHFc6-tQuC)q@)GElo&G&Chwzd zXeM`17cNfkQ*gkvi$Sv@W?Kg#iBuVN(ni} zDkXfdoE>n~6|@V#)p#Vs^gcoA;UMmXgd-?~B`hJlk1?pJ3+xk>RN+LInF!_xGWY?P jHT(#(kulT;NmEhVJE#3Xr~$+2tjrfkS{!Y-oBsM2#^9?* diff --git a/vllm/model_executor/models/__pycache__/commandr.cpython-310.pyc b/vllm/model_executor/models/__pycache__/commandr.cpython-310.pyc index cdfcd5dc35c377f77997c1a1c9579fc72e449349..91e8bc66795ba9d153ca3f477a06edf9f1827055 100644 GIT binary patch delta 70 zcmcZ_aWR5BpO=@50SFA&?%T-S&8p(1Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS YUrdnuMXpO=@50SFA&?%T+%#HQk=Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUr7tf$X9V5YahVKv7(=3&_;uEYb&w zOaKv?AYvkj$OaLUHhU;0GBdVLUZs-3)&~+PpS(aqe6qf3fHX+`EzW}c;>?oF{Jdgh zU6W_2x+u;7%4@PCnLP)jAIa>=|5ay*&jJa~1Sw^KC^Z2I%$>YWErx9#keSRp`J=e- zWMy?lq1i~PKvF8V9+Kz30(i0A+kQ9PN&@i~db zCGkMn>>?SEcqfq1iOh^Glb5MvF!oO7SIv1Y$-h-+h|dHG&HyQ8fhaWr3Cx+iN-c(Q z?qqg#OQBgvl5-)FLF&($3Zph#Ys_S1T(J47rV69{Jdlhih?ox|m_P(8hzJ1@D<}U` ml;xTVWF{~&FckYuE)(_zm1SK3 diff --git a/vllm/model_executor/models/__pycache__/decilm.cpython-310.pyc b/vllm/model_executor/models/__pycache__/decilm.cpython-310.pyc index 9479d4ee3646aad99d744a5c92ffb1f283f7af2d..30d7d4c07c203b35fd4339471ffa401f7f4215b9 100644 GIT binary patch delta 70 zcmZ1_wM>dTpO=@50SFA&?%T+HiB-izza+OnzaX*D$wSKPNLu Yzo4=tBR_95E1L!*Q=a^0efHn10QcAyFaQ7m delta 74 zcmZ1`wMvRRpO=@50SGF$HEiU*#H!(=Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> clB!#fn4F!Mo?5(_kxhe`*>Yi5Wiy8 z8wZ(-2cpK4Mu{OkV!WC79TTG_y{Q*YrpALNTzu0t(Ma56fA8&oK6Yl_`xt#0t;^VK zwN>H?tv*?+TbH}WgNDw6EWrkh7>}#Qz_322=^;HIOeH3QY{Aen>Ec(p+6oc;Zkuj7 zBVzfaKtxvOnaYibln-Tjv^d)^3d#go&k~LhP7qEKjuRXNGXcJD>;|>C*|;Iu(n3}w zo+2y5vSSw{(d+a;3imsEWS!&;>dwPLUUPczo%0^3c)scG_%sDVNt#ONij~iauhO0UhoU`<8xAxtF$zKi%G@e?2Mh5{7&( zJk);WciROlw;zN8?)E$uZGZD@258dvp;DtbsR9L!5iXee4O%2|c#aNTzD5QWuXnr= z!QoD}gML}sp3FrjW0RVi71RFE`P^2S{*o{$7UBKSd)h4R7DX=-ZWC1W_+CJ~xZzs{ zV8z9*A+g}2Zndt`i0O?T{_uaIsj)l$ptvw^{V{Rj1_Q6alI~wtruWc&iO922#xpbg zqWBPHq)$ delta 862 zcmZ{iT}V@57{`0gv9swmHJi@q4t|hsXIfK)ki0C!ii8MnMzq%4amQ`$?A`oI@dH+O zUex2YK?EU06bHJosOZKrgsy@?<)uYXcLqWAJX??;or~Xj&;Nb?@A;qSIa`tU5l6=5 zsyam1?31O(jtwO+9Gc9DP%0CPra~#>TF9KuCo&U#CwhBAIU^rGZboCt=vX{weNifG zP{eO8z3~e9#V8@H#AnR7$cN?W-ki8rtp4QWIBb zOOvSjUfbpRQuZ}=&ok~YbgXZG0|{%V{Wd_>${p(irQ8zgfd^l8oOSH8p{H}?KgTS0 z4$|;9JEQdT1pRM8$}ZxMfPRvPA6BvvQ)I@)B0bRem9=D9TiUNpm9=GSRSN*b@mVl< zYKRK#;H-24%>t@RbV8jZL9L|FbR?;YbUP^EgbJvW|LLf9O;F2s+Er`4>yfM&bdo4w HB$WCCyd2iUBj!p{?{W+)hCdMbUtg zpo?oIicm~_A>wO90TCaVXiQug7tEjF&V>ti-d}5?AtcV?n{&@S_uMmcO};Ff!vhQm>>q-NC3YSQYGa1^g{8xl8edLu!L@HiKx-);e{h zL#oz&w)(8)C)o!3P{Z;h?NI0elx2U&OBY$9dX9{-=9;55 zb2wZ8UV**f?`V@)rU4_^2fnb3f&Eaqu#$Y!4P5>U(Y%BoI7VSSL8w25J*o? z-N1j5+3u%?Y<+QqBOIg-U%)N;96oQOLym-+1OCdga;GEc4M}!cbhn5eDX7%x7t)AJ z`I&9kkg#IQ9nwZS_&owqb?u@rED8D4$8*{Vy1*H56hy!&aF(O$g0jyWqFxkEf+%R^ zxKhIYU|U#{Iwji8b2Zf+@Q1vfaDZ=l4qYvv2OMLyMyu@t4_$gH1)D`#qUU)gWYHZs z?*oUyMbNKYGu9H)tE}Y5wB!<#P1nh3mR!_D8d*8+G&<+ zzPx8`k>4vM(ObCw1{el6QB7Wd2b_=|!QJhi`-+F`{ z+^X;uQ>+Kb9pZs`V zNb~^;W8fhe2WBwA5e$iqAE6L`&&P=R!4ydB#3Pk>Rh>_aNR-y|l-Y{Ek{H`8>?JWp z6y6gu%4{X(%ov6gPzdg_BPG>jlChGGoOPeUOr<-`=oj?=*@Q()V|mYT;S5@n60Pyw z=2(@zk<7Cpdrj8tKZo<^o@1Zw?+h;xz64L$Oj)t%Il|RqEz&r<5KSsS%A7>gHpcAE zL-^}+h77N9vJJdp$>rbkmJtpD6GzBMEcA+HRrvGY@`|dHMJl#Z^r`w*QI@@a4_#uz z6^n-37^}lr0c)`2uyEz}$_3O4z#`ZORyUkPngsM#X4O9RC diff --git a/vllm/model_executor/models/__pycache__/eagle.cpython-310.pyc b/vllm/model_executor/models/__pycache__/eagle.cpython-310.pyc index 52cb839b063ef29ccd7e071ff03352437fe382c0..9aedd9d494334792af5632976a8691962d4b081e 100644 GIT binary patch delta 78 zcmaE-^+Jm~pO=@50SFA&?%T-yl2gT9za+OnzaX*D$wSKPNLu hzo4=tBR_Am4A)I|Mvuwg1Z`Qw7`d1>TMC&n0|4~!7{>qr delta 84 zcmaE%^-haBpO=@50SGF$HEiU5$*JM3Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> nlB!#fn4F!Mo?5(Fg6k$bqu1n5g0^fTj7nKAMFgSX)aAr3KTJ7$5X9bvRvz7`E$BnG7* z2HPiyEPAL5MzPef@gzhO|B0S7F~)-@4{j&F*AikpILZ9-=Dlxy^Ilq$^l_t6w~0S( z%c}+bn#R%TOGOjDgp_DW32Z=2wX{cv2BU4!%f5&d@+F2-gYlUBO;fW4O0wGW0Zcde zWF`?~#3+8>(Ew@Lyz{5hG)b9jM1)AAwf-Yq&ssa`Cg|JG3F;zoCiGv5pA$mtIAw2P z$hvII@X)Pb$0#!|*ERIP)pR9QS&CvEtEO_6Sm2aYOo$DLY=#ndiCN+fVJGf!+=lf< zDRGflBx1yU;sLR-NeQHqDk2Pv41et@!UE=P0T{>6wr*}>Yb|!EHp{(xCjm0}$?n(F zx!Kb)Xm^}wdPw0T;xX}rSmK;!Jro9s{lo-LIer*7`r=lyn~3|494cqV`G}G}#jlq< zA7@dKRc>Cs*==46)(piGLO3jjE1m35N>@ZSg+`}GUp@@d78yM0JP30*;@qV!FZ&FI zY74%0Uf4cQ^?$p8fySe@=e*+9{HJF))0nfop!u|uyQ(s@+`tv=a`iz0^R5Hi@_!Wz zGw=jBx z|FZAK77fc!;W~(gPYfAGZrEd@tgd94YHMoVpoZ)Q~B!oC3 z`b3IJr?2o42H9a!r!cyG&Q#!`s9-&$l;o|gQMgX#TxxhxtY@1jeV*R zJfwEW{cTeK1zc$l8E9Ya*YSHK?ket3dc-40FN;uU_j*id#~ zXf9Fy-%U|yv0}K>D^z$^)c)rtSnQm&&5;Ln6IG4U`hn)L&l80Ota$cWUjLO`pz3+~ zhvy_HE|uluI|l%Y_`>V8EKx?F(zV|pW6gU4mayB`yM>OU1EbCeI#BSZ0mW~HO3wSn z03M*(FKB33HjR7zVfY|l^OwN2NJTc`TAUpO=@50SFA&?%T*6#HQk*Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUrOn*Uh^PY*l^`MrM0kRTKoC(2BB~~Lif>|c znrtJX$-=|P!niqG!i0&jW%2^46vo!ctkQECYbGz2cH?dVDUJaVZJWPH+cElg0@=4% zixTtFQ;WJl;@u#k2S`NmWERKgBo>#%17)*|q4>2N7`~VgiUr1Q8P_ zH_E0nHcx&jo6p!ZIa1D%v1#*cIe$jB86er|lRwB`1&SY2P!j>$%bt@PpOKoFQX~bE z?wF*g$JjSnU(t@4id<7z=Mp8QS>kg*=FSEwWq~M-2MNrZ zd|4@uasFf@WlN#CNRsoxlACLl&oVL2n(VFS!?Wc_xxOpO=@50SGF$HEiS#V$<-^FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` zN!2Y#OwLYBPc7cu$R@(a7`1tt$U!E(Dxd*Hbs(Z1MAU+a3J?(lB0NDvAc&{|5tWl$ z#Wyj!Otz5FWaDCF`p?3&IaR`hiLrU|EU6U6mdXF6<}y}Ko-6If-3(G510q^Czmv9O z^zQ(&Z?P67=B1|=b%MmZKtwl?h~mjCj?YOfE{O-qW*5nU#Cw2*CTCGJh}{Pw;y^?{ zh)4tx6DC*7rZYB8ek_~M*f=>@&Jjp{ln~jxQqG!@Z8}KBw8^jJuL4C6D5!~m?Pkx( zjn7C;OevBANw-h_rJ%>yJ6TiFj+uj%V{(?Fg(!B5wkx_Q&H!rBWXIDzpO=@50SFA&?%T+HoK?k5za+OnzaX*D$wSKPNLu Qzo4=tBR_BRFV UlB!#fn4F!Mo?5*58*8f)0P7GJLjV8( diff --git a/vllm/model_executor/models/__pycache__/gemma.cpython-310.pyc b/vllm/model_executor/models/__pycache__/gemma.cpython-310.pyc index e2608e5094eaa73eb5f4a8a61f04f77c33f654ad..31ad8d30894c4386fe1417e85f1dbc658987d394 100644 GIT binary patch delta 732 zcmaixPiqrV6ve%XnSj$!tqD!*grrSU8l=Q7R1~zOP(?&=8EQj_CN`m&Bz>7AEmc!( zqhS0~z12o-MHfNjjBBAP0=jB@dnA@ZEuBUc(fv zMAuVv-AOj#US&t{w=ExH3f0H0$*#a+7cpe5DO0-yYvOcUI0=U}J?#>f`CDjRSwpVC z`EZzC@JhHsYopYz}tX6Mo)jK;XAsV@>^jB!s|8$^b*$iUEVrr7$dt+>EP zYj16}*aZtUuBw@&8&@tG6aR$zKbRPICMM1qSTru2#V6&GW{g2)lZNWUv&uN`_gE{3Q1x!Y^2n(*7qH zp90T-=fDDgmbSu67*7F)g>6?^Qwpl+gK&r6LVPLY9YcT;u~M-Go=+n~4Oi@nWJzP1AGm8%eLA_XDp1 gC*T1t1Mir6Bh=vTWStu3a&oWJjpq{${&3j%3pa?X+W-In diff --git a/vllm/model_executor/models/__pycache__/gemma2.cpython-310.pyc b/vllm/model_executor/models/__pycache__/gemma2.cpython-310.pyc index 6b8f9e30a3289a77eb435cb3e14682f9c8098ceb..eba3d7d0093ec6167052b358b2549610e61bfaaf 100644 GIT binary patch delta 711 zcmewz@jZe&pO=@50SFA&?pw&suHvCzl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn zP+5|ZpSRhVot2yM)@DngbS9}>px&Y^5RnHW@iYIGG-Qg_+GBufsqCp~slLe)vlIuWBkXg4_ixTtFQ;X_B0u3Od5lBSw zWERKgBo>#%17)*|%qfWkB{px!H_mlVjym8Rty)(~xB>o%~SVm$7sbr^se!1xH5FPLMHOAfg*Y z^ni%o$ukv8+2(eAvIeB52o$uMED(+0kXSld zPc@El+2meTOQ9u5lFLAJJPT4Yd-Xg&=`BAQj9I?H!ZXsYx@=*?dYZl~H~< yNLCs|tN;;AAc74SLinapA&JvJl!7jpJlU(o8bbJCk7W z)hZGdx;h9#;-i`>xane`JLyhbxv97a_%FEa!j1PB@d4sp{5bbJ-#O>rvpxH5)@%5D zyLRx?+*n%mdQunVy2WJOP!(O)%hzPHX_t)JvBO7?$X40b4w;HtQHq-7$R3v$a?X@k z6hb<$XJtZ_P$Mi54BQAr!E`Ya zVv)ieM{j4PkyjP9q*?4Ti57uzs2^`+sb-i~AE-U=1H8PKmGnNUo8)i=PrR(874q7GIFiCdWX(yoGO* zVQ4$=lNv-{Q#MR^Ll6jV!g)e}Jsm8i?nB4*D$wSKPNLu Qzo4=tBR_BRXO=@O097{?KmY&$ delta 66 zcmdleyj7SxpO=@50SGF$HEiTQz@ibRUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5JevHjJqa_*@u&fc^EZ{ogm1? ze;^2gsBC3pp_P9jB39bi`3szzh=@~soVjz(VP@WDUuHX1GPjyK^p>6 uf~TQyXb;Q$h<${BXhpOjs-W}*359U*kWlX;SQdy5p^=2I{=F2O5%(L2NQ*B3 delta 498 zcmYk&OG^S_6b9hVWMY;@c%9U4v`E6nY7^DQpbIYB1QCRnNzKvGZ^qQ@zHC>Apk=Ed z2qK2s20=d}T~wRe^$&`^qY=&GnU^!?J&UP_U&0-#&1P-kPv!pLw&UG05|N4;lN2=` zRU{=HlkyckrRFBb#zT^p*5zP68qY+NvSv8jZ`xqhciGsx@zB1)eYVeXU5+!z;9`~+66+e0>#NX3f|8}a) zoeA%wSLdR(1Z2{uw9f+74|EYkPf&34HrhfPU diff --git a/vllm/model_executor/models/__pycache__/glm4_vision_encoder.cpython-310.pyc b/vllm/model_executor/models/__pycache__/glm4_vision_encoder.cpython-310.pyc index 1efd14e144e6deb790853bc841924cdf41b93192..2025bae472665e7b4ab44d5f0795e056ea22176f 100644 GIT binary patch delta 389 zcmaFn_{fnvpO=@50SFA&?%T*M&7u;jUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUrd%UmOcTJ(m4q2p7swTI$;avYIBBun3?yxlDJDS2 zk88#=C*+3F)H-Q0ExRG4iyA-88gjwG3K!`jJ>(YgkTdqF=h$oB_-j`?BKamFToEkA z;<7ZArPMUN4;>uI4E3G(OxFC(rYM*w5m-Ukq2Sv9*b6ztVb9tzq5MO8BK1CI?vRRL zl5m3v4)J+_08&EA$b8!nZzd8Ud8CRA*hnwR^Y2J34r(B>KO+9uU65vSA~n<3AmDyM PCrT6B=8FaFWvl)R=96QB diff --git a/vllm/model_executor/models/__pycache__/gpt2.cpython-310.pyc b/vllm/model_executor/models/__pycache__/gpt2.cpython-310.pyc index 3cc35e57d1466db0bf519f19f17999e0de0c12a4..39602e6353be42282aa2d8d4ca191bf55c4f37f1 100644 GIT binary patch delta 545 zcmY+=&o9GZ7zc3gVil%hznGaH2@WOH5+XZVL`cMiWQ?g+Ypbnmy)82#A`XrYPv+o1 zaB!I3#eX2KOGNw$vPj%`pSesApFI6OecNw(m%L5-OrGy(VORX&sp`AnMi)iLutZC@ zCLNh(HD_|pILaAuqa+q|MYPIJ&Mdl*T!kYwcZt6y-D!51ipUnS?Y?*2d-xQa1wz*_ zN zX9zwzjdKpskppB7$-_^mPBKsr&y$Qh+fya0jXr)lj_V0z1Q|mzh{Z?;9bJ=3CRHWP zP&8H5i&>juzgkWno2wPs;1I-JIjE0I0Urste0YP$Pilpj^UObfj7EMjzNhg0(R5#xUqB}q925m v;U+duPT@87GE~AmjGQ1I#EUE=SK#j)ASS#GY!TB<3|@M;#{V$kc{u$GO;Cux delta 541 zcmY+=&o3)c6bEppVT7uvD%FQ45u#6YD$BxYVDl20#LC8>V5v6z0b+rbjeBZSv-srR^PPL{$vvOFnDsk>Kx>2eD%S^B{(Wim zw_N5-ww#=1$(EUwOBJ`^*pu;zgv?FX7%yqLO)YP5@4s{=f#S^tj-lhPXuxDbAy&PI z_Df$NCDt)ui&RSCX)p^Zd<(uy%T!pwm(CSf^X5Y;EM=&o393y@v-1YaQXxm^0;SF5 zs-o=>BR;$q^4^IyV0{ z#dBnCgc`@1>t^NDp>9^%Ch^qYgLdy;&lYV^vys8ZwEv8*mv`Do3b#mL->d$Vu3iqyKq0)c;CMYwwD|@^hvdMu<>S4`2-n0 BiN^o{ diff --git a/vllm/model_executor/models/__pycache__/gpt_bigcode.cpython-310.pyc b/vllm/model_executor/models/__pycache__/gpt_bigcode.cpython-310.pyc index 97c4c4cedbc61581119501e98fb2a213f59a72e0..6fa561a0486e91e7c3800556c60b76a0959ff43f 100644 GIT binary patch delta 604 zcmZXPzfV(96vsVa+d$K3+R`7i_)>!;PiY>Nfv_40leqb#70PShqkYo%gWLB&pn!`S z6BCEC8sk6UVBW5So0AR>HgRxscXBZCeqR>|clhMw^F8<8bAGIRUrD;D)Z_(uYVSXO zNdAq_-qC#9(>%+o`nu?tes#$Xx^~Up(|T4*^Y;C&>xA=(ew>EkyOcqfAIQt120R4n zVfNDaIBjqtZO|qkrGLin!Qbc2%vyOJ<%UFkvgZoDx$Cy|mRN+ooAar`FLSHZ2*2fS5p8j{u%O`m zVWMX@yQXfeiCJ8^2FwBL+%9~sG-at~#dVk)K-3k@9(6T%wK%6mlkOtU118XxsAmGl z(+$HkM(Z{E)`2Muep6J-J(;Vq(eUTK{#A5K*l0N6xqZvGT&I6#ukGpEl|4L=IJNzO z6lc1=PQT4Rfy8L)#Zl`L#34T`wP?VCY233e@*emb?w5H5prSV%i6Kl=5f%gGW0tMcYWh(N4tVk6RD1rUHnCN;f z+er*{^|Wq_pJv)M_t9wO!FR)7vA?_R0u6L*zrg>&!+~!I@l~bkVe1rvP5zZEP?K+x z(~<9O#b&GMtItn}cK9|mMnC-2P?pkLD8#`w=l}uWf?ckrQ{?fVbd@~+F1^(uX~;cp Gj%fF7-Gwy( diff --git a/vllm/model_executor/models/__pycache__/gpt_j.cpython-310.pyc b/vllm/model_executor/models/__pycache__/gpt_j.cpython-310.pyc index 2025e1df2e58a836c147e15470f42d805fda9b12..1375c93dcb9f92074cf3c39b29bd0f991217aabc 100644 GIT binary patch delta 502 zcmY+-J5Rz;6bEo`6$n%`60lUjM`A)848f@Qh#C^3qjAtd4G4lzp}n;&;0r|t2M3q4 z8Ycz^9ZUx|(2Y1t zbD9tPGGoN9O<+xt8AL_qkbRhUr^yb~+>|82?TM14x$b!*>}OEuC0U3F5uyMUs1Kjl z?JCtJL!yfQZ^^f?I8#qznad+I7?t zmj6QYS+o#N8Gx6*TXGJnuOw747(+xH=bO7K@Z-ypDrEeP;3G#h~$XH8;Mgp0wgUmse1!~g&Q delta 528 zcmY+AyE6k(6vo{p2{u78VMUUmLJHRVImTqhXcR`F2@;#Nl9kQgxVu4!XGeQlg+igw zm>nt|e}u^xg-)r^sN6#nxA@ID-*?Y<=H9pXdt9VGUt?JtnyElk zxbP>*27LG}_ZsR+NC)Oc70WS%<~V@~vY6#{#l;jeqcI)zEkuqZ;nl5_p;&f`yEzs{ z-Qb8duu-f{#1w)eW)KCK3Th+`S3yb?Xladeel`c4&DML;uJ9Wb(dKE^CS`ezF$rff zFf5IeJme%A#>`4Xf%5n2)U^I3e@S!QJKT?Xs`l?=Le+k3r(ww}!A|>GWDnb2L=Q)- z?r(4!g#!qNR!JGQLz970m0A8ZoyU-i2-`Y5b=;5>Fv7diDH=nF5MCGmvX0?9oF%8A pMqWD)(QHE;Aq0dAVI$5V8I6)6l%p%8=)6R)1vh>OE5cdV>JPuch64Zq diff --git a/vllm/model_executor/models/__pycache__/gpt_neox.cpython-310.pyc b/vllm/model_executor/models/__pycache__/gpt_neox.cpython-310.pyc index f551e48db109ddd62c3d5547821799e9eb916367..a0a3d4aac14f780eb0961acdbe4cfc15d00d5576 100644 GIT binary patch delta 581 zcmY+AyHDFt6vlfEMd02u6mwrg3c3_|fajBM|Xy z>4t>Pn4t?xtD+KlVB=3{J7;ah#MYrphu%|`^h)=qPv3Wr&e6G^|1vMR@woVaKjreK zBQ?Y0OJ!zzWzX_TOrwU*N)>z4v=w{1+_2WmUXz)w6MPQOg-AEJi(e60gFYRP zo)^PCiydNr?_!f9?bJS+EiCQ7FP%l>2yRDIatw=^>BK=#c>FI6&NHh5c?Um7OJk?# zC>(3ahO5=|n!2r9hRIal)I6QO2PHQ#geQrS75Ce!N p;tVSJoVd&7FaG`Kup*{mD_k>mgX delta 503 zcmY+A%P#{_6vmy2PD>RjW9l)LE+o3BAtXphy|yf{@~UY~r;Rap%v55$-@C5P($)fr zAd|4Nu$K4(x*=Bf{s88%sk`{yFW-00$+`D-{BbG+!_d&to^ILB7u1BQWL6bTwcSg9l7~6>Gjs>SvNym=6BY>yA>-cEopGRH zUpNanJP+^iOXR0eYM2gcBnJq2cdKC-MBURRpQRX@YORrP5E#BTiZRoZ@hYpI9E&hS zun9>*0eK+@S!4nO72kwWP~BM569}r8mI9htNEs^Iv_vXi#V;`qI!ciqew~aJoQ*8B z(%e#&$-GDAnPLB%{t}spZFzazU$(qDWuv&T{RjP65SXzZE!(AXu-(CDQH?>1z)vN zA3bU{Y--!6EmXzp!dTO8x-ur+8r`|lg^5Q00Ph)0G%lQEzMT6zk9+Ptw>I!-K**ZS z8`tr#dvUogj2YaaU_PA-=2E$?d{h}soaJ>7}Ge z_TC-==P0-5HA<2svSpLfO!hSb;t_{8bc4*BgjtlZy?~;3Rd`0`bHWsU@pcMN$!v(MZOa5`GBT@n_5+Ng&bPINk-LL~ z4^N%#3*7BH2n^A;ueG1+MlcyoU<3{SIkoJ&uLv-KLw?DvUYa`C4LmYz48;?fd@4WO zcw`IeqH0m2et1?vF^RB$cu04gjMJgU{J KGppd+ZLweLu*&rS delta 846 zcmaLV%TE(g6b5k5P}|DT7{L|+3l!Q)Yo#JAbYV!03yF`2E+lo)6k2Enc}xdQ@j;75 zK}3Xu8UYc}@Ddf61QSh&3pPeq#Kgq7)P-^5f1vl9nrK|uq`!Rk%$d_Ww=>m@Nj=>iFG8C=lTty>IqMf;LxAiBuk@{1|OnFaZDm0bl>mVVLXk(6rm z4rw0>f>hWo@|>hZQ9|})DVvdd!7$g_-8BPIMHKr!g@1zR@r+L}uq1W1H-#yy<6qW5@ q0UQQ@HoSi)jcN`4(;3Dj>Z822r~Vf%lGddF diff --git a/vllm/model_executor/models/__pycache__/granitemoe.cpython-310.pyc b/vllm/model_executor/models/__pycache__/granitemoe.cpython-310.pyc index 915ea8154102ac45d639acf2bcf9f44b87901d13..92d51607e710db100da92da680cd79624a3b2fb1 100644 GIT binary patch delta 670 zcmaLTOK1~e5C?E)Ya2)mh&5_#%%f4$)s~Q`Egn25da5XbAc>H$HA@?tedNnFeQ14D z(g)gBGm3|*c=e!C_ui{V@tD%PCokR<6~F&R#DlnpAH#g}&3v;zbKi0SD;V@|lV9fb z#(E&@J9s|r7y1H*DK%4IKUBgPKA}@S6|o8{noSzoT3$RydjzQ+y(NJnl`MM;*8zbc7dy3aY#mZ3X|Vqjm_vR&4Nym$6Z?0462* z?g`V@N+rG2Ubk2)&*-AgA7cG9&);KVIdMZy?w)5c7?lpTU||@-Q_R6eSt>^&w?f&N-okWze#4pUJnuv{<^-3nicnJ z^0Pv7{ONFvme`j%Nl*B6%AhrVo0_9#&h~vg_7Ih4K)Wv@27AF{pny(r4y^I}&;e@j VWp#lX?v}ctba_9p!7uv@zW`h?tM~u_ delta 713 zcmZwEPj3=I6aa8%fs(K#Hnoi+$e(h6jkPP()Og@x^wfj(WWc1G1tzd%*>YLs;`v4ULVltwjM(N(*p@YM#3Vg5Qt3Jp)N ziisj}1G$XcME;EEML!c0)Yv>Rowu<&gmfSmKP7ro`&icpD?ULi=*I`)f9IEc>6oml&}NxdtC~@>SqH|Gmw3yir_^JgyA`48&c_YvIVcx z`H0tpum}Hb-@=+r=Ue)Vkh;ZV*Kcbp)D1Ff>1u_#fl9s2pWFMt>)^|rAy1%?X_6gy zletYcU?#ga`w)AaMTQeGdW;-K01=P?avs@%lB-KL%jHW?l<2(_nz;Z zneTGn<^qji@P$6{J9+Qn_klehb6dB4Gc2{0acXwPHtiEmkyi}o#7b?aT02?0m9fkl z8GF~MHtO`Nvcw{-qXT{q8>LzQ<@C5nD=rg>au^EW{R_$-7u0j{r9 z-Kl@VGa%jqoTF#M>A4Mr5c3NH#147pB@nL&DEL0rEu+pC>Ga6C;Vu&(Sf(#V%GXw~ zZ;-zV<~6`7;548g-~j{yZO;&`1K=A!1L)*!y9F*w7e|k=ENu;{v^QGrhXa%jPS8mB zYVfRBh%?*HQ8S!oQTjSO8@-5~JvKcF=M-5{ijGGvugD8~`4wp22V6xqZ&&4uU^|ye zV7W~9A`6P#8=${NrqYM1W|J18D%+&Dqra)H*RY#fu&eLwmgAHx-7e&o#JsQda8RE%XX?$DLM9Z^+O1+13m_PB%r&#!VzvX&GJss>Me48{LI+{ zt(09nRJD2fX*|yIqFS}}$M|iQf|nZOdHi`?PkMpF;=7E?;g(J(=)uH$%6>;f@wI5D z+M>|%1Rz3sJj+t8JMkxMv@96S*KV7Erj10{8)^H6o^v^uFWovuy( z{`nS8e?EdZT{cnH6T)%{pbKyZjC!e2HaPc!DgZtJ9}?duN0$vof1h_qriejxu+@T# zvA(|Mun6dvsq2$+8ksywxGUe>uBoN-iF}~_4MVmReUo@+C5iA~Qk*I8Spi!WpbfOs z{8uKNolnm7I$KI^ k*-uF8(_8Fa`f~aQEsKYuW6zv-rS~}7XU?>(TEvPMiK()nct%6lsH72H7t5OY_4kIOw48EZzU8!4L z7`<_2W7J(;m>7(Sn*IP6nz)q282tg(l`f3Nci*65*;o?J+;`@@Gw*)PJQ{yIE*UOY za|8R$KfC%wx+#)$`K}ltebezdlg4#JRrI)?pNSXeOS48{AhxYPZstqc)}o?bP;#0H zpBxF|Df=6p0%?b^^C;;6!|9iO%(5bu464qi9ST(nIgR>Z!8u6Q!ds`WEx_*6ZiF6$ zaQU0FiAY@-a|l7RwB+#MdK0{s66+Hzthh26RaZ|EgjjUjOeVH7^L#rh6nh+;axI zTTNaA$o@S{2$u<1^!A_NdnKL<-HG%r1UrI&;6hkceiN`o4vG_OpL(m^3(I~Ha`KyC z+NKrFsH>*+R@c!#3CDdSWCCvbd~zoebxFVQrK(9k>>$Hw)SN;%i!jZgHr;d+)y#Z$ zPSNXg9`+|kv2QDrT~&%F;iW$yo@6$dVtLtrpRC8~MhQidjiV6jr&#nwLisTB+J~Ur zIpL_bxj8UWlWT@)DQ}AhrUNMwDK7-x6ZZ_diB=<3lpKK@!EpUhE(N#StJ5eST~#XQ znCoZuH`^FAHQ0&UDKyyy;iui^{z1>dWY^a#Q|#8C`DC&6zVf_Ua5;#8MwLdbpc+|? zQX5jI5zZjrQZ&p`Mpx!FS}^Fv-_7C{GOAWKoN+!n!ee`Tz~y*+*P70&dGO|6(45uJFka~Sd0 zWfMlb5k?UH<8zRO?>!qjvrHWg(qVR~I7;)yd?8mggyHZhatv;VpGT8ui7ytPGG1|t N8*8S#I%lQGj$fQuC&T~% diff --git a/vllm/model_executor/models/__pycache__/interfaces.cpython-310.pyc b/vllm/model_executor/models/__pycache__/interfaces.cpython-310.pyc index bfc0a434a6b1e746d35122a048186ea5ba8d9f51..54a8e4bb061a4a345c2ffb5edb19b14714fde515 100644 GIT binary patch delta 62 zcmccOb-{}}pO=@50SFA&?%T-ynN`I{za+OnzaX*D$wSKPNLu Qzo4=tBR_Am8k?Rx0D*%P)&Kwi delta 66 zcmccMb;XN2pO=@50SGF$HEiVm%&HNfUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(FiA_%)0N08Y<^TWy diff --git a/vllm/model_executor/models/__pycache__/interfaces_base.cpython-310.pyc b/vllm/model_executor/models/__pycache__/interfaces_base.cpython-310.pyc index bd8289cb7bd362767984296b36311662ceabb5e0..30730cf696eae68df688bfb1ae87909e3206c3b3 100644 GIT binary patch delta 62 zcmeyY`CgMdpO=@50SFA&?%T*+$f^>kUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrzrOU$jtL6FyFTz8y+0)BNQpolT2i%bMuM%uXwa1%{# z9~6y{dkiRX&T|A7aLaQN%J|!pjMRf$#BI*G$1E~;nET8UAvcNtb4uP(n)AimPZ?(4 zL72w@-yliTu;SZ*Djx2BL;G*tpF67Do?sp^A?6`|>RFQNGeNAAb!3;B1><>=TsFk3f3buo8T3_7n#9zS+P%wr=^q*_^ve(h| zn5tz{W57}FTxZJ0Zm$*K8Ge@|uz}8S(p>+brg&Vo;jUMPC-^)Zf=!fsE~w#;@NuXa zhx(pEe1`iU5IdGLilz$vln|;&?i(7p;@b9tPZWs1x^Q(ipp4{u?}u1CJv%QY17&&_SFk$K@zHk`oHyg zG=ds&>fofgS~oXG2a`_K!NJLxCS6=K(Q}~j4Zrv0-0yzhJMVY?Z{DWc?baRiRM!^X z*jncJ$#kV8(nWouP)rwR#?y1v^0Ypi89uN-U79IRrsfJ07YpYnOY*JxxDE31k7FL- zGFF@?K;TE`d(sXiEW3NROdzD;J_DW-#cK|6m|kLvQD#&SyklX(@+xDVumQ*Vj!Qh5 zWmIv|Yrr*h`9`3QIbQ_ovf{Itf;BqTc8VKpT3{^p2P*3(cKk=7hF|u z+Ba(H-Lm61e+W0DR#%V6+%3j1KxzU}HPY@Ee6|D5-^cOG>=>9*=N+qO;O z$vr>6Yz8qt&O~o`mgQ^#SOSHoyH(wS~*}h&H zX7ik`LM4G~z;$4)IGyxNS*GwkL7zMaEIQ;IRe4+4Bz1bb1Rr>Rm0%%KD?H@!m(lC$ zLWjAbx!k01t(Fe!Q7y@e7Ljp;nvrwtEi(P$zSGkBh;CS&eiEnln|iNZU9vb^6-(+(zt{|135rZub})q@TVMGNBYE_|w5$c%J(GDqEme{(}{F z|8XuLdcJ6@m6(*#sJ!ltyaba0_yiQ|TJQVxtuD@%=v4h2o1icCEr-k_vmnj})B=YA rKd=aRfqOtHPzD?Y9#e` diff --git a/vllm/model_executor/models/__pycache__/internvl.cpython-310.pyc b/vllm/model_executor/models/__pycache__/internvl.cpython-310.pyc index c2207f618265e2760a9c55f93d1333e379317d1e..72b19060a55b48e391ea369b0537bcde41a9e897 100644 GIT binary patch delta 840 zcmZvY+fG_h5Qg_=Z%~nqctAuEJfNtEh$jS3;IXBxwzb-JdTwS=$(l+GO%FF*zzdl6 zvPty;dPSP_s&CMw*L{n=fa!8+6E9pVlllICCNnGRSNV6@IlnJuuC)P)<|($+;2d%$z)HFFEJDmFzMd%>&NF51}#KE)2v z!G7>7t`nWy1zj9~fYSA%n}ZPK5QMk~dX(27dbtn!6gx$^pTiL50T@t5qZs4}L=?Nk z5D&w!VoQv06rzgVVw7VLQ`{uRI1X{e9x=`dNGNU=6Fdo%l3TDK z)ZG}AI;iwIS+qv$d7EE@4GdvVRf8MYi+wWR#D2iK^YM$=WvK_;V?B)?)>Hr zzm|972u7+E)R!khjc-0PfaGbma@0CIS=hU71veShLoRBj%FFPl% zti9OiE^OspWt_rk*>?AuRWq2BtL~jYAaBE2Ov%3csAKwzj&l^c@~C-Ss5)T#+S(#6 z$=Ua& qZ)$%XQHQfbcbqwG=Gn){ryo|Rwq|XP)xZ2>KcYQ)U;8|lGXDX}sNIVI delta 830 zcmZvY+fGwa5Qg`mEmGK&Ln*Y-mNTU--R0a;pp=4$C@O-7@f2iMg}O$F;00IPqTf^oX!f*97yWPS6`pP7~U<@|K4Bg^t?e9nG+KKOoa#X=ftXh@w5 zFvtW`uji(8ksHo8!;VUIX@SMEE?dY4zALSj+Mr#rOLmYS{EFSOlL8P>?2%p64c&?x zWROA-q8{i``7PN?VF*(MA{2$F(i&wS^+Ug6uNx6gSIJia|`V zCC4ZZam6h%K}kp|_Q`QdK}vC}v?&c~#cgteCSj7f9XsR{O~W+Jzzog8tkV2)jxvy; zEM#@fVN<7^ryS&H0TyTx7HJ8V*cgC3cEK`sLji-Zf*~lbYuJOmRSkPZQ^kZ;&chht zJfiY7(JWTQTFD4%a2uo8SJhx0`*DEZJ2)sdaEN1=V}xUrBPN`?I3~PeqkcS6r@B?B{o}#qseQ?1U4H?|OV_gi diff --git a/vllm/model_executor/models/__pycache__/jais.cpython-310.pyc b/vllm/model_executor/models/__pycache__/jais.cpython-310.pyc index 68b8894907f4af533ebd3c790ef5a87afdfe321e..b727dd6d2c328df7690f033c33e2d7f2eab8a79f 100644 GIT binary patch delta 571 zcmYk$OKTHR6bEomCYfquq_%2C(&#kVQ#JxWPNpU^)QQjZ&rqMME{ihofFFMx zNNBXcpZ3gA#3R|?Bv>=b`ZaXt`GQeNFQBXd$sY_;>(#c#KaCYyT}E~t98^?wS@)wr zbW&H`z?MRwaTgo`O>hIOD5~3?sOH*{tO?tn7kiQ4RFu+UKkD0H6|8}C;Etl2ar|&m zMzy*(%is3hqma+%BnA96cZ`B~$KWrbCH^y1P?4TLFp3d7J+4=4)a^O38_z6(Q{Xgs zz*BjfZt;4)nZvK0ZD9~O(h2;i`)@u`I9`0H`lX((37_JHHLy7$zbm}XKF0o$qLkb` zdKN*OFAh)Z&s2F?+Zf6{ddEzypt_>br%Z;TwJS6mz$;Hl9sh3Dw)0xv)U hq`-afhAnf5T3j|SQ7e9HdI>#1-r{yD%ZJ7${{wi?lZ5~P delta 612 zcmY+=NoW&M7zc1)(j=NVAZ^o(O--VW%iuDKmmaMPU8F$^UZONi)6tHZyqUf?QDdvE z(74w1yLtB{9&|wP>cNwsErO7fN3ULr2u0stFL4e(KECDgXVy!195$sB*av;9TC*RwC$ z7t|F-;+d8XKlgl(FrVJ_%`ic^%r`bizcUkY2V0kEQZJ=^lqDePrCy9~jwZu3eV#2| zLGLO!peV-!n@dl$V;5b|3d9@+x4;m%2AbfyqP*3S71xqMMOeHhwxd6KouD zSOk+`Nm14u?l%HivFp?Hv45F)bT%6>P9L%-7!Q*JU)jzEmQN{+J~4uN6dVJ`0jEfA z&mh9L6K=gSYg;oSjlti;F;wH=Hl5B{Y=K_onpxy&Z}C0#e;tp@&Qvs7iV4n&M*}#bgpnA{!o?GC~4bt`cxR`zTdHhkyr^g z3O^ZpLhHMR*;5)C{E~l!elK_oA|M8q!E@SQ+`(EjRy@yI;frED66ff*NZ&j42Z)QB AQvd(} diff --git a/vllm/model_executor/models/__pycache__/jamba.cpython-310.pyc b/vllm/model_executor/models/__pycache__/jamba.cpython-310.pyc index 088a165ca87cdc7c5b4a67dcc2ec2abe7ebf979d..753a1d65b9a99f257bca00a105775d2c0c400212 100644 GIT binary patch delta 3032 zcma);Yj9IV6vy493AAaYG|*5aDAHE0(4@7L7OHKLLDH%`#YY6IeLWUwn*?UmQpGzbU4+)-fM`bMD!*XV0Fq zdp3s$*lPpK5icnzI#2xSUOf7$qu*Y+$eWBMyopGnCaLl+Em_kTOLfQUV!hsIq|=*7 zC%fZ%_K@9cV`lby$63bO>2yg0^JT}L|A&RGCj0p1?NQ;6#{?AScZ8AwBOXpBqA5d} z%C8eze_@iVx{-(*nrRDmr}VXa8D=aOFbjGjTCZ7PL^2wW(G%mR_pQd*Bw!^l2Ua#C z5sf7IQYfwg0?-x(<9agEm5QefehaiJa6N{`bgPD%OmcoDR29HYz|Fv9V3mMU$~z&4 zfiA#%9xW()eZnpwm)pwN1Zy!X__N4b#4KZ|#MxFL1V$^I>4`pABR1X$6aqc;ozu-i z^r!PD7Nnmh9Ch9S_3Z-JDRv%|A9QSDeHrvhF<%6Y^pqic`7Fn6`0fCf&=uv=>Sb`v z_|5=w7~XQOr1KCyn}E51k9L$VW??#0zMVxV;i_(kLoI!7fYb-bxc!js1X_TN0*Y-g zA9Tu9$9m`wS45HF$vyVKY&{^?laR~HmD99+QUgoV@k#3)Lt-Rfg>UI-(JPjG3eK%9 zw>!iE)*G?OGZi-~cVXlLK!!MKVEv>{zJ&GDmdP(vva6 zFWBdj;zD7fjLXNx+sQgbnV!Z%{c?I((?Wr8ocF3c#7m)<>0LuhrYNoXl3^{r1(1G` z19MzBtOufMTH}FWR5gr|J9}%2&z?JuWOF}QeIMp;1-1kC3MgZSAKD%CfxAkS>#RGt zNM^+bTL+NO&+xN~(NS|YKs%?lvH_7ZH~l#EQ0cI}Y|6fU;Q>~MeJK{RSWm?QYkLCS zni?{4JH7|rWhUK2GTA}*PU~j7>9=W1I=8{%@1)9&<#M?O19IEgu`)KdS$QgkMIrB# zJX-f-&WJ;D@Z#O2NToSe1Sf0GyXczfy-Oo7zZKr?d=KPxz=Oa;z$3uJ0!m44^+%zQ zRoM$kc8Z-s@>|!f?ctlrS=q;SP=(t~uT+Mw{ugVdAh)F_F?~cO|78N-0n44FRyjps zQ&lUvNGQa)tb_hCpdJ_t{NI|()&Khz?;>yYN+;T%V(}M>4yuU`8`t?(nmNHuuUGG$ zBo8x=wdsh)xq9vzZ6fuO-=_?#kURmd!4p91XLPX+Ix}MfTSEcGH8Fox{`Sca&{n0k zbVMmnDUtEWl394Jl!mC~!b^X>YSi3$k(pX-#KE6|{4C~MqngfNgj5tUBD#@O^`ORg zQQu7ORRgekN#NYG@Cp=ifmb07J`h5J+uV7OWqMhBnl^c@`Cj^UW*gf)Sh)6CtJ&Rj zaF(Y@_Ne?FEP#hX;J@p!pGs=l+5YSeH9BK^=wr`C4tZj6I{7p7vuAdr+}t621B@b||haX!k9@3)x zppgB}l%7ySA<+wa;z6}DAfNE3VR|9ZL7&xL%ns3ywN0LUrT@7gm!3yddu834(&4$! zeppw`*jD=TvfJ!O;Quf!t9MmC0C5H&BYj>-rqxKrcqMc)E6ZtH{haD|#J6~HWhBFW z!}L91C!MYLiPtlC>lV)5#g33UyP9J!|>Fr}_eu92!cz=d` z2o}TDwZPQ^gYTNZs5j1|p?3kDVzpZum%84CIl>j4LVA_m<|LhHT+KeA zs;0SRM~4i40_&66MAP-mqPNh=xju_tL1pvWYW85{O<*7Ft-1d878H*SQM?VswO2?_WBg#X3C^y(bXn+B&~&ejpm}lK-1B4v(Ql!vWC{bWf%z|6%6dq)hqH zN719LPiQ=8cxw4ZYHMD?GIW3Qid?onqwkybvd_h$rY)gzHO5;J%NKNPfirvic) z=$$L7ZSzQ*UMZ`&Jmc}t)D4cL4|$6C^! z_l4*$9*jAlt1<0a#=pXN6EGJzCh)062p>>)t1^EhbbSH}Gp(wg=HEgg&7~ygoEEy1 zVvd2hEv!`hljP7T%Xn}0bnA20HWRaI1Wfz2ad|!GL6ZjhfdK&Bm_G;L4ssd!H;_)# Ikp&z60)-FX(EtDd delta 3026 zcma)8X>e0j6!s=ffToo$G%ckmR-p7r+q9P2O=uZ~wj!IL15u2x=?l$}CgHw>wrT-%UG`dn4F4C|IL8 zWd|?lU|vlQ_*#Zs0uF2Hqd)V?UDspX4p>gL?vfgItqJQs0B=KEN);;)U|A1n0JPHW z?&ZRuGwypt7j@;A)<(c)oi~BH8Nhz819b~vAz+IF%`un_I+kB867*YsNMrXn#stKA z0Bnze&9miR+E!32dg&MEG&)_-=^EuHwM=hYIZ*_fZ6pmt_BrHH3Se_wpl7D9)o#Vk z3;?@1p>qSYu5hjxpj!%GnBJzut&D&k=ra7OS%RSrk~7&)OJ?lOXL7L;(WZ|0CEMui z3~g2~3=Qz{pkZ|SgHhR|%TAdEKBss+wH9g3BV~gvxgEfIkppXLFc|TN^*%%T17Y1X z$4B;ZQJZtHA^#|PsPrzJ-vPKAaHj%o(&)AYcPAb4%uyx#$`feitT@1R0Y>sOwqLP3 zVa~SEj^bvqP36o(-xeRt8WT%@^1#e}q8f2&HY+2N==N{i?C&!4PBRtp?azl99Sxs>#@OMBVuiGDp>A{F<$VU;?}wcXT~+j6X!pWg;ZLT zm2+Hkb;~cE)w8k-;vr~v%3YvifCm8&0UiN7tU$|5S$`A^uF7Mef`EG!`0SfDZkAig zHG7NLN!cC`Jv%$-{}*X3EfvyJI61D8|8hX?9I`R$!Zm=Gpzb-V#eMYNoWjfhZ?W0z ze_vsuxusX;lCq%Ld{gvz+)$%58j(BrQtvI@UBF$8ezsiUsMLqKa6%vRj)ns>Z`sM<>pjf7cKhN^0+ zvM#vb*Ci9C(W}H|l>*Hr_k(^G=j~x5B3}TN9x_7_Gp3f3hWHV{z4TR0 zTON;qdaM~5KqY9w{QI47%qphKYKzM?JL~dgh9a><+~1K11`TQQycpXD$El=tKpdw1 zwHFk!{r87;j~MuXeyBZK#!t*LY+nwzOu^ub=}Yg4%5bNjKbhL;vx}O)~y#O$Wz~t^UkQv6OjHe*;Rj)ux&a(M;qGkm)_V?u?st| z10ILGJvBMs0Au$k#+zU~K|PHfqK~Y`^Tb*@+c;C)Ni&*?#1^V=TA}#cn^rs7myhY| zrby1G>Wt-x=~C~O%{YH5sb9QGsB4j2P zOL+#%317L_X#T=2&etIGIhDH#==4Ip@?Ev`Wf;9NL&i;iMDI496Y_J&jFjZ4TAs8i z)_Zhav$hDIPyBJE3CpfW`sA0x;!JU$oL0OO>Wm5BZ6Zs3UrO+_RdRFkWb^a(#b4l5 qg#ydDEXvoj5u9GY0Dz|wMznkmfIBGJdkYkl$$HW+&ZSQ-3H}Y^tkiJ; diff --git a/vllm/model_executor/models/__pycache__/llama.cpython-310.pyc b/vllm/model_executor/models/__pycache__/llama.cpython-310.pyc index 09e72b56f012a9247bacdc5fdecd82da5be91166..c2c4cd69e6fb95f3e5b213bde99a7318b07877f7 100644 GIT binary patch delta 1167 zcmaKqTS(JU9LGCT{|-09OsD8(DRcQ(x2f}z(2WYM9z-cBOtIDeY>VAI`PTL`JS2J_n^if zA0M}XeG2c4-_yjXjg?l}8?Xl40kdqUPDwVGdH1@!h2AEs$GyuMXqH`mpR!z?rzK&< zkrby&IKn2=HpEfHA!yYtA?-?^Ze=v-f=_8X$thTwp24iTbS=@G#!xciFa-4#rV}X3 z5M2zlaUMUlH|+E8w(p`mx*mtR;j=zKI-uHMi|=KIsG{r8?|^Q@9^p93W2ZBw4zx$c zd}weTM;D>)LG&|(W2oKdl;{OCE+Q@=&LK>QJ_b=cyE+%cx84AlvTDd6?9bYew1xR9F-rNE)kw&B z*kH^|=EuTfYSkMZl23Na&9n_#jb-F6j2eHCei+JLCJf;g!;rDaKsw=Pc0K7-wwqKc z(hECsiZyssbc_Qo_#L%Mk`W=$T!v9V%QtLli7iM|s zhfu9S9EBsIiClu)qDzN2SVgy@U56+^oPgZinfUpx#VC3bit<(!bEgv%Ap|drmvM&u ztX;g<7qB}Vk|XjU8iMW?i2_{D%TMKh>nw&evRi6slH5+09HhN4oo6FgK%bu`@U@@8 ziu|_Z4qW`-CgDT=>dX)u5o7<;H`vVAQl8^{+)|8=M0xoy;H$Zwyo61b^2CY1247aT`L`MhhO9Vr}dS_!AyrIxKknc85f11&&T4DiK4_P_T*>UTrYI zSb^RYLUWj5?)~3IgHPh%lZN3}LFw$4N_k-o5#D0z9ds9^kV&{vKzq6T8=){VoB#j- delta 1239 zcmaKrSxggA6o$Pc3{6`ME`Y%ngkZx6v}g;27d7t26^&b?sRNzR(K;=62DQ8>E}#e! zJu2=Rf|_U|k^$UTP-CKTc`&9%AAIo5H;pEk=smZhh6kJU%b9ckd(WA3|M{v9>b6K~ zs&xeW#rk%1+mbB>3q5r@^@JnUa@Z4At31(|5sGMD_mmQkt{O^lRIc76*C@K_vlQBi z-`p_HDx~dZ2haw@9>h+l&&VN-urw#r?9Ol{krsHHwSgRfiV4}I(OfgZPHYEJn2y*5 z5yxEDehkYIEew8ZI6~#X7S=`;<)CTVyQPKp9oZi%SmXHKG3-e9T;@l|i!*DPB zaK7H&m{`;>!(%HQjqzc`S%!Erm9-j$9>>H9#7V?agbQ(+L9+io9uu1p=MYguq8LVh zio}T;PY%m5g_?_VRuiH2ka=O^Ml$9+s`43z&g+D{yh?H&jJ)|7t61Jb>=rw*5P|(g zBK#DR%$Iq!r2H6eoWtO^ZjJ<%aKMN~mAF;aRZTZ!ty)PmjrZrbEC?!^p&BvT0Ne7* zNf%tr|4z=rXP+}I3C~GETtS$SHQGs<;mf4;q}g2V5(Lr?D+_!!94WoY0f!4#h_^7j z4WA2UF6+gx4{;4~9dU!9-p)I7^VilB9vG$#p_V&jCq^?6dtkfdA}8U36w1I!FQGUG zx(-o_*bn)W2UGu;LK;b1p{Q`0k7t@uaSy>Sm0udLNB`J5Eh-0tN-*J^fUedn^bnjW zEE>;W>j;W$hN=X%Dr!y0&}ln-EcA+JSY8t0oFiT21@6PaQJJu~Xj6I>w6h0?jW`V=vb>tJokH0FUtPABx1I9z;KCR-W$V!BYp zH*xSyCVVR?`(4uXPN^i>&rtQ8!Ji@E=uk|nzz)k1H+39 zLt{yFkJ%R>dvk4n`+H)xddmrU1@_GG@ZL97dW5QM#AC!?$1cOigl#c;!oAxAt4g~` W4_L~&$SL!BS-&81PxL@Th4BmK2uA$? diff --git a/vllm/model_executor/models/__pycache__/llama_embedding.cpython-310.pyc b/vllm/model_executor/models/__pycache__/llama_embedding.cpython-310.pyc index be7ed35146e88fdbae97ff5629bcd1f0178c358f..6ddb6544da9489e3f89f5f58ecab1d7ac4678ebe 100644 GIT binary patch delta 61 zcmaDa@>+yDpO=@50SFA&?%T+HmPI8{za+OnzaX*D$wSKPNLu Pzo4=tBR_8wYd$LgTJIEn delta 66 zcmaDY@?L~HpO=@50SGF$HEiTQ%c2pgUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*54@*8P0LPpbjQ{`u diff --git a/vllm/model_executor/models/__pycache__/llava.cpython-310.pyc b/vllm/model_executor/models/__pycache__/llava.cpython-310.pyc index b0e994db0ec36b92c8078056ef7cd6e6a1c48eb7..b0a04c7afe3695c839c250f36d7753ba7c34f57f 100644 GIT binary patch delta 62 zcmZ1)voMA`pO=@50SFA&?%T*M%%EFQ_cZ$j>v@Gc?dI W&MZmQEl5nxPE1cN-kis-WCH-XEESFb diff --git a/vllm/model_executor/models/__pycache__/llava_next_video.cpython-310.pyc b/vllm/model_executor/models/__pycache__/llava_next_video.cpython-310.pyc index ba9e031efabf9a11cc232bbf8dae7a549697a5f7..e747e9932043778f683ab38b873e4899b85f38a8 100644 GIT binary patch delta 62 zcmdmzwjqr>pO=@50SFA&?%T+1z@`$UUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrb8FkHKDBeyPxN}zs8Zh?M5W`S-=Vo`c(iLQBWX-2MLZn=I= jW|DqEWl2VU-sS`jUojpLpe`;Z0Y(l+7RJrHb8sNB}Dkz1ETBUHb%xJW-IKRGc+KPNLuzo4=tBR|hr&(J`> pII|>Gw;(Y&J25@AcykPguNa>gP$w6Y03#bC(|;DG&0FPSEC7?_88H9= diff --git a/vllm/model_executor/models/__pycache__/mamba.cpython-310.pyc b/vllm/model_executor/models/__pycache__/mamba.cpython-310.pyc index 32a49815558c15fe54e0f2b03f3d07e6bf76c476..3cba92ac9fe6e4ec0254a95a9e2054ec0503bfe1 100644 GIT binary patch delta 791 zcmZ{hO>7cT6otJEph7W%g|=u3rGQM85Hv<{qpsB2xapz^rXoKRA%y`SgDw35t^b

of|XV>&m!xQ=L0R(v7qDa?d;Go%d$uWAa_noVQp^+terg zYJJW8+2B1Ll5&MmAyWuSadugdf=6?ubS|754`nlnP@ycP^P;?I=rDKI)LjmP4LZ3F z(El-UCeUq1xAnMQ9YDTh9W{U=uRDscds0oZal#Z~0#9|@VOk#PZg5b>Uwb`Jm2LY5 zp?aU}DB%KOn!pnVRPY8iOY;pC3YQf`cAMlKvUaf%n(q;`k_R+tCGGvKVy*M8>MDk8 zyezP&HCbXz5T#hLh#S4%pn`8*XQ3i*y5<4qaLzsG){aGLB%EhQXp{(9LKT0ze?k?1 z^c{@UX`!M**^!7R#}au_VAoX{-BS_^@l;Ak#jfU)@kFecnH1PHO1Ii^$TMWDlCERZ zlQM646}0q!H7>TS@BMzec9V0YBLwX>H?hwf_CHcJZ~FhYctZIZobZ0p`V<$w_qj0b z>$1;~bEu8OG%aJ@cMBHL=?~eTwk<8B`Azwve<#2aruR3x8Wf7Apcc@+v=;W?(shngJwCl~OkhnzW6P93 zLue9=ge8K9@QmOjJST7}6s{;S_GY1{7iwq>PC-qc4Zh@H4TE8~k^UL0;c!^|3(ro+ AXaE2J delta 763 zcmZXROH30{6ox$=W~@^np`lZ(R%>ZXrvZnGMj;__;XgBL=MouXU2L=|5BQ&o zXopsz5gImR!3vfQixpiheUe#PjMFV6A`Ba=N(KTso@SQ_6NJkg>Q;7&>S4keLf$yp zRu~}ixrT2ubeph1qnlxXtzqSWl=E@P$y##ah z8@#G2IM<=zexDL}$fYX(cRq@n_xPBq0;YXmU>^JZeU1V(_HCkvszto(pXR%h+q| ecDSL0zdQ3#GA6oK1bBn~ut%atVkL}(lYaoLyS%9Y diff --git a/vllm/model_executor/models/__pycache__/mamba_cache.cpython-310.pyc b/vllm/model_executor/models/__pycache__/mamba_cache.cpython-310.pyc index 9ea4aa7af15078a2d794f9a1e3c2a860cdc3755d..b677ee78a04487ef883fe39df188b49d81ace660 100644 GIT binary patch delta 84 zcmca;bJ~VGpO=@50SFA&?%T-i#H`}0Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS kUr|63b@?04&iK{r~^~ delta 90 zcmX?YbJ2!7pO=@50SGF$HEiT|V%7-MFD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` rN!2Y#OwLYBPc7bD$Q&&!qy*H-!6LxO!N|kN#>n)aiFxxKv3zy_%I+Bq diff --git a/vllm/model_executor/models/__pycache__/medusa.cpython-310.pyc b/vllm/model_executor/models/__pycache__/medusa.cpython-310.pyc index 1576df2c2229a57a4a4167692084380914410430..ab11d57f9adfee01df7f7bc66cb1c3a8e5084e08 100644 GIT binary patch delta 98 zcmeA%>@eic=jG*M00P6c`!;f)W>WFcFUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E yFQ_cZ$j{sSkLjI|oERe)69*F;BNHRbe;y_-CJ9CsCKe!@4~SV9H*<+KF#!OT)f#gE delta 102 zcmeA$>@nod=jG*M0D{VG4I8;nGimtfmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} zr0NzVCTAz6rxtJi#q>@{PK1%^KNm9x6B{EFBg=mtCN3rkMiwR(Ae)1c@Bd~tu_h(} DCsQ1L diff --git a/vllm/model_executor/models/__pycache__/minicpm.cpython-310.pyc b/vllm/model_executor/models/__pycache__/minicpm.cpython-310.pyc index f028c817c676d8c745ece04f180ca1c6b2d94d5f..66950512f804088cafa5ce815c13d8fe3d8497b1 100644 GIT binary patch delta 904 zcmaKpOH30{6ox%5Obcy;BE|$LL~Nm@9hwRSi5g=fC<~(`E(|Q7Mjnl{)aejFjTl_v ztLOnl@DZg|P*7offe0qLaH%U3bnniUD<#qUPh&!iagzD+=Rf~Fx#!#mYC^Si+H9HY z#OI$`nziI-IO=?AIO>arqOuxP+FDe(D%{l`_J_ND9igMXXs_Dd8PN`AEN`F{Ei3OQ z(EwZQjdYPulx@^b+Fc}_7u}Q#JXsJZz65z$z%40zpu2$sKo8Ih#KqCgT5e&sk>V^D zO^A*ki)y7|)JE98^%n^`BDPz?aHlIC_*Z$<;c<*Wo&zF41+W*m4b%YR{MFGzW8Cb_ zql9+a*+6}9;kyl~Tj)Ad$r4tBEfi~N4Jk3TNeM=dD@oz4qzl>BqTE5NyTAmJR*~!o z{s}ta-w<$HQbQ(S=#$=q(ucecH3>-i_;GG5QE7-jlg<x+v^))l7oI%v6#GoGmeQS)z zFwUloX6PpXtubbK)gP0VU@vQ3+pI)W++SWyPkE|brq}$bd?fdnsG3PKo71FKtI0}c zGKgQ$s0~z@NUY{cz+3nVJqmzDAPq19jlg^U60p-W{|KD2O$)=lPdNgAQ0uSUX_WLA KnC5rYt-k?+-sx!o delta 868 zcmaixOH30{6ox%*nHEbE@R7=^AQtG*mZ28#fyR&sE=&!sG~mM001`=oX^jvKlHfuF zYvfcEd_-&!11gqLL`87t23IC7biu-%YZfM&)cb=PVoaQ5zI*bWN9LZ1hbP14c8g`> z2Jv*y_9o0ZsSclVCZsBD?E!zA($?CjbaaPLwFkYWo-!rW8g6oT_yec?ElnZqaOz?P z)obSL??ji_nA<=DS|GQIq<%3?z07f2g*1rp3NPF8D5528vYsL=7sN#U`+{02itKgH z+>sjc5^Qz3#he;fE#2lpSC%N5aDCp3b;*)Cgv!6?!94>8fP;Uqy0jUdckkNz z&)c%8^gt0BW#fN#;^U;v$`?!fbDm@REPxBjhPB4kbxtU|i_DwI= zRUxI$X&;r{r0bmIbWa_QM$gfjN67S`RIi2*KL#$W6Hg#|*ThN0(*Ug#Px+fCB)x%N z&^mXf5k2G{ZxLxc?sd~VfA9|HG>fc>B$LS?{YW#Wk%@HTl}MM=8MMA~Bhd^GRJih9 uVTuiS4Hy6;&;Y#S>AYN;;+2YXmMJ0RL+Ww(tJ?X>eR^s2A5HPXp5~wJec-nM diff --git a/vllm/model_executor/models/__pycache__/minicpm3.cpython-310.pyc b/vllm/model_executor/models/__pycache__/minicpm3.cpython-310.pyc index 24638a6ef231c6862933fa6517d0d8532d62c1d8..9afdf527cf85ea66cb6d900a701ca95818f5052d 100644 GIT binary patch delta 1188 zcmZuw%}*0S9CawIg|d9p(n4uWkXQ(|ARi)9r3h9DF(DWf!FDN2yRiLW`XyeF7!RI2 z{1Q*zG%+5Gn!V`7KV;*bi-`w4ka%(5)VP(fhc|EDyx+{^{dSHczap-jBsHEfzmfM} zKe-YPX6TyZ3+ulfDrWMbyqX^_$~>hMhbJ?obY>(|32EwPD8FA!=d!fqyuiYG+4LeR}4G%NMi@ffX171u0G0;2Ry`Z*oOe9;8Mv7%%PInG^BR-s7o zcv6!Kg`}cs@p!dLlwN}+syDX0W{wbenDo}`{SnYUKoBqp5Z3B>n1*#vTQg&0G|--H z75>@_y=mX+pM&iNU>>kwg5l&!LES3J8ovoGMxz}shE6g5T{b;IJKu&?0i@`A$9aYr zx&u29s=I*IoQ~-#-RiuPxCeS4um)%VGy&QHA~6*VvGIohky$<1Spd@Gae%ddH8W@l zI_{ij2|8@))R()4*r05xLB89jbws#RyHQLbT=ohrEst3eJ-MVCBac7W)T)u3v^SkS1xXO3xT z5Uuy@`6eOaX^MBqr@-*G_!Bznc^1|{MW?La{?OD6dnUJ~XgrN|>zpXP>W#T-E=@mr p$9zx!H(8fCpc%iP9nb^+xMLHhMg67!kOdOp;^>3ZN@*ex{R06B_Lcwu delta 1250 zcmZ9L%TE(g7{wi1Dzy}O$)kV-gM?!2@Ro<-l!p(D=z@UYV;IVX4jrcDn-)?RfF`U> zxEq%ytV~RdX=36(;o8iWjfqQHn7HwtJ4p-7;y2$t-@SKc&bf0k{&zf-4u>ya5Lf=& z{@2iQKv^nSf$vJ!teSI3wbBX0QY~{u&E&JmwA~-;?NJ>w%Wh?iM9Nra4u4eMrKkle z|L1GGBerpU2_s8=r~*68Tu)|ch#yqMdIp3EiZDAqzL3XP-1udZ-DN;{2$7 zF1#s9@wpKw3GQ#`^i0P(k_$@CYtU>U&Sx8*RKr*|nA+A8Mk2`^nl5~9c&rRaf8a{= zV#ya#m-Kof?2-Z2fKh(4sk2=k8lPe3>4gxNf@?W(N-Q(QT)&mJ*F{Ry6yMuIuflY6 zagee)8Fq>qAo=YyZOX)=mEJkcVr!Xx4i$o@ZD0qO14_9S-_BJ`x6Cr~j81v&Whqva z^S;Q+=!U4GRdg=am)KEeD}yTq?4aRg%YQ@~BQi}5VhQpIsl(<;CB>(j4pfK1Se)Em|$1yFJlFfA!CN*VlT|zCGQdGS#A6jW{KanMk(k zCnqab4Ts{8s##A{(#UMq)8%iRo?&DvnbK#|(~K-7OUfJcjfPWkN;zK7Hgc34DJST; zMxK%<JtTZ#zD$RJK-eR;Wt1t7tJ^+dRc6!%%}JIN&7*EdHw#v^QEej6EaDf;>JD`$X6)RAww9^$cVNH|2Tw6H9sQH*WPR++-%}=n{ zzY>Z(Yx$kE++7zomg|=N%QayyU(~`iJB$^dQEwcr)BSUG%g4gLU?B3t_+B%Mio~RM z*|7L)(%0Dm@qBWl_m0_dVSy(U#7F}i_kA)l98`^1rSe~ug?fEbJu zHP3})iu|y6FTK#V0*5B@Ga}3*ewtCjbn%CbGS@WB9f*%ZA|b`rtsU{tYaDs=PJqnf ze$kd$kaQ5bT#_NNkU8lXLPN`Z_zvC#&xH6%=AYRk;-##{q=#UT)<;E$GehKVY-gVl z%Er6%Rr37Slt8eDq_bu|hfoIaimln1BHme&OuXtm$eyCO zUA8l5^0)|QXT^V>M3hU`J)N`J_7$jK5}(X@BL6cG?F3Ov zKs)NPahdCvV)1RcQ|vkM*<7viX&7X)=SXsGh=s{+zXsP@gVMY)_IzX|?>w_T4D++1 zr(nYN4-mcLOhHBAvk<>Y;4(*3{f2i@^DOh=ycP-tIakG71%I@jBCi<9%@Xex4lpiu z7j>-4B)^YVEH?0UI-Vmdl{8bxMuN?h$ZQ|DEc`p9@NWaYLEv&mEwl~zNf@32$aJe9 zJqmaPumz9^z(PlDsx}`~wWyhh@_te3I0zTDs{Z+~TrU1aL>>d&DLqR;e;{hp0%*jY zWOAj&a{W4DkVb5LIpDXTep`5o``CBI)5Yb^dttz=D0%q=UVuRrSBf8CKaK=T9E?3I z?kW9&{j2MNW`0Txmu0ha!dJG`D(8kNMB@y~K$mlhCXcNI!hS>R;hfetHU-@u3P%$s zy!y(T`6ZE3Ug?md_M>;%)eEA#e8qZ!bdi#j8@X71pP4-tnc1|NwI45K)1x5~r*MVzb3W2eNWsv=sM_p99f99`8CxH9-J z=qH*SD^cO#AuSN%0&Y3*zd`B%d>Swd=mW?J`^3Z5h4z<7kH&?<-uXlPxOkyDKm7<< zXg|pO-$wMWBfqKs9@{53au5b2;EG=>EJuAB*J5=Heet7!Spvo8lifxWRsx~JE1Gs( zb0w{HEAGm2MiT2@v-G`-a6HFYqOvBv0`*mZ%vPpoIqqNPJ+S>dfy;42e*Z}Z@zwgW z$Uwt+wklJ84}pIM`~~n|1d81sSY8RQ)$SK9Fk)f5%hC;Fuo!5)^0~O#=;CZU0Y3jqc}O8!7hmlt&O%( zSbrr_cNgS;IEs>%J+1}NDVuniVjnb9e1Xt*D39`C$!}gjO+H;A$7OC#o${aUWCGpNw zzWBS&nhw;!vz8l5oeIO+{pRLY==LM!>yMqA*o1g_C|@*pm6XNEfxwpusFtQvlC%vf zVJZXUNqW2yd9>?JMrUJ6Pcu6t26}eURp3NVWs-ala-uKe(IsLHzClkTv{}5;Q({eI z$xOW0vx&VeihFBg`^GHC;=jXyYftiRNsi;aUDp_hjdrnjd86dp7)2@xi`=hzLjL0# z9~TGvYIoFOIrEUBJUp$2H|&dALx*`dR$I@I>+Bj0W3)x=6-ltm;`P3MRv0Pjx3k<| z!ma`2S#%f@N-S>_y#tMXe}E{*3uD7GWAj$SKJH;|sZQ48G@=@$5d zfzCvF4>bJ>t5Ygc+&R`{tWJ%4DIRugG4XkK0lO-`+rDvD5xH+)A1kqi1%7(5 zUgvu$+OP3lIEO#hhGX=sjn~1B&866n_(T3+z%w5VEch3BJvEMQSi68JHr;znyN4iQV15R$Lq7P+;?hVrD-=cj zSz^cNV2LCKC~~a~e3*W`O|~kEd~@_?%zh8z=o*La?v-2NoOot@sxkya7%)fhTMH!2 zo-Y%)oLmm_rl{IqygCcB+$1-@8o?oxmsGq9>fL}re4e(sJpg*o;;9~gvE)~+-qAW zdZ2~2&c=z8MSpYa#P*7KB_U(y|8k$Si?qq3=62fQ9r=-`CJWgX`jB$Nmf#&w>4VCx z*#6E`!Ppwx>3PYABKIsv&o={ZuIx0)hiD17i=4+Z2mJwm*T~?+HcwNn$3se(Ua3*{ zZ^8QttdHbt)Wrl(Tu;x|fR`aT&*L(oAZ88x`Z&Fb4e#~efO4g*F2WALS(qv-QUh`tM%j_(w! zGv%WAVDajQ3Cs7R#X4d6BB|@F#q18iKLMD9`hTYH+)ezI=L2}=N?p6iV3=F*mro*z zDZn&90o(?-fzxOk+qPFl<4kak%QL2qHDX2gHYR8^Lc+f~3@ z5Z?;e4VXnEFJKNZFZOr}{y+DCDqiv&PFInOMZUnrO1Bnq&(5(dS=wGlUN=;2an9Ri z4rB`3-2PnLZun;bj{|V~iFNQf`T~(H9+)e${UdBo$h*fm675z}e&@61d{&%ZeWQ$T!3nfFwZN7XcCnaS?1Di^a|WSYT!s>|OBCVW^6X zi%Chc>6UCKlq@oeY|~DnlsC34ODfTh%1I;_ODfWqvyyDmky26U#EMm=SdJ~`|34rA zkx;oRWw7}6_rLmg&;P%B=I7VgFRn3X!0C*!!QZLxJUCl>&bd8R(U@j8?52Y|mRx)gStjDGmYb9rFT8X~#w4IN`xKt~HaT$#d zz_?sO-eDa365@YWsk@Pxrxk=3v~f4ZwIn_vr(t9ef@*gW3>qhL$;oKBv#? zhPMB4J2xBjwhMlJ<|2dNfIbPo`4<*+jed{m`b7rj!`cX#k67lXne~s0@ZZ^QI?4yC z7lWeO2zWh4wc(qpUN{w+4ft!TYPMDfeIdPa!Q-9x%;>@JOHthl<5G?NfDOps#y-nN z<+tMMG6$hd#Sp@Ngkgjcgi*^5|?0V51@wNpRt^Xjx9(T-9I@2qS{ z$%#FT<4%NrIhArCp&t$H-q1-=kIXUo&nX|V&&hw-R2Ta&GKhOl+Ea(wqjEg;Gud9? zzGsUDXa(w$B0Q+Z5GLjOsSU~F$Yx@mq!FcRt1x9#+UMD0@=Dqf_B80E$kz0dq6=v9 zB>z)IVqpWDam~X$?pO{$nicC64kvR0$x2B3<%+s*K$E3BT$?bNS#CY z9KvRV7zEt$h^pz{fTl+jq05i*;zuwQBM!~y4beV{r%>}G!o4J!3;6sIRrjNjNCTED z(TepusDoix^V5Xi!{PJtP<{`4Q9hMloOT8oxGD&qw*EO}c;(OXA7ZbD=L-@Tdqmz} z_=D2FT~SoTd7!!7XU>qN1=glWt!QpHEf-f6*tk~%A)#A@8?6EK}D`zcKz4(M9 z4)3DoaVe{n2oLQI5V*3$0rWM2@EF365$Jh%<@d`w)fpTQ$yir5ds3FW9;m1KURC`G z%Fz{%UGNBx>9#rvRpM$!OvpD~el`~F+nmIhUmmG&v!BWrE3zP?{-q+1U6vnJ^z|P@ zS5*M6Wbr2aMB=QD77EPk{-F2*ifQ71LkgRMkOU+dV5575cR zCF!*K4gHcQYN@dC| z#UUSS_Hw)8aiu|x8&8&6hYte03Mc_0w#H5Uxs)cqk{qsqLrygo|8pP=Cz zbkIiR^zP2$G>i$Y1zdz}ViN*Yz-k%1C9mwRQ-@IJ=Q6q}C;O8&uvAK)Wd%6HW3Gel z!wTqUOLr45xI=$Ao^EuQgY)%CcXzt{b<-v_3x@ZW${UTTvZ%Q_?G8i5nrIJ&e^Wlt z+{hB;bIm#1KdA=?AO)1T&RXJu_qY{VOiLXbm#r3lZXx6%*wFO`q%I=ByM;{@BL#03Hn9~#MU`1S$ds^RCu2HuPH?(E51bUP|MuX+&Io;mdhAs1weNAWd zB4hdXbf*Q{-qr2iZ!cqGGQFc|hvgQPt^h#W#l3{0DMeNh0=z1%4HqL7k?=zu_c1tW zqq-W{ob2e@1viWbx=Lf|acn`0EBNeUa67&WPa(KjzS>owLXO{xQ{?+yWh%A|uOeSM zm?pP(Cs`$^P!QrjKm;L>uXiA0#&4(O^WA4sDf#w;29KT*KFuBU-K&dXIo4CPqYCHE z0+DqZJ4{b#HsS~#6CtZFUjWhV8nJR1b#G9TU6)sS_OP6A+8!s%d>i>10-aDN2ky*PSez`i7Fw@OD8`l-=QiZEBWy##YIdv0qZBVd z0pL7WjxOO7fK8|f(FidBQ1sY> zMHJFe+&=BCLD`3BZpCYB4UW?*xB38=c10Wk?G z0^aa#aH*v%T(79wL4J2-JuzTaR`wR*LIwCHuu@Ki=yu(5lFq^Vn~#C`k}9fE3n%2x zjOI_##fpk^78TaK z{o$|;fztVYq#i){3<6a$PA~35IF3LGdlD&1XDn_!wdLzal2vOO`NC*REM7XSlgtYF zrpz4kQMF~u3uB3SxE0o(tzT@fjWt5C#f_i)^kTcCx@Z+td;iZmYi2eZgIx^bMK8*x zDvGKwMP?tEV$D!&DPeh_j4i>}qctTaT5$+pk=7{`@Z!bu@b(|l*azrAEf)|xR}Zk> zqyB((B+3x(JcdB!5ik?wEE6sRDg8dbuVbixe4D$z%I$_h$nA!A;`EN}y1Q$s1dP|O zB@lcWy;jJ-I#^o_pTFR(4*@=YLDxp;KwARpfp5wGJy_SXav*rYc;(LlR22Lt?LBDR zivSaL3ybNKy0O@S#aHUwlP>iB{4B?McHQ9HR4IPI!U?x|*RW?1V^Ni!P2M{I@ z4kB=bHRXgcuGcMY%8H`_sIc=#b1Dy^&0z$39P5@CNZ-LtIwIdaS^>3|=-!mzMw3Yd z55knp*K+1Q^|bqA7ob*-LAmCE0FMl-!= z@kN9$A*?!hV)L(Y1L=h16+e>yG&Pq;_mn45d;#Gi0y%yP zslSx_y{Q#HK=O3}R}_4cGJ^fdCm tj_^%{FaoXZ+ep2NP>9a2B1M;)Ye?bMLttMN_*BHKtoF@AT<3i+{~uwM%vS&a diff --git a/vllm/model_executor/models/__pycache__/mixtral.cpython-310.pyc b/vllm/model_executor/models/__pycache__/mixtral.cpython-310.pyc index ddfa63fc3bf557d655acb00b2715a0034d18b15c..ee61e0b53deb7ee6642bfca5c497a314f8526e9c 100644 GIT binary patch delta 854 zcmaiw%WD%+6vjQ1=0VexLX$owO`5c6npA6y2tf@9ih>oSU@0h-n3~Y0bSC3%+B~Xg zv_86MwH`(L&=way7A|Dm2vS_Q(zQan5ERj+|A3(Lr7d(L&V}DS^WE>9d+vEZ@Or?W zbvUYb7+>_|>MQ$CYv6b!r)Uu^qjl$!Vkn*Kjw$2AN>s^5Ml*vEt(Y6ms=928*lAtw zseem!n60jZwpwx;tD5v)SDfU6QBX_(0#Jc5K;x$kt(H8(0+&6F`nQH@Q{6@UXMi}6 z=Sg{$F7N^OF)DG{Ez>1^$=y#5< zgK`r%3)}({z%;OVq40dABKLVuP*Gp;ju4gE?mOy3c`>(zlVTWQ9}odbtoha)C4^A} zVUw8Tet)R0q7)(D2d?m}znL!cbN?;GPeIrEYBf_ENvNjyML=p$UUky@F-0zDg6HZyG{e!ZahlPeb;V4UBJ>&l-hJ*bNomQ5 delta 909 zcmaKq-Afc<6vjL6?5@jxi0Q7V>#FPLj%1@27$gKiQdUqmLW{AD?yAGCJL9|V>TZ$S zcNbdbk^IQC%jhm9gdjqpJE1O$An&?}{)xWcGi%XBGy}i$@XYg`Ift1SgKq}iy4UO4 zC$8LP;ko;3N%*XiNpmHs535NfsSPPcZgNad9Xi<6sid{Zc!!}5C)Ck++N^XcZitwD z6|VqJqU1kX>H+q%oUtF}68rA5nSK6VsF@P2d4@1S7$jIy$29 z^kkH)sRSIMJ`2n{FP1T=u?S=o+iz%ROYH%|NiIWKNk`S5+C z9HRbm$$vJ(VAEpVGNl-QD2g?{Y%89yR$jq(O;K1yrMbJ>3IboE{9b024y|Cm`5Yv0 zr+J4>Y~gZCmP%Qx-ZMv!hbS-c3#9K6hW|3|lMy34AS@6NH(Osq3XQhIwHssv2}we& zfLvOfFM(Tasla35?Ai^LtK*!)yCvhQVQ8sQzK*BDEs#e&+;rR_ep<#{jDeFmzymf> zJ>Uc;G`T(~CY++$gj>8F-)wfDRD6PO!^dD5OXZLCk7$xA!Ww}Q?1X;8Q=BUc!Yqc` UGcao|wf9I4>toO2hmK3X0B#}Mc>n+a diff --git a/vllm/model_executor/models/__pycache__/mixtral_quant.cpython-310.pyc b/vllm/model_executor/models/__pycache__/mixtral_quant.cpython-310.pyc index f1fc24ff12ff9e81010152202be156c6e3f395dd..eaf2ba1d3b660d36160477239f340530cd13d609 100644 GIT binary patch delta 608 zcmajb%TE(g6bE3=SO#P$DFoA2sY6QXFg8t7BN8^UFp>}!xPzFGW)NZvopv$|0n}Ph z!$VLA2f{-wCK`7v$n1pp7q|g-tl7(&jozPN!otM6_;Pa|_nw@?z8`%`-s`O@6DPUz zeOC#{k)DKOS_vy-#T~Tu2lV!-K$D#H66Ph z{xkAD6R+44;5nG&uAoW<-mdYxQ^944rn$CZ*!K##F>n_Yc%fmDo^l}6sZ1kq8@zTi zp-%D^#9f#E7Vh7?-aCuzLof&C!5hJ&>da^=Ym7Q6+sKXBA;cF1x?(4Be+#nU9ms(t za4|$&wP=by7teHxxT3*x+)syR zsWFHzIQgO@dRP%8PBwRAD_a zsMXLo4(|K;#30RL-cqy2h2nN*^f(|>#-L&_Bok zs-)~H3U3<&G|k_QsrEI@w1Rb@fB<*~-thTog6jOb$ENyw^P8gLGDMw!q=$b4SzDVf diff --git a/vllm/model_executor/models/__pycache__/mllama.cpython-310.pyc b/vllm/model_executor/models/__pycache__/mllama.cpython-310.pyc index f41d4304bd719a2842e96b4b588d1b0804ee3896..873863138fdc744ebc16367ba4a3c2aa3b89133d 100644 GIT binary patch delta 118 zcmbRLka7A$M(%uGUM>b8FkHKDBlmxH6%YNA+yecA%mUq##G>@n5?%A$(u`cg+;aV# z%q0DS%94!yyv;@&kt`B^KwW%HJd8YyT+B?2EdRNf1b{parp-%vG9$TyfU;a1T#Ouy So2AkW8JY3~Hv6UraRLDOn;qu> delta 126 zcmbRKka7M)M(%uGUM>b8sNB}Dk^4WphL3(}aglybesW@teokhRenDkPMt+{Lo}qz$ zab`)XZb4#lc4B&J@n$`aNEWF8piVv}9!4HUE@mc1mj7H#0!&*D$wSKPNLu zzo4=tBR_958|!Q?wKAYCE=CS86kudwWckm*%)!LL$i~FN#Kg$ rlB!#fn4F!Mo?5(_iFGy?W5wio{IXn3|5^SsF|qt(V%~h1Uzi;L_3a#D diff --git a/vllm/model_executor/models/__pycache__/module_mapping.cpython-310.pyc b/vllm/model_executor/models/__pycache__/module_mapping.cpython-310.pyc index bf4fb66e97a2de5ce11d89f5ace6f592e14f6f3c..bb01564ad0f845bcd738ca664b54f44316a75c51 100644 GIT binary patch delta 62 zcmey#_mz)3pO=@50SFA&?%T+Hn@J@=za+OnzaX*D$wSKPNLu Qzo4=tBR_95A9FSf0CN5mm;e9( delta 66 zcmey$_mhu1pO=@50SGF$HEiU*&7={cUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(_i#eMG0LSqar~m)} diff --git a/vllm/model_executor/models/__pycache__/molmo.cpython-310.pyc b/vllm/model_executor/models/__pycache__/molmo.cpython-310.pyc index 6619cafec69bf2a53cb64d59622a16a88f7144d0..e5dbd8beb2abe07de5ac9910c592d8ceeb7a8810 100644 GIT binary patch delta 4535 zcmZ`+3viUx72dnAWJ3aZ@C<<@kO04sgbg7Hc@hE%2@nVg0d4}zlKbywlmG56cb6mt zbkWf9(PrCm?!qlo%EmIfkqdq8Obri)~8QcC9MMq^SKG3#meUzSaH#{b_F#G-I ze)rsS&OP^a^5$pc?axSBC@n3;0{`3(J>56wU|MCdjaiu0uyZ@L6AQ>T!@-@@sbss6 z#FJ?T*nvEg?tfR#EWPVFQ&!3gqEnjNycLCrfyzJOZgJIL~-dx8DC15DmlX_=M}Vq zSJFz=&NPCJ#Yk3{5O(| zlBXF>yqPxh)pWILPd8e4D{bX#=o;0YVXWor=sG258*O|&U9aSs#s=O_+m)PSY~&rZ zgLl$S)t+T+;$5_h#Bh~n8=LtSx`l70TREjvDdZa6yodG>i*7l*P2YZmP!G#v`F<xfN9Xy^y&RN==gxSjx7Xc zVSTDT*%DTEz)lU&UCPQqw|q>O z15?2&fvFs0g1{_eRlrn@F(F{8Sq(6;nlUO2R4uCms!k6>q`RP9&z3`b`Iv?Prh%;h zX2lp2(UbKam}itVLSQT5w+enu@N0%&sXpLKWvf{Wgt?ow0<#8w}(_J0A^S*o%$Z1oo!-Wz>FwnGg#W9Pt^B97}gmU$k9p1f6x@gmg>F^5S-J`{C zvA<|9XfBEJa7j22E{b}EUyl}5@ZEjf&4)^iz|NBJo@iev7$0%DGl?00aAqD!{{>hP z_afYba9{k5oV%^$S8{Le56MF^CGR7x2@(u=6*l^RV>i7m?%ggllsAXnvbD z>zBxO1DMXR&^<;_+%HoKencLN|Gc1ykVobFg)QVMxp-a#sC(w!NVY!<%37*;3K`2mPpnvA(~<+o)OWoKVfawZwuV42J!lFKTXI&m7E59z6JT4pR=96z^pzh%;3jw>hyG`ei9`N@?#c5ew zKb@SG&Gn7b9N62Fh~Lw6T#569N6EB#4MQBlE@k^aDE%5iov|lD(ozzMu1EHd04C`auVUj**sybN zWWb!LCK-=6*sQZL2#5h=OPtCpo{tik*_pMfJg`+OYg)KGZ|3tA6;SB)O9t;VtITBIzBb~TKP(o`Wic*gJSWMeV9?X+ z?d{Ve;(UBUYch$cqx}W+L1M4UDIyyvnihz7d;t-OdW1JPAo9`VgJ=?JF^iasPyj$v zLC^4BR;xsfLf|joAyB1RggOrMQNlY!EI>&kQvt8IHAz5BLVj4Cf@jujan8Wz2XfZh zellI&vUVNd>uWFO<4zDQ0I-J^qRJwKB7|aulKA;`4nj)hM{S1|ECxm+q7*-=0xCX> zC_@-OMjl%qCFQbU!=>tS)U}GE=;k_*k2JYCj;ix7V*y zNm9F=pz_TaX|kw5dAwKT(1l6*O=mPTpa;jyRmykTD@nDSx$$l|`%i3acUGfrh0N$! zl2L;rTwxLF)gzIR5RGzEhe1}$lO1(V>=P~0*;zwcuG~T=Q5=q(sT&Jj&f$la^B_Hda6?+s_e~h3e z3`Mp@sMIt72m1s^z}xIW9tvlR*oMRm(*_mIcO}HM3f**YZ?v~hY(#yPAQdsx;A0uV ze9_66R@vE8O0wk5J%t?|*sV4QRPz>*kN&3!m7;DWu6S25C6cuXJCujbD2-dfmGMhG z*~F?7`FmGZym-5xz{7c$=Tw&;mDk{;zXmWT4F)2CP|&l}+dHr`6x0R$K?Z9NKvNSh zg(tcPcD6VH+SE1_)y*V>d-`;^BTLZAY}C({kM5{SSEjGtJKw~K_c+N^bE^YYZR|NU z;?M6)BAID67WF5I8u*hEn$bA2ncga>r99D5oN@cI^0furgU591n|@;2Yg>Eo{~>G%I6 zFrLKG%B;GH93qU?F^P$r5+6n}3~>3O`>yc@Dyc+V4KPtd?(bU*Rou&c8>aQ6P5=#! z)q2O!^B!3i*ybDoy4NP3$(=5b1#&V6uF=9Su_t~u@Di~Gv*iN=i>*NtKRd9GWMk zh)*68x6bilpQ?Bcz!Mp3o(IJskne}5kbAzc+3)~O5LIO_y~Megu2AleR&%;TM=|r?m|i37&=IF XCPWm7M0IibQk0X1yI>x^;V=ISFpjp| delta 4434 zcmZ`+3v`sl72erwcJn4#@_-QXfCN}b$OA$`o+N>UKnR2+JSKruwJlJq)&7cYwNwsO>w{|Hw3YQy(RwOvv1+x)x4n0E1x|{|`M>|p zH+SxxxifSByBFRkuf0!_eaXoQCit5;v442x!Q|?YnVFbbkKr*ihL}K((Jefd#wyvO zTe*$ecpQyW?N~jYC(s0*NE3MyP2$NknWxYcK8;S}sWg?R(KMw;bUU?!Evr7Ar_*%B z+4KyaNi&rkr`vfJ%|bcE;`JGPCe2nI3HmIaLvxf&^w~U@<|;W+&*S+tpBK;q)lSmq z@VRs@FQkRMh!!a>S)a$})A@V>U7*@2x`QvI3;80th!@jhUP4RwV!BxMP18$x87<@G zG*r$jXoVtE^(A~MU8>|Xy^=4Z%Xk&7Qf<3l&6m^VN}jIQ@LF2S>u4RXr}eynHYh$_ zZ{#cJ3MFUgO}v>lD>+kd;VbD%C1>fYcq?t?ZM03bXN2_Cyq&i5HFS+4X6kEs2klUD zw!V&c(oQAM(%171bc2#}^e(=UZsgsxTeWBFJ-nCpDmho*#5dE;d<)&ex6-YO%hM_E zqkY7rnGW}B+l~;ro#nHFAv1Nd&>Xsh&84n36Dwpz2TZI;OP!3N16nLF^Vob~=1-a@ z33Wqz0dqjxp=FIQ(9wWd$QA*!D9Q{1Q_M<$DTy*ez$|8^z?4RrVOFNuM?9=t8(|fi zJv8DOw6Y~^=>ZEJ1?5V%43w8em33gMST!)!QHBGvoYeqR6J@->)UrBY>Y|Jfn0nR# zOoQfwiTa`4$W}mmMO0%aFior(m{4<+5}HlxgLMX23(RaKJgeYog{KXk3TXB$9cjCE<{A!XXaHnMJ@#*tz@+U`LM>t&mO znNZATFttTX*7m?O%ri|8v8{|k@7{RA23a5U_N$<7Q@CAA!8ho|F(=z`AeQb^R$N*I z*d1VQ7!05dtA%OoI?<7$L25(lSXR|MW&f zSYEd*SX;U)AWC(g+ohN4o`F*TL~z*WU9z~mtTf;WY9)S`d(<_g1&p!yayy~Mv03>f z^@osr#E%i~Mfi#FQqDbQa$Jt*-AaBYt@%%pqw-9C9^j>Xzx6@Xc}ThoN{C?`EEq6P z{}D2M0AZ_NXinWLj!J9c?c`D8uEJJAPRKWk+R5XxcwPXg!}D$++fReCBS}1p1AmY3 z8-!Mb=MW5pUm-k?a0cNI2qzJK3*fK`C(2_8XeUgX!=y7zR*DB?Xu%q@Ld?-8JxZd%eIr$MZ5F>8EvFD6^#Vv%KGoC2fO=`kG(Ud`-7Lgl56HilJ~yaVmmvNEbT~HP*F8b;C)E2h0(yv8d;_Id z5MD)i4FF=IR`n(l4q^b za!U3u86p3WPn6`yH1uoz|%& zSb@O(2dD5Z!UqWN0UWn}?YhN>u$@_QUv-=HZP0Y2$lQ)Xd8xXJyd#U2Hv-~}CzkKe zxP~_voKmwl>%TbA67i|LqfhaH+){7NrL+O45b;%wB$&nBVd?T_i0E9`8 zco7?a#D;~t0;Ay+wQ%F-O)=(NoCM4P=N4JpWzWY6tm(y;8w+eeIWi*CP}ld0ataPJ z%fQOw&@<@dNdz~-vjE{3zl(_!lq_6xd4&npKgVvh2!e)_ubOZ(c0Gjp@!nnBsir9s zL5s%uhMX)o;n##2n>Gl96O7YDze@x?F5M|}SB2A5UQx4aLrW<{eo;M-d@RdaYXR{z z>~B2=slm}^Cvh{t&~b}6CtFtQ)|t={|CWz{_z@0$N6v4rOMD;2B7~Qvw>>ih?~oWp zz`-JjQntLKeOnry)o}dinA7cY4{HJOmSI~HN9^j#e+YdL;)pB@)@Enq;pqEtbUsQ@ zaGAs$xnXTq^;{6YN*aYot4jdYS0rhOc___CxNJI1JR({CU~SL})t*VbEoXL&kW6`? zV;$hxj&}=Ap(8x4a5x;OvJhbrLNP*#@#eZ%LdxXD&N~-C@n&)mQHHN1QI7pky8Ztc zdEfdVSt|24d|3d0!NvFBTa)XHajB`K8KH|4cX!`>#C zP&if{Mn}4+M+&M@lW0VMS`;)8*5l+`P*PKGMd=`N&GPi7+Ir=v3ES=11GQ>o9JLR) z0$Sv(J3U_iuAq}$wK>YxDp|X^z^Z~#DhD>dN_ymqEl=6imliLYu!A*6tmu_9wziTj zhI8we#0EvJsYldGt*u;4q*i_`GgI zo+3byqbU?P?620Ns*-Q3{JqoRb>i|84qe#aj2W-SX2!kQEPBi30Ly7Vg zx7(_&c%re2eS>se*&gVRZXsa!ZF%RJl2xV+V~-0r!m za~!qDjPsu7iFxPK^5|$8yo~ds`$#s{ZhKNMmqCknI=w!@A(x$(K0Y@MOACjY+6D&| z4+X}(e9v^;F}12aR_GDm*bo0n=qol_VO5KQ8@}YB_mMmmOtpXN+opn< zjK<>-cF9Ijn7JF>P9WHjOhmYe$OrRt2$SCz-<-v;Pn9Q=aEN_FLwK&ALN%vs3fxAX zHO>YO#w31<%&!r0rFXn&vZGJ=jG*M00P6c`!;g(v8uT0m*f`c7i1RbmLwLXrviMK=jG*M0D{VG4I8=nST#KLON)#2bMliDbM$jElk^KJOEU8FjP(o+^ouh~ UQgsUwld}`kQ;Rp-vYwFz0EYAx8UO$Q diff --git a/vllm/model_executor/models/__pycache__/nemotron.cpython-310.pyc b/vllm/model_executor/models/__pycache__/nemotron.cpython-310.pyc index 54a91eacb5662087151f9c1ea6689ae1cf85236a..0d8568c87717448b4046319caed9016ea347f641 100644 GIT binary patch delta 96 zcmdm+ygivapO=@50SFA&?%T-i%Btd}Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS uUrlVBDNl2AkJcqd5f`9t4n`g}9!3sECLjiq%$rMeJXryP@fmyo delta 102 zcmdmLUpO=@50SGF$HEiT|W!3Q0FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` zN!2Y#OwLYBPc7bD!YZW7R9LaOL+cWwm>bXp4n`g}9!3sECLm^GWctsb}rpO=@50SFA&?%T-yo=L?+za+OnzaX*D$wSKPNLu Qzo4=tBR_Am67zI+09u(8bpQYW delta 66 zcmdlgx>J-ppO=@50SGF$HEiU5&!pj_Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(Fj(Ive0Il>Dg#Z8m diff --git a/vllm/model_executor/models/__pycache__/olmo.cpython-310.pyc b/vllm/model_executor/models/__pycache__/olmo.cpython-310.pyc index db57da9721854b4a38bcffca981cf38d75114d8a..8d0aa1f73108c4792a9364c124a440414ae899df 100644 GIT binary patch delta 96 zcmccPb*D$wSKPNLu vzo4=tBR_Am495{Mrabx0kK{y|M4W)SIT!^vco;btnSdBbGH>Qp^k)G8v@#iw delta 102 zcmccSb;pZ4pO=@50SGF$HEiU5$*$q0Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?5(Fg5!u7Q(@)idvc;oVlF@vI2Z*uco;btnShv$k?B7Z%Vu^(e-;3B CT^sfQ diff --git a/vllm/model_executor/models/__pycache__/olmoe.cpython-310.pyc b/vllm/model_executor/models/__pycache__/olmoe.cpython-310.pyc index d42861581936a1ec92f5839e1e781a51309c99fa..78f03c7e6fe8c186348ce5008c92e198d843faab 100644 GIT binary patch delta 961 zcmaKqOH30{7=@ie+dyf+XeoWr0x3vEZ19C7xH3p|i7WtlbXsa#+j($j27EsgQKYE+ zic2*n8WWAtCN50G#Epqdm*YYg8e^iyja%bAGcjolaTeb_bME=){`cPbIs9$dqj-f|2c=f3#?T!s5bV*I9d9_;?SvI40_ew@i>XGIW#e6EE9@BG*TwZZ^IR&%)y6(AS zXp9$|PE9T5bvD8^8wC!*txYSkp3fSJp|NqelfV=(!4a=xJD`(5A0Ps$^4t0kRjwkm zL{By>G$bJ_0b% z@pq(vzyL7K@laq}F;uZ3SVj8bPx|H{4+6u0)uKk}rdL6$dn>sGGbm*{fuqzP7+s&_ z(yS@WPNl_kE~Bv&-4B>vjk|Hj-_MkSLH`NloJ^Fn8FrFub_zI6t3iL)8Kgb--p;{J z0_TAgZ~?GeS`K{@4Eh`z5R7tHxK7|Z+}(UPY&B{1XYj1)l$7aAkp)qAoPIU;de3sn z57oM*BK1WkeQPd6k0N_oFCpvxPdii_U5+dwO3q>9;I!S=G1-mLBA=w4e# zY?;rPZbP-b7XHSFW2|OcnUihvM)`Z&IL_=qtS@{Ei6|fgVUBpcz3c0AJ0^#2a>sP4 zA`>Nsu<4dWRn5y;wnCllUtK!N7RleCMXy2zfNMZC;06YPJM_}mEX>oJjtODD+`j3f Q!(;uDxGOeK4V#mH0FF%TNdN!< delta 1001 zcma))OH30{6o$RUwt*JVK!HMOfz(13sSl#EU}Z2d?vN-{a2SVDhM9JTGeZf!Ko?bB zDjap=g2+aVE1iVIjV?4U-I~lsjczb5WN(c3%wR%@3%mI4-~aySKF*yVeLwpGT6uZd zF8-TdpM4RK{B37alLn+zO%m0VDql+J)8?3#KiYBlP|A?a%t2k06fv7ItQG$OFH2jm zgX^B&0lt9kHFQ-r;XK#SPe_wnCTV$7&Q5B4*$dBrOoS2*U)?dSCge z#HWx}@p;w!o}B^gsa`t0)8z5wZqTVJPnaNR+JL%SzETQ#K1pn?zSa@i0@WiU(u#JmERso2Y9HUn3d$-mB#47gXGCBtdd4N@ZECc!x-1N>G0jhXnRp@*4PYb40{p*tHNN1WcbQ_$qF zy*X_pqe49y)417qymp35-fidkoUqf8_LYiSJQwW_%~EpbzW6lSoxDYb{{J|g^C~T| zLUe&DJTON~-X^`Zt#gG%T#pU0C9G~b5_WPBTu*Vm(d}Nr^|H9yl87(!8QVXpyIvFj2P+)u(h+Sc@0w_Bv)5MSkLNwbXFN?SkP{XqkamG~6fQ8^vxXciu#w@uJ(h`WM*GJvxHL;Dh&ZIQMrBmwPjIIp)w@E_)OIr1RS=htt~m zC21&nQZMLzMuz3GM&F=P&MT5qNy>$Vq`qO~HPuX6+w9OVr`%8A&hufmL==cD&Um6w z#O<)(Jn|e0pkl-;yEQt?5R*g^Prb+1Wh!$h`93>TDhCMN{OS7$t|G4!!fX28|6#Vo zI}HoVsJSdNC|M@fICIWIDJ^G8Mw*|lFp>HdPQuP4syB!UVw0FAwupas83|~h;00I4 zNN|+9+SYEa2d}{+^H{^8XiHg{1!;s~D%1ld%!MRa$CHri{qJ@Rhg0z%d?3;K&K>Z3 z_{6_MYqu%d@)CW%)gJbW-(VkW;*e+e&EY(JlKRbGR?I>Si#E3n;@2qxf|r7no@LxI)cRM%n7R7Ty+RCJv&2 z5)%`AqKS9@1xC}zwf_Rq8@V(54PNVeiY8tdoAlSy^PcDFNk7c)&L-ScDt<&>z1{VX ziKJS)s;_uLx80^;>$WwoFZKMk>ztmbPwJlKo8wDHvtzVOFPK(`;xrdrPye9FmRum3 zKpR+)7*jEPhHK7A@iV4PiJPA*8oIAZ5!Gp47qzR*+1}q;32OYVaRO z$VFl8RTyFS9#mNS5mZ=^EIwCoRT~3Gc`q}hzFbmz?ZBzr%&{rRo}%NB`4?SIcknPq20!(a2#m?6<)+?H+CN zmUcGt^smEBq&I>+EltX@6C51BK>2NW^FRs7#NnFfe5TT-ZGKldmAfqc7$sv#ijg93 zm6V@Kguhj;(S5E}@0{4ebOCq*D$wSKPNLu Qzo4=tBR_AmI%~Ns0A<(|rT_o{ delta 66 zcmbQ`I?t6mpO=@50SGF$HEiVm!lL1?Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(FnYCON0J;Mewg3PC diff --git a/vllm/model_executor/models/__pycache__/persimmon.cpython-310.pyc b/vllm/model_executor/models/__pycache__/persimmon.cpython-310.pyc index 7102bb86bc008e256a64975c2d67702cc5f4c067..3a1f8330cd908346230785055b41c191d1ec45c4 100644 GIT binary patch delta 531 zcmccZdDW9UpO=@50SFA&?%T*+&8p(9Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUrsc(t(tNJQ~u7RTo#7MH{W zWwVQIbK0k$O%}K$3a#424DVZ6HlzAfg>aFo6hG5K#vrCQSY(A3QIffh!AG@t=R$si&fM5Jua6FSDkm_6B4G>0)~@*>d& z#?;BmVu9S*AXyy{kvq9w>@riK^yCon$>Ie-kz1@qiFxU%MTH>QA`nqL`JcGBS_zP; z$yuZg5-9@_Sy~5pM)p+yGL~ z0#R=S5@?>RDVxaHGPzsUQm6?@vIQ);`I@Xb6Jz^iJ_TLIj>$F(a*UmmqZL#|Y=E)? zj694Sj7&hx#>n)aiDmL6g+=nMAZ=nGq76hafe2O*Q41paC;yU=WvrWAs2IywxB0x{ P5+=4xka*qXN|hJ@*-L(^ diff --git a/vllm/model_executor/models/__pycache__/phi.cpython-310.pyc b/vllm/model_executor/models/__pycache__/phi.cpython-310.pyc index e081a8c9c3db81437b1ffbb9ab0d9ff3e70740c5..150fbf81a6483cf6aca62ba038faacda8858509e 100644 GIT binary patch delta 571 zcmbR1I@6UqpO=@50SFA&?%T*+&aUFBUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUr} zlUQ6550uR=k^zb50SQe`uvJ9`Ab~;_m!6d+SmaPlr5smXKXI4A!S zac4}P>?G<4BtP^U5XX$~1yZZU7OQAoVN|^|l~^=E(+9 z(TpvVd!#Idnvf)0Ad=Um{xIdqPrfQ0s9XsWaR(`3E;0nMt3ZSYl0fxjPnk5vj>#Kj zL>b#BACt*o?AWX?yOL496{J!eM6`hjCJ@02BFaI;gvs}LWEm?ai^`WXR&4H-U&q7- M3YMaZ$&N}f0NU$}UjP6A delta 572 zcmbQ~I@gsupO=@50SGF$HEiTAXV>u5FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` zN!2Y#OwLYBPc7cOjGdQ_F>3P`UVBFFc%T7A2_PbI^FO{8CdQP>&4Njcsgs`xwz9>7 z#N#Fx3I%effS48_B5m_oA#Xml< zlWc*+pmGIB#2uuBxyTU2t^^StNCH)pU1ie5+d;x6AVLZx#|^QpZSovXX^6pO=@50SFA&?%T*6%&6j~Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS PUr%S;lYx-7G~ zzL93Xv_w;=O^-ZOq^;Jv zUE&EpSzEN6l-jzqte(*_$xJZY!xQmr@Q^;(uZQ&^Z6MjJWzJ{&(<$SEw7rj&jKTeR zW*Ze{eg(J=Ts0b-f16mIY8)v>bj~qp9)W+28l9&sdB|?yCUNIQHco$>qwIlk>A+>y zG7f)2pd|60R3grA!I1SZdtAO30YfP$0{$4$?a^6 zw&aL;8fRuna(A&DopyJ!oH5~EHCc1QFG+ej79ZfZsMm8`Tx-D-X7}i;M>QAFS|Y30 zVP1rMNn!7ta~ZOH;VCG!iU8C!ZF`gURmhoYQa)3TXKC1XX77C@VS#zZSD>fpn=iy3 zQoVA*_UK>8*Pv!7p@i6+i0o8UG;1{$-DUcvL`CNEci5^k`J2kbjK57xbouR6@Q+xY z!z_Pmi8@s;+aO(yH|+c?f2hX}@0ef)rYkl7+e9poV4JiR=xBO@!ZQ?hR|=ajHVip< zl(CN#3w@4MHUs+=@EUjvtOM=95ugQl4-_b^$qgSMO@IVE1wPT2=2ljubuG<`M)cr2 NlNk%<#T${ce*wnK$prua delta 800 zcmaKpO=uHQ6oq}GNn>IlCM{x26PaR?$)uTv)Qv@oh=|gK^=DJ0WvpoojY*wEB%-K0 zt+t6?tXh8>t!bNujbZ#lw2GFf8dtV2>4_H!G zt9b=~vQN%dEV~W8|>3AmEI;8dws(X zSdV^e{bgpm#0#|ZzzA?bw{Q3*usp4FC)pL!+~dY!_!r6U>9*t{4**0-&lxsGKRqMt zj(%$6IktZc{xyyTgQg~9QSCa68^Ab6&zg9;FQKM0eLNl1n&IE%kXCE$(9^&PUM#CNncL6B8EA0u75DEJsx_Vk}^)NQ+_@8>Oz69h_lTqdwJA60D;akk3i>O?!06+K)^?$#n#w3iR6-cfNp} ztS7aZT3n=zf1mv}k}yY!X^){NNR=Athu_KWQeJYBC@HpkOGDaAs7XE&VpBZcWvxei zU#D+UJNI(|Cv6UFvemn_*GtU~IvrTcn{$Dp*mxX9Jt diff --git a/vllm/model_executor/models/__pycache__/phi3v.cpython-310.pyc b/vllm/model_executor/models/__pycache__/phi3v.cpython-310.pyc index daff7babb1355cd338abe76d40b2049d301155a6..359db8a5b9d3981b044ae1f7fffa05889cd35845 100644 GIT binary patch delta 867 zcmYjQNmCj@6rO)KovEEK*5M9N^$32M?*_ zkc0k!oVcedzah8$ljM>-JBgKF@#}^ymP`Tc8EaEf>G=&8?ctqunW7(8g`57k`>mO_h2!` zLQDx8!XwtjM$Y2bV3W;WjI$RP-j@%#e2bMnG+8ml7V}5ku>X^e36aGC{*oe_v*RER zmF=*7rw%K11V{M*JA536cr2=JJKz}a85h|iPB56{GAB;qG?(q7jwudKi!gg`k@agi z17~oSgZKXP=6K({aB*N(1^%mb-~ujk?Y^*KMg(z5Z_>_fn^h6H zYh}kZT<7fvB6)pyqw)WV*t^k1==!PHSL-uzaHI1yHgJ=tv3WZmkrL^Wt)%~X;dy1r z`oV}~%mU@j{AoU3IJ!6%h4=`)I-vx;Hs$FHGyk@5a(-5+a`>xV+k97CHkWSvdSI#a f`Gm)ErdQr~erYAp{b(011#l5<(In3t@*q*!MLk;8RrObp-7v2zcNWtC9m3i{j+P z1N??mdG|N?SG?#!eY7RTO!f4)z1Ll@YJOenKQDF1vBP24___G{@$l-}k!;dYLz6U- z8O&sWp=->|(n40a-U{Uv)nzr*u&m2ks8xF%xxl47L)KFRG$?G5jpPP5dBCH%RW?yG zG%H*tTgVGu@_~<9p;c)%*+zcwQvd=KgrL&OWjlo+q_AD)J17icMJi;3q7bD{=v2H? zc2PHUE9{UlibGssr%X^1k_uPJ9!fz<;cD4Seb7h!(64xn9H2oMRJc|S(J%}%u0xj` zp-~v6G^BMc&qBQ%qj4Cg3}jTGK~B&lOwtrg(KJlc49w`72#MK(4s+ND^XP^J^uVHU zV-q%G3wqIqt=NWs3}6u3KiOdkL&B3YVF!kb1}x8O7{O>!!>Di;%&@||6T6t_yOgjh zs>F&|&6zwJtg+dRF*aku^=6&p8?3}J!Ae4GFyG_@lV5b~5m`*}>J{0X75lKiXoanN zbwH_uIK&rt#MdbkkA?N_1RUm?5niJro5wWA>^O$w9NR`6Gu(JW1lX(;S&x=8a1y7u z@y-Kpnu}*d1vkv9hX1oRoW(iL?g|6vg%1}vmlox!j};ejsc7&FpFHTaxh#VBM_F+N zSGgQS>gMUK#@}aR=T;Z~n?13s_U8g_b)Lo=uJbh3@8%=MMW$dW=>J}LQCcv6HX_T3 z4`-(dd3>-h6Y}U);^gA|@c3PCyeFABJ31G!ll_CY`>(}W$!zmfIk)+Lv002il_ul2 c(_D%)ifYsQAEm4CH@EfW>34QZdlO#cFO;X`>;M1& diff --git a/vllm/model_executor/models/__pycache__/phimoe.cpython-310.pyc b/vllm/model_executor/models/__pycache__/phimoe.cpython-310.pyc index 9c26fe188e005a5a45a57b9793b753dd1993a01c..77f5a83b2c0cccddfcbd3a52ba4b2d5cb750001c 100644 GIT binary patch delta 1289 zcmZ{kTWkzb7=WFvuIjd0)otyf_uG`!HkDM63K1I83(=A#U8^0s>FmxpGrOZ`Db=9p z>W`vA)0QZyXeJe2D(){HTwY{f2pSUcA|5?B|5>8d+J|q>{P)Y5{iwWCEOKmY^fdM> z8X6t83`b>^6=+_iK=CLJ%}sZUnxn+)Z}1j*^#aMWvp{Lm8f2gGDe9S-IE`CzWrPHb zAMtZZa)8AU%v5I&x);%e*aw*j+sFY3MkgAOu-dfh5K3DaHVe_T1z!##mLpam4ly`q zQL)}%C%UMp`Xx=J`%r^k^e`k@OP3sA$IuLMuOd=S6{2Vrs{R-4kK-}xcA~?WRm#|p z?$ZMvQ4c3>L-(T$tN|WM2Q}#>X@)h)C5)_i2qu3`!~#MwR8~ZnTIZHLzTLFl=$xw) z+Yt+K6uPqU*lL1WgE%jfsH8UwBd z(Os`n8Erb@tldGn;E_F>bifyTZWh{yg9P!k4iOHACrrYoQ#@~gHTibl?X~BbAQY)8 zl1HOwQF#t=0dW!0%^<{t`@Mt$zPcVfU1o4b>}d?pWAI{rqx}?nuc)XH;%GIhYY`BeJ2Pks!ANRx z_DM`$idcqNjlcnfW~!pJ%jMQIA8m%%G|4i6s^3FzOWPm+Z>JEK-a1*>o1Q*d_$vKA z>4%Ptm5kWxyNv4-!Ur>Lq}{lgnMG{#M3rwMlnAqP65)H!-B`Y&A!Z|(Sb&k-S}X5o6a(VY=mUgqP7gr;s*ypTFEXZX&3rh5%Ixyu;ON+?jf(-(S z{!vt1V}X!}v6;lEiFi@);u4ojW1^@RZyr2&)Avs`g5n&$_s_q)e|i6V_b0bbN=S&C z!@icgogrN)X6aU|SEg1`a`2*6bk(2}q+ zlDLr&pYk;+g&2M89!^XB?4T`(Lx@($)bAy2N~?aCX6+Hw9A((a#nBG@=|rqRtVE!L zZ5|csybi%m1=%ZlWZH@rjH1UtZ&*dzV7p;K=KsQfds@?sFlg97{4iw@a}Klc@Z4sn z;EQDI!s|{ju!^fu_Jg$WC25B>#!^PV@y7zp7>=isTd>P)9?r&tG@$gP_(#}I%fkt18JsIJ)j|q_M_8T)f3811(~OrXw!R`w`gzlHrQRw_IiP@lc|J0 z{m^f+5P)%09_fY8rX^W0wtYv7$(tx11(3A*ef|0*wMXaB2wmVKWDA&|40aWdz@ zjH`QdQ%OJ>&NY+NAj>#PXb6v}NNTl+qwvYRPdkkD_@N^2+g>ml`M(%uGUM>b8FkHKDBXH596Q7TIR}(e>VG> zmohT`pM1o^hLL46qvbzF#y^{^&oT;eF#=7P4AR3~#0_HeOulcU#>hLF&32;{2T0&N z$d0QZA|FKT01=#%%5|+t@o|gd8Uu8@H delta 375 zcmdlxh4JtdM(%uGUM>b8sNB}Dk-LXY!&kqwxJW-IKRGc+KPNLuzo4=tBR|hr&(J`> zII|>Gw;(Y&J25@Ac=K*H3myR;piVXhHYPSkroSwVZ2vbi3g4AyjM{wPNP$u63sADC z8AN;o5nn;XcOaq3J~_}(bhDm`I}^tb5TCK=&*WOOWsJWktC%Y@{@(0iUdqV$Z}L71 z8zyGP$p=k@C+To*mau%t2$cI}b(T?xlM!gtWROiHAbFEwi~6`LHzR| zyRL$Wd=Rk%L~v|AZCk;_$THc*;Tj|3g#Lr%_5lf?GrB-*kd%xJFUXjm zAYtwzKalWg5Wxx(WuAP)QH_yp@_$E3perSvmN0T`-sfb*Bp?Wq6#x1`JK3xf)wEjk6thOu(pphR>qI@R7pv$ht*4p|qLDUgo@O?QX4bY7ag=iJ2TAHVhvp**3z}wcAM+Odb(b8(oSt>nj6GMx>55i zbCcLiH*3Dc+#ssP zOZ3q`(NFuez0BM#9;1&5N~zdG_lN;HKx}*^-+P46eXM|b*>XC_3aO8+phK*P4zps) zHriMTGmhGr!IO_TCl z##-j3NswAu8w9n@EBjeHm#l+_*lHdgiDhfp+M`Z7#ny3yt>>knmV(;JHh_9Ss~h=2 zP>)jVtb@ewEMV%?w}(vdx&Z{@B*9_A7o0zr$ohbQrbEF0P*@oXF0 z4&jG+*QqD?^l1XuZ}1_wmYn(~Kdi4a{J?1fW$$1fDBFW&^FH2xB<2W-{^^s}RYyWh z;fBhvn5>-iPnL&$a+HV58^qL@s1^q+P5)5k`f%I1hFC)BSohkeiNq-eMj0pRN zCk&_bqUW4CQFM;HuI6%ct*PSw5b|3UHja}wRCZd9DkwcpE~uZC?grIWHbBm+@iGJO zHwo$1b7jOH{|=-u>~dDUSbi+|ZOnHW0cAOBbytK*&AY%OF~eh1feHD0)SpIp62Mp( zE#VI+TtWCF!c}#ra)Mk^`>IxwH`TGKPV$y|x2g*erd8F|KP0p2V)Y9-dZtS_LRaB@ zbZVt)dSJlynyhABm7epv7<(S!Fv2kaBQ{#X9161tPas5ZLglBqRafomV8VzQw8-cfOrqG{ztLV8Lf;}i%9x=5O#*hzu?6YEn`kKHF%Q$ zisN5E(CxXdPBs*fId!(7pS-U!8rzFL0-q7{wfBJ8QLj}jB`k_zDUBv0q?MH zc#MbSRqJ-+9kMi<9enUCAM#X*>E-L{ZgXzzS)>+cA+ z5&i){7y3h9(-#VRr4OEa4eI{{FjD4M9SXWxcaU90_?LR7#hr`OM;v}OP2>Dx)H@Um zMF|gvpp)lY%7{mO+~Rho+wDZTT0P{Z8f-OSp*-E%M{cO=t)1kCRovEQkNr0$y{pDM zwi1W+a>v^a@{#qOb&aGbo`53(Ar`>Mj5uH~MqB{iu@UcZFfigDm7l1a>kIM{G3rxH zv=L#GF3#iuIp2;Io!d*D7y}>EXu3$k!yFGMN<#M{_2bT)WQlcjLpju19kOla8M@3M+*f;ll;Or%Dt05zx0NK6Y_bCc~!mGT~C&( z54#JAR114{I+F-I2i}uMmRsNMSz;&o>eRMul5hQb+Z*-_Jv$_`ZIyADeF4Hvb;8r; zasY+Zb^^10u0HVek{s2r^LPe)>1_sq7e>$wN+V51o1(7m%o+KbHbk7`L4P2+0auI=5Dasd)j z`@tFs9-HBi7gW=}ad$h${Tb&fM>#QCRhxQc-xz6E%e_a*2kJR*TkIDY(x`5E3-ViV z2zEiXB8x?qi0~%D2BNOz=8#&oWiXgk3jxMcata*-0FfBUNBOi&Qf{ zrnPC9sniLwVW!bEc*dFOB7S?{!oo0h*q>Y-VnN6aZHfx@4 zE)y-ZMYPgZZD&lIZDKiHu8mByU3Ab6(MdbCon<~GR?roqi*{){+w2xA=}OIW%vEAF zU9I^-bB*YsJ(@2v*NR@+t9h>3C)Uw*n&+A8ML+Eq8|VgY=bHm!Bi%@*Ev$eoHaCgQ zbh8+wgWxP+h31ghLbr&A>BE9jDz?(C#KPTt_z0ofSP|XMmQWunraM>(^|MmClaHHs>jvaXxC~Sm-GDmah}rGYhq(m1CGP?}gXD9v-q6e!DB3n(po zI@Wyvq*m4jQrle6Znm87VeMS94jvq}vrhKVQ5y}h6}+5vaTlmAP`lYmP{UeX#rJ~R z3+igN2Go752QqZgQuTe2PHX8`uDpJ%DBN&3y1k+z}G{)9J|Xt&X_z z9#1$ZJ!W9UZ+gt}ou1tXLSuoc+Nx@=CpaGBmAm~Tlm1;i7_mBTWf7`AUc8^Y5Sb{v zX{5Xadsv=Acn0AoYI|`$c~KoI&QAF$3O_^mIl?a@-!HyG(oX}A#sx!=(q)rA^qf)O zEd3QZt2)y2B74g25b~y{NRer?`Ij^3t*aE7c^E&q`Zl_-a&7ev-_pSF4}P)!n{<(Yhqt zgLSB5HGRhZc0kn}4M`Ye$*@nMaXaaGkf z4y61Eb3BKj$Lg9o(O5*Ts?&`_fAa+L66+W$gm#ycZ7BT8b2;} z`F00_vJWLJC~6&N`(ygf7tJNIqr9qjPCjBTirKFPUNwbl~9ZN(V8%EM2dO_2pk9DwZqd%81xbLla357 zW{dQqsasbgn~$0<3a)C4yo1_Z02&|M6XyINm#?9;0G$>DJ<(r$0bM(Fgs0}3MDuor z$4%x_{kw+-LI%&rq90>2J;{$EU z22fb8Ph;=@g#DJLZVhyjMar{rX1W4>1kR#>8IZ0td4I@iA)Ka;%7E~N0+W0S<}o}K z3VzktMQsy-@u}GA#$m*C5Gx7RphxZAAX10U2vND*IYWnJMBm0Xg8Y&|nsGgy!tiOTqg;PYgnvEPAI%X8; zCVKdru$^8idNu1ezpC13*W#t%Nl#87PS|cRxiEV+%@WbN3mflyv?=4>0VE&T>gq$f z&D(%QVn42g|Kn7Um-L}}d}}?qq|R^c&#J@bwE&-AZu;bERF%WS_9l==tg5giTm4`- z*9qT&_oC1x8`b6E{}_9?dV5<>>Uk)E8vAM_cq}ffJg+?4C$iw1&?5f`imXI=UaZ6x z_5AiR(yDTNN6B^dU0<91Qw(WP*L_8c;j_{rE6`qs%#Lgx!UcpbqB_%aNwwkIC6wDDSz qdfN9Q+lQbFz#SuV0HXH5&Ivvel7*-gBj8??UghJHP~e;V?0*5QQ%2_i diff --git a/vllm/model_executor/models/__pycache__/qwen2.cpython-310.pyc b/vllm/model_executor/models/__pycache__/qwen2.cpython-310.pyc index 06ac033e1576a1ab6a30c00d6a695489ceb834a3..6c494900d315ea245caffe7c579d10c1e940f993 100644 GIT binary patch delta 831 zcmajdOKcKR6b4`~1saQE4Du+YJW8o#BrSHK(q)atMw7-3>P9P;2~ZgZuR{=((kfLK z_0_X6L};q^VT>_#_8Q}|n=TC-qjBlpxbyzd7~@73Uk>MkBJU)g5Cq z^wu48Vw`hO0!KiRzPszvEm6uQei)q^jr;Z+&E8Y2il>S8S+v`A50_Av0d`szp3J8e zK8r>b%z>N05AF!$Jv$epkpOqWd2kQh2Y(*YV%e4@mn^5-&c_^7P45&M_8T4{XVAAl>eM?bFahL@&}po0rnq)N8mAd z@-Fz5v1{~gAUv^*Mg_#cA<&Mui7E;-LCd0QDJ92mpwUjFJEu-%lw^u~(7H~Op%HeQ zDxp5sq^F@7XASLt6QFH}gQ9~`c}1Mc-T%o7G2sIs8mzcq;J)WrGk4b7A+Ay+e1Wae zLU_#n@~^`+Os~>*c#5jNhSLZ*4yFMjDBmdFVJ delta 785 zcmaLUKWq|l6bEo01saPaN&~b7PFtXe#$JtoqC?}N(b&Y87^+dLo`8To{{4U|wzgo^ z4)tI2CM-2psf}SWm$(_@tfLcye>Qg~69?~mRAU^x;ggql-`~5tcWaSm#Fn+&yEf=o z`E})$tz_LkDwhgERmDSW`Iae+wvza|ZyNBgMsuJL|o*-B-js%{Kfs)KBbpolh}vOoHpMxPP1yeHHMZ^cL_V{>j3$dMJSm>T--!s z2F!vRKmxaP!kgBIq7eaiz!`8C%!5A~D_HAM|(w|jSI zF~_317sq;5A_+=_4$8Ld$cJoaq1cZ3hy5JeaSq3duQ<=n@toLsi92~OmhHr06316! zOB4v?_xq}Qj>Q6^HT$Nvy1Kf$j_>}ys%Z}oyBT~Q{OPaF|Jm0vnLpx1|7QdjkK-Hu zrIpF}8871-zS%IEre`*@Ue@4swqZ4MUao0-b~Eqgn~vu+3tpk=dTw*b8)_E4VsqFV zZkD`KbHp2wXROAkH;QMi#)f9uD<@@R&9a#>GR<*sqm<+to0^-w&CM;|7P+5WqJEhEN+}^BsmF6yQms}SbcQoJSy-V^|)qSD&$~~`ijDi5d%Qi(NpDiFhZ}pF4|oqWAM_qM z-ciYKZ5(S(c~g?#)_Asg+&kX*Fe zk4k=L<6}+F^O`SsFUa-njgL29^j>U!!uy0=R~pskY45b;cQtCwX>S_&JN$PwW}3d| zHv=z_>pL6!o3q|*bIzM<&U^DlCU_*MUoyOfr!xLs{@t%;{JVqFrL1=b*Z26lalKov z8^K6$CTPr>TQgo0_a^*%aqnKa*TVIE{{6VVKPWG>@${nK_9uhUg|q(NK=}_aH*5P3 z`ukqZd0}Bs_wIhF^X@e@UH?7)L#P?~56hkRN}9IvKL3$dEpG|$e82xF-uYC;TT-@?=tS5hVxwgD5$elq{p_OtKlZxmy(IZ5$-i89ws5p? zhrj3_4_@&e-Lu_t%m1kVF_gb5@7C{p1#{{7 zFW{Y@#(O@Uyz?`X*YA8yYJVK>crkE;PojOS8+uy|UI>PQ4{y!z8a@AnUqvgI{nNo` z`Nmnxulds``J6w45+Bb8fh~QR4RZcm-~_KoJMtfWp7-mh{dsxYLhxR^;l1eF8NY$j zF9gR|Uk_foV&MN5{i)#PD<*Q^9ehSgz6T|*q2!^}?+q@a_vd||Z=K9csO5u4TC;%)S~J0(cB^r*^5OGAYv1I1_B?;I(ro)dqcYQO zF4m&@bR(#ouSfHhraDrMwHXuy^||>doP3isb;67b4YgFAsm;s>aelF;qI#_{ zF%)N?XkCn*1GPq@hE`(dNE9f^Sx4((6z7lDSrRkIewrKnwPEj1S}R@vx9v_ICYoe8SbwFraq ztLN%|&<^8b*u?0nDqy2{-(V$qUx?xjPef7B;!utSQO&PKHFU|TK3SVN6SVwzd|GF! zty(jv;>`hG9q(k9=Nj$lT7$is!CPxl)It~JDRgP*0B86>yER*%i${+wHKO{lwqI-L z61<|wCKeZ~bE>_x7?-dTn0pL2jA~I3SJ0=ht*WxT)$UDHsm|4+`9N_3m!f(j zI{w_L>WM>79XWaG#K+>|k=Ei;gf~UOg(xl@J$g(EING6ls~%Mw?YTK=V)SIKx!AyR zcE@hS`4h)ZPGP1oi17pM#!|C&Jn7rfdJF3qZ#dCDKUjo@M~=4V>QQ)HwP%75Jx5Xb z!%H@one-Acx7#(8;VpyJ^q^XyWD-lBe~+vu^UgPM<$jeam&!_-wZ45QyQU;6C| z24F&i2F5>j?75?-jvRaT;1frClThx>`9UnIKxE%KbZ4YASPyUACdlDedtkZPH>%N@ zB?VN(+BIqsA(HTS1XHb=fnUekosyLU{GANWE)i$>dQ=*fK3CsUeg0?y7Mpq{&({gz z$s`%^umDHjTkU#SompIZ)6h6vKDo5G*j7>4>wN5{Wyg;bCXOFJRu4lg?a|sr%=Tt9 z0BCFKGJ&XOfKJEv2<`;U#pq(S-ZzY@hQP2oTbqg6>f#K^NB<{_i^uT|A3zdhJOiSc z`CKN*`o`8wVEN{wnIN}dBbR+NQ%LjHqZvO3qGre2dZQOgaJ+sYXy|2$i;KLdo~t#M zf-trsQWlWws1}zrp_o&3zZ%V-pL!z?WYx%7jom5{W~mWWt8uYfJ-bwE2-;SagFeP1 z)hb9z8wiHE4pAqEfz8avwqCL~GU{1WljNH_p$!zl+tiW*hxRf`jBfvO( z1HwZVBjf0D5E|?tA2%M~_b(Ce5zSf@dy)mBl0Tb%-i`1=e)E7RCi2X|*AkUIf^K zJk1E}nXzRQI$@sQEWRP9F3McWtQuFK?nGwC=$M^s2dnkE)yY(|HH>ch()yL4LdI8CV6X(LEMUWRDr?8x=+KuwK0PYo3K~ERr{L-Ri)P&sd+vi*Q zMiyfMeXv4E;OZl6@}o?oagRB^;SD1$RI4+MS_nk$1KLmE-gn^}-hsq*EZ`acoVP9O z#++*{_oz@hGdIM}tCbcI<)?ia?9LDt58%uE( zEFre0+wF$Ru{S+5BND0mm~hI~0+M(*S&^9la!Rr)f{8w>2vK<+xr_M9`ZyUgXQFTT zzGa%`H8X3zZCd8l(VY1$+b+GebF*Uo!!ilP12C*cP&*g+Y7XTCtHKrG%E+p;km(rV z#!hBItOb7dbyKfSWGn#8hcX>=*7Qx5pTzq4mJiElb|_MZxTq}yp9imGYheGQhfj=%UdQVCo6s>I^VABd91>V-EuVnStE+3T{IQpT? zD@J6H6oi}nYzr2YOXdnoFtg$9-4Zi07k~|Z&Ih6RH0B#KYm8?iv^7wcy<~Rqmd%{^ zT*vZlU3bouxyAZSILj})6?`r{QrRt1z9sG{y)p5XUY?R%wHAW7eG1p= zB^H`c(z^9xyDj>_+F@@W81`a2ta9k*glK;atq8SqOviA9+Nnz@BmErs3?*0L_aKup z^@5@Q{4$w)U;*Z{$$u;PpTqwg%7N_(L(lsT7`p8jg8YI5_OJiDVrj7aA-@R5?iLJx z%paB-B}qq;+IR-`h*5t7Y#l?w{)>R}@p$tfiSBBqQ*lA$Ho`+(fC5?-fR9JWNP`)Q zvw{)A88vAnLZ_bsGQ7^>8=6od`uYB9_6nA`3husYV>!($U|ZF^Tp_n$$+Z&|I))E~ zAI|_m&DVj}RW}+!eWQC_jD{~|2n2p+DWg6Rl@>-;?2e5q16QLR`;vf&+zp})t7Sh6 zpviag>NLo2t})geUvZ2~$GMbI&x2%Ssv9X;M4MJO`}r#d40=vl*2{Hr(Uyg+XH3=Z zJt1Y=P?BIsBlaL7H|Q=rJH*Z5VJWOJPvCKxH#fVI?s#@PP;fZ?f{S_EKf0 z)~cwbR^>EQ7P$jcL8aGxC2C6}-4bo`NZXn`yu3qTZ;u$2{B{slpeR)!!%@wwEDxtO zQG9-KVuyN>^CF!8cI3P}sj#kZvpC;Y4PRz7&PR(nLslbuR_l<6VUN!7`|{s0ZsvR3{E-5i@)C%sDMnT0{@E9sP@~pmi?vHa!npNcD+R zrw&b>I`ZsP^~om=JacI3pxVa4Jj8Kq#4=U=;9PwsfQ@XiHeGMjql;cSg7qp)7GP5P ztv<*4BULO-A5g@$wynf@h+!>gUur9>xrdKFaq?-tdCGG>didEB#}1u185d71!9LOq z4k-nLNkPkdpJrb^!{jw4FYxhEh{8Z~SecTw_sXeRYWgB9QsWzq?Q=T~s1_ zi4-QV%r*Nhd_yWrZr(L52w?Vg%e0whZ3@d^7$P)ZvvZDNgQW70HH(IAf}xlY*si-d z*Tf$f3^Xa0USHP0PZNjGeoQ~6hMHScitt3qjiBNK7 z<0{|1$_p>cEP%v7fwMlF5w*?s^RJ?Xj@`-6W)EgA8QnJ~Wg_>9l&3DE>mnX#hHrQ! z!fO{c!x<8h^g~IJ1Ky8sNa%YRH26hFhL^dV`C{gI=wxS2(m%~mjo3O@56-_~#^&S$ zA}+jPc!gGQzN*EF?)t`sN9Tf8aA8qBHikEboLcjxEt%za--NeJhA;p|RUpmeqmA}V ztr0#p*==INRV!#feV$2$$vGzMx}ucmZP!mHm|ttOTXRrDf!p9z;P#7E;LREJ-K_sb zBq@*+4B|Y*vMS`a*qjbkoh8QE*f(Jl}GVXLhS*3!#_sS zr~es*S?GV%`cml3EkKe5{5gc%S2OFvQ&!mIUdU9r4&>pL9CBdC$l1ai;oV#*fCWN2 zZotF2;x?U?AuvnI$eB-5vIemDdFHlcRtu2Nik+baw^Kx^156n16c&c`n>)j3C4=kY z!tiS8O2#j|o?j_NBb}1(UNTol@oWiW*w86q4CcxRMl=FAADR+4zX6OXSkQtZU_3`K zEB=f5P;fvk8EBg)`@pEG$_Ca3$FO`K+-BK_5sI#AbVOd7Q(Xhwg_FbMU*7 zpO`2M6;xL^PQk8A$a!1q34@>HT&Vi=WXkZ>PxAiu^l}oNo}6vY*CxBKRezst{S=be zj@lfiSDaPtW(v;U9nGK#8*Vk2ovqK*X}!j?33E;6$+Os|2e};rj%OV{|Lmfyjrwu6 z{k=#gMtc?s^;MSsJto9l^`lIFjLF|c;<-I74F(HzxUYvqdtiO2-eApPjuvhTZM;&i zun8e%U5X~Ag-u-beYjc5k7iwPA;&0QcaU?9qB&~p5WYn&wn=yyxYu=<6|R>+1(t9B zHV`slP2r>I?C=^(h!QhLlfCNMI=V&>7?A1u(o0DTh-we^-{&O>mwFY+zr;7Bm;t*- zVvVxCWy9`a!|q|j?qS33VbbpLkh$Hu3N}kdOv}|(D_8!Ov@wIn2Ruzk=^V$0@;FNgbyssn%v3 zdEW6${s{D(5z$~qf#aj`*x+0XCQYdbT@#rmE;SpA)kM&va_iwv?6x4;CICQrM{6)N zN2DL-`OV@RQiADeFp0h~8kvz;W}%&ce1gfC`ZvG%vyai16M#%uY8}b!6m<8SStuul`h;Y5JT_Y`c;jfK zrGG8Xao7*)fBR%{V~Z#)Hm^8~nVQIJjO)&y`Uhx7CQbbub23{3WIc4@^dQVbGe@`J zfEf}^v`E))2{n!4)kN&?ifpoAJ#lT8FX^KC02j1yi)8o!zJi&UT-bOe~Hj#Aeu16yfN1`1pCCI0g zV#kU7+t-1}uHkdTT690dS2dUj&Xc+I**xhKP``*Iw&8n(ex}Jok22hv2K+3ZL@Aw@4DjCoQZ+YP;wQXKqke0*fY#RwqU`+ z0Luk%JPYj3`VPLp>BNFT8^y3^!9D?r8Fmb$aB66b&I?96SfLH^mcjWuPAB^zI+5Ni z;gwqArR@9WOMr;jMHs@&yjJqYB6t*$3LKbNhYG3lr;nuimeBEB_1T)5U$iC`xwT_1Md8u`A4%2jsi4rKZn za6kIN9ibWUm}31K&}|rn{0I*kKsN)Z1G6DKf>|IP{DKR%uvelUe1i#NE%q^1`T@au zftE;tdfFR^8WyA?px#Kl#$zM1bu554T209W#d%)`h{Qvw6h)p&&JdSFARR(`sxTQP zfi->BK_XZBVcx|zi*LAyqz}>HuJVns46J@cI4UU_wHb~OYavHv2Anoao1t)8JF-^u z5fx~Hl?kp2-{|WWN}-NKu9U-7piAdq`$L;U3Afej{quOa`UNDX6#dQ<#Xf`-G-MYA z7u7#PF18x2>e<-Uq?ln!VgT~2rw$!`PAoveMN&uFZ}Z`Q#Y9-=zh>@c{PU9plsi$w zb)ZTL2Zd@0I2MWxSuI6e>+RxO%Xh3pBK11m0&^X-PV5!TeHt0yC9oGJQDEaLtR9>& z!A;<8*B&BP5NKtvdtl;W+kmKpDTQUiT*;#>4}-yPqA}pnzrjBxNGx+lh6)l#kQQEw zAX$iFvojCs41BI>$v)4$AORwbN79OU7Ix9~u>1!&PvisiG8WAu=BkKUT9=e1Gm;{D zR>SbrL}^{z?y_3-%j_`$bUg`Nl!Kc~-M@v$I_X*h>1|oRuCLL7WKEQ}!Ew!e>6<&Z zDn7wE8u*aH@-x6?{bBkGfbf%}wsncf&8dH&AgJyF)l2bh zgCKN5996<*8N%@=^7hNW{I#aqwnLq!asM3PI@Mh+G ziPQm)KUbw^=`hM%m}o=bCbUghlU_upwAol>+JDc>V@P5fF=mJlR4?Pg8&Sa=A5qom zrCG!RB626O73si5AD(9MTqTz&OX{`xAK0+ZWKb~vaRNgb<6zTMxv!*ST5gB$I1H=DYzT{k!UXh35v0!7)ElMj3 zmR<+Uwk;l1QUctS)B#C_Z8S1h3&Oo^PzaLXL~$7)r@xDCXiJBweh+zA+QmSOK#l** zTP%Z;@}HRRE`<7zyp)OLQYe|oZuK|^LIA7W@AJ__FprUkLpeCBUg85X-`z=%%S(%h z+k%Oljz+y)Kf^WHiMq7gapn=80L|Tn8Z2_rwG#At>#vs|xb=G6*zmxLn0Nv4KvrZ6 zGAVt9)r|IGtPrhbse#p0{}pxgz)VdgIj}Xu5pwfO>_1VBL~r@7TlX?0cZT|RcmmVC zo**MLEz*p1f(W5wnQkr8{0{1Um7O8ZJDDA3+1)X$SUQ96z=yEOPx!+~`UMw%V7VxeUqUmy(>or6M-2uH*{+!@0E zp{OXDNB%PKTucnZ5iP4CDt*?toVjdn%d8aO3@!M^Huw|p%!a7EI`&%THRCn&wd`xw zEP~4X+^bGB4o9d#pMwZW8>3Bl$7ZxZYG7RkZ5GXDi(q_S^HN~suVR2&X#aKQeuK#` zAi2S8OMn=|H>@BLvu%-PTXqpIGAZcE-$uJ45nHq_1zm z==;zh()9sJmrSo`_r)k~CIwDx?c+_oS)`OG0eDF?dMNz|qYD!EvcS=8gY`#B&%=Akij1%l?ST zaV8{6zs99_92pmKlGa?)l=PcIA9N@YjbU}UTC^!JZ!+z?`%SZuEE+Z3Z><%S*ITv$ zK*fvU2h%kCuP6}$_CdQBz&%sCZK*d=E;@N^>o9R)Y;PEP1_s%Y-1QDLFc_hHPZWq-5VX3goKVxpq+j--!@pkp+$gEX{2i`4=I(E{4*8$E( zn-3}40enLn&CN-4&cV!!FG5d%*A!L|`k*Z6_@+-yA6DQF^?X~(b5afk4E8t#bD%um zv0)RSw>7tob4;UYH-E)ig~1e52|iWi^Y9Nr&-h!_hj(?=iQrkKClzsBCa9OW>e51Z z1(A|)by~PPL^{bkj5UJa3Vto^-J+#>wTSmZxm+FYIM9&_9mqc@&2xM!ZiiAdsNe@M zC1S+riKW_#5aI?j4dJYmaN@#JD@1sHK%9ZMw1%x7dBoRBjFupM9&&3F!VY38iM()A z+6Y0ymJoG;FBxTWo-JjYwF`o)VD5r+e}PgjPtRc;k=CDL9b-N=&I8MmLeDv$=7#aK zj%yZ!)Yzcku}adR3Be#J#f=n00ZHB@g56^w*`L|P*Q(&ETsjM9K7Blj?yg< zzDl^WR*2~b#lH6pKp|-}y_)X~LDLz=m(mDe>x#89+8LErOK4*RIFXYQ_&msUsqb9LCHF_r3*do% z#?PL~t`=}VHwSoKg?vFsVZ_&+EyJNPN(&x5w8RM*U}ot_b*BWnV+TebM2Nz1 z`Xh)rT@!`yCS@Rv3Ih8Z)PH9IL0bz6T~tv2mt|*=#M#A~ul}Fp!lkDA8|Lhpr6w<^ z@ex&k3BLMiURc-?))X9=81F%TTuk_(@VR&coa!lq)P6s2q`v}i#M^WZ0SKCLb?XW< z)8sF<E$qr>b(AU-Wz5ZhJIs+(t*qKUQr%_wF5!* zzWNyq%PZ(2#8!BvUPM3@+ddO^Wkvk@KEonBdFC_u*aI>+lP<^tR$G77SwLWBrKi0M#)$o4>{va4ef zv6zKuo>|yP;rzvo7@G^?MC<0Ja~bv1ox)171$BYp7Z@AV0U$5NdG-qCakHLV^lS?V zi-DkwEXb1{H+sNvYxMpvSSF3T!qCJRjs>HrEmHXJ>Ac)zxw^{apRsgnY$6_5BoNlp zqRF?IL->fcwRkpg7+dtb>;j}y7eS4Ys?EU6x_p}#}Gr>L(TnQg~}+4$yZpf&g82|Qr!Y?@v_s6GXp4#P(_-O&cOf`Q0zuf zU$_Q`MWKI)XnO*!m2IGDmO%s5HpUJ6ZP%hb6Flglrk; z4OE4XgDCA>LvWn&)7j=BgB*Fq84amp=HUZ zSh=^_w>BUA0V@9rrc}JQ$ySW3sW*h-2xhMIE%O0{lVfTm@>Rv>v7I2g zAREczVeZeXN`Uv7;Nk%3(e{ai^icOBS3`jArU*nRGA=O(nU8WRI3@ps2>I5Jz_GyH z8PLqL*nE^lWM7t+NuVcC-M8V4n1~!7QGBl$zP$qe4U(f3!@s@)t=ZqOX!W|1J zv6o97>hO>&XvugzyWpF{PA`q#kkN{JAd2BL{)DnW?6rylo3!A~d)v4ttrrHDhw6Ugo z>ujZtNZ~ZHn1Q>=oeIpph$_Z=D(z{8eaAW378jd~5gePg+zMk`3K_yCTbI&(oXa~7 zBUm}W&XZn)y0P7Ng%dDAgAg#HxP~38*lURm+-kopFgQzG)SDbZ5U`zDy@%yFDN+nF zRDXvB?jlHn9)kvm!l4T@P?H&$`+f2R42Otwb<`-IIgBE;fw>(>;t}Z!H-PC$P@8yb zGmw9+j>>F8M}J6yY;e7#HL_ehT&hLSg!%Dk+ZLJtAGVW7Y&wZ z3k?<}*G<#9=H!c4i$vsW>JIjzjAX*logGL1RBX@7rusN{zV1i!vD<`KTlOu6$U~q{ z@&&)0>_3kk^mL|;c;6W!L;4v(rmM<*2^XE5DibNhxGS8QLLlS+ z={kid?Vw(1mi#EUJo{7-A*LL2i|zMV&dP4Rsouwi8=ftI%``F(6=+cvP~vHzM|(Dn zWRKd|NFVAwIVhFoO2Bw8>R{(*WmaKx{Uoe2@8Wddi6pl5wqu3EQZnjpCR_!@=@&^C zl{aC&M3%)FFFhycH(2^>NU*DI7i)Lh>}w0ht|Y*>8#xcCLiPr!QO4s9r`Iwpm1Aux z+A7c5sR2?CEZ#_IltN}=m(;~;A$3%?lP6U;mp@F{+>L%(!&(ZY1V}51>o~BoFshBw z)wHfqf^@U$KD>N@tWvt89Zw{>yO9CpWS}l^D;8xs^AcjBki%Y8Y_S5=z`+0q;Y4n# z{;4njV5UBb2I`sPBiw7a-Yf}ra)L0~e7Taj<%&S*t+!-ZCbD{#yLHzNd`t#Tq|g}7 zvHvQ^UPgzx{f~bxZMC~?30q0E}YS4Md!G8`q1KyZF?d^8p?(1T7=F@A6x z(gfU#6p!HR==KbT8d5HyH|jQyhwsAJg&s*Y0!&4&I}3U^?K?6tI!@l`t#A~?!yM357Ay&g;zA)^&P$?jU zLkAy%unf^zdR_o&Q=MYnpw`abZe7BobV#ef4{RAX?pnWUPQ=_vnQTt40#w>?P%+Dqc z6ZJkktjH9-4H6?Pu&8-c=xt0W6yyM$ouY5m{q)p@^x7Lss=*e}t)wB$9$Gq1wyR2betAy`|^P>*AGMC#Vt^x&!cr{iSB}B0a(s3E*~;OKEs5 z@!6{HiDWt`8ho9&cMv@;W>JhlC9gX$bZdM}OWd3#dkbmWwyqWtxo2NDv%uTy z6ebj-`UG8tyA7f%DKzDGL01~pHI?29*AB#5?5V?l3nHi(V`ZB%^=#5Ln!ikJIi`cy zgz#%1f)!68?#2PF%ZnL}L3-BmFOfsvg!7UWH+lXH0K3-E{5PC*-3mUZ<{@k19FY08 zPpK1;aM1O9@Z)x~avEA;Z_krpML4O+7!I|N$2H|ka107$LgjF~Yp6JSgaYgFRIHnX zgqKQ*r*$J@%$k7vFmbWa4S~Sd^%&A1+lC}Lj_FimOvp_%lj=zftR829$%r3&KVhv) z#i@8?;1HwPmLN?$s)CvwtLo{QmNL%6GZDz1Rr zr5;r@SGU0p;jqsbFs4#^8LE8(xGV5?NDTKCSnr_KP|6goOn`k)KeShN2a|J?_oplX zbY0V$i3AOvfGOe;X^}{wSEjO?`zR(J0giw#5P#ljlWc>ZbY&~MVOB{RlCsK?gWQZM zsu-~$2oW43+T9KB(I~>!)<8#PcY0PAT7IH3yVR0xz|`(!?}b(t3E#kVKF^Opda9vg zTYRL_Zed$C=>#>*Tl8T7-?@1nhlV9B$gPy!;#NAoggC6*owcA{+07un7cg5dCarP_ zq+eWJOq;N8c2Yl@EZ+%Hbo*AY+l*el8(X3BzV29)$(jL*c0WWeTGL5q1iQsu?gCYK z#)o-119X58s$JzhYVk%^yx%xN!@t0jhA;v+B|q4uDB@qGtNUS64Zgt6Y(f-LRlB2T zlTMi5dai7(lqS;cE;h<8-(-&#@FhcKUL5K#1KD3h9Ps6}n+&DvFkJi~YHADHp~22F zcI26~v*t_X%<^5g>}U;Y>#E!BMAL<)^N?8#x@Xp^%Q$8Zi+-8;0mOlQDms} z6RyJNQ4R4L6TcF?o4;AB9Xr!m~{aM`> z_Vhj|wrPNRLQpE`FaCK_JW40Cftx0C5F8lJsh&gv3h+MWMW*OdfC~gP%7}J` z@o)sD<$byX=$|%-tubw_OA}6@2`x@#6^EyAJZnZBK{ByXZO6ZOe1^vo>a*>-P4{WU zyZFFEOsFQr1;HX({?%3%Ze!9z<03DyfEjTW3e@YNZsxU zh~*m&Mo^XuMo}l-HMF5yT9#6tZ(@04i2EB&p0|>Czj1$KQ0|s(@;9U2Mt=+6;cu06 zo21)=O-U`+-{IeeTAOjE%HE{rPN{Qy+E>34Z1H!YPg^lE-9J5+t#t3rmUuoe&Rf~$ z-zm@C6>Lx1w*9;Pd(id{oc_xm=sUUKHaum^*}s;z)4wmcJ*Wi3tikqh&-Cy2_u#o* z632Z9MAHZ2-d2F4hui8v8%`%$Olys&uqhvIFyyD;QrE|VZV>9EiBnQk6#Pt8^%t<7 zHy-CgV^~+{r^~t*(Fp&Dsfr&0H=$1iwifP?V)Ql-Z!;ET3nVy7_7bQ*jDd_BPBuaE z93NbP#$Q6D0(r*5u-Xqpo4bJB;MI}V2%;8^g$?*3wt-Q|QfftGmmp76M?imZS0Wk_ zt0-lgqb-c6n1gJzP=*0AQ{9?Gk1y{N{ZQ;Q`q&g4YJ0<>BM^*d>la|jnVF|^vZ$J2 zwHxgD^B6Z|l|SSRahgD6WwuIye$S!x&d2GG6We-Gecr~PRm0h~)Iia0HECC!BC0>f zhbK1S^0_)mRe zj}}AXJnV#wu~U#SJ0^HMV#%=YU-ky%4xQfdAnIBv4DCtS-RFI}1~G zI1Za5jM%VOnuO*{##b^wY7x%UdXQco2CRu2MC}p@idWW|ta<=SCZ7~6z;kj4P-I}k z685BCLVOMm8p0L#-vE#8spayK)=V1*z0N=}OO&JK;$-D1*c5sFNJU#6FQc2wla+A3 zz0~k4(?Mn5L7ELk1%raO|6p>EuYMBLp!rAzb_-#q5`jaHEjBVi&xzgVdEDtCI?3dG zPD~N%3$?(Ja4@vXn&JfXjN(Q%y@=hFjBn?0sdWfBIA9AhFHnHNY+`K|cmMBjmABz_ zqX;&^p)LqS(cFk!%0ZBcYc4bn3DlAABb=^C#+`h6=2bk z0$3321(Ik{1V(#W{GE~ZAQGbuo_v{Q8+iUjJYT@`0GICb1qh^BIFDhJ7IHQ;r4C|5 zJ%8_VS!9ihH~}mA4BKUWZfzwE=v;o_M)0)H2AVT_%}uz7{Aw>MpHMXjn(8#mYE0zq#7#K@HYG6uZw-$BM!>`=IEcU?RCZw} zmChhreVu^$I2zWGQKKL;j)+0r6#^0H`e>H%RCJDrj|c=v1S1GcNjZoX&VKmjI|JWa zcV31uMxovuAdb98c#Adld%)x`NnI=!|8+B3u1=n&*7evA{*AyxL2 zhF;N+x(Eba>@V;R*l7f`5%`hpiApv$)dxXaC~c42j;AcT>(>M*k8=)7XtZdSjj|4w z2M{km{7&dL@xB4{JS8%T{5$u}^63k+ygo$Fa`@ z^X&$F7+r<%h64q17?=PTjr0(Ytus6;M0_o29NwegG0Elv8FadRn0--;OwKZ)njKqB z9uBkyFm@zcuGj77-JBu{?@pfE;+H@8P5?tkH>}$pwBvRtDhAGg#+gK-K7{cw&k;dC z^bZ=u;{#iBboAe#BY`kWpR!Oo7h{82-+-+J`;=CIgRsc7fm^Wp)M3*9apQ{yWAU+z zu6K<%Zae`6A3>AyU!FPzW{UmGzFE&)qVvFAMKA*5q2cQVPCrf8mbeo>2>TXTHKM-q zup&JT4F<7WtM-*l%68ET{mPKfUt&Sl8ni**;nTh1NT`z~F6$#Q9Vo~{gsL#SO1vU*Ts z5<_$apFv*&OSAz2mZV22hxJwhNQS$i@Ik7BN`hnkCVF-7Qy!2y!$oS2tvQOZiR6rKiPn@ zd83FUps78brW;0rhY^Xogdfn*KV%Y4+%I-{5nT~fgflE5Q=i_wU(WjFVQ~|u@4vAX znDW*6Ivx2@-$Tik;rrp`VZYN)|M~KdRF3n91`;7noF_qLR(ob@x=Vu(vyszN?N)&E zI%jbfX6jO^DflD+6@fokUvs*Yi^CluqBus>N<88BSN2bwri(*Me^3}$8SqfSQI&&j z{cYdfKhWeL{WasoYlYl~-^s|6CvP@#O~=|0){10yT_K-j~#`*EaeRGEWX z2nz(;2EPziu|zIGTbw%2$r#xGM2t;N0#z^eb)Bs!cHJAo zp`S^_&JF#ywe{!{`^{Gr@v|4p6YrqU`Z*kCD{+y72Zb|mts8wv@SV%}##b4WCo>O? zKKnXMD-glqK6>$o;3C1sM4q(<7trRjFe-8zr>Zan4JDPcCBzXR*S^n(qvu>^@ji$E z_z&lntqy=GXU`dGKb`}FrsE0*oji2&9K;G9^O{Gr146ZN-^AM{5g$`Xc4k<3?%A`4 zus6g;#A^Yw$$cVu-@Rg}YSM1?>>)V7u-649qyTl3cXaX#g|zj~(4{N`!(028w{)L> zDS7^-kKoPS7GC33+QvsRtq}y4yBEKb1eOmWtQ2!gE1pJ09Y&i~FA;>Q zEI=lMBRjlN#;KnRsy+@ktW!u?PPZjO;GRqm_gF3^HqFUo+pQ>2(h!@EhX;PNX*oAJ zjRP{5$DZTiv~rkn^2=l}h!w@LDYAa-z_lCF z|Er!rxq2DZV&|FQqPC#baEXRzc#FsRc$*N@hF|AO+7BgS90Y}1un~TYQ=b{~PQ#iv zEWb15C%-y{FrkpKy)Xk;lSz!R#SG8rSK`Psw9Ej&Yih)fSp070;LXqt! zt%si{Qc~f9E2toQsl~mlH*qp1UH@1R_kSTe7)m9N^p_ZRT!GMaRB}^!?_~5!wKbNPvpwg|uX7hA7-lcwCcZ!uPf?_b?MW+tl4mI#?{Vhq)Ez zs8*>VCYO2HX0A8$J}<@NdJ=bk1QLDtlPJQzml1KVVdl8^1+yndahg`?s=1qIUt>=I zLj7>+||vMnZp`fhXpmw;bfuS;hj8U$g_Cncz`3v&`LlhBsmX-D4>Sfj*V?u83 zJv2~pZ7iaGFfpG{MmQ@wK+ZL^%bEKGyvg-i2%1a#CvSL~rHUSGufRk4CwX+d`Vy~8 zaxJ^TWm^k@(%U>(IH}KShZeULclFWo+gWc&>S;fp#vUS*H!8(E4Tn0x_A(tOuB* zACvuTW_->4$!Ub8t9SF(#b{)|I&_@75)-)SZ%0qYWH(Miy`S}5>4V1UN2NeaQP|vrt(cFYKz)$O z<4m4lLjR`bJm1G0g<&GkKoL6q6Q{WhS3wa*4^SOn#Qh*O>ekliy+T z2TZ2e)aRIdmI?QGdAl?j(6*X&HFhp;x zd%qV}?``Q8>bdIy0C`p)0~S_%9P=MLj{=!+dM<+SA8EmTdsA8W1#d@>P#-c8lghC&XExDbLT;URc*2FlK?gR7A*U3(e5na455lMp*qZ? zFmPO|QDKyD+dexm4wWj;31Ls9>}C7;a^9zwCkiSnTN6w%F0&Z@HzzFP(DPMBMfpR z4(wj>97mEy|0`Z`+@``5ossN#bj37PqsU(4`{Yr0h`*9?S33xR=~OsKp&dm2F9>_D z_`~JyYHJBv>NMQIt<+U%oh}O!p5a)!6E^T;R|pzdPAkx`x6>!uMEa_%fw7^&Z=Kn# A4*&oF delta 698 zcmaix&rcIk5XYU@?Y8N*v1v*cp>>O;^cUC?Lm~%bJP3&%M2{W}E7V%uw%ct58qu~; zBTD^|Of?81{yR6n#T6@nGWH!=YYcw?3bIdEy02xIzPLw@Tx|caFuWw-|tbNf;|D*?C5&SU>-mEitajT z(}Yum3TFKcn8ok@5ow+R!-Q+*@x7zqs_=7^{V}d7UGf5tw5*1jOQ(z*@@WR3NVNDKnZI2Eiei-^GMG-@YJ}aWzFU%Q<~u?`*n;2 z!?1v3!9lo%bHPH#KP#iX_i*1mo)ESDuRpy9)_be+64k#?IYK*U`)bSB9U6xfoDB_o z9{eS)kbBwO2n_)%Y~ohm6m3)CFVY$*LxjiXbYvBL&*;35Fhfu{qPyEI9$_+;>wdx` zEvv2?YStig%a&DjJ(EitPw`dk5G>)>Sa?L_(`C%T81OlRor&NCf$z@keQ|v@ZuB3sh%^nO IiE{GXZ+j`Mxc~qF diff --git a/vllm/model_executor/models/__pycache__/qwen2_rm.cpython-310.pyc b/vllm/model_executor/models/__pycache__/qwen2_rm.cpython-310.pyc index 8b2d8b0aed8da1e351a6f7b160b69d86d977b7f9..01486a9de78323831befa274d3192e039afe9331 100644 GIT binary patch delta 62 zcmX>ncS?>spO=@50SFA&?%T*6#jN6`Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrlcTSEwpO=@50SGF$HEiULV%G4}FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7cu$$XF-0HeDV$N&HU diff --git a/vllm/model_executor/models/__pycache__/qwen2_vl.cpython-310.pyc b/vllm/model_executor/models/__pycache__/qwen2_vl.cpython-310.pyc index de7b1b984d61675adef4b348e9d1a0f9763f0a28..21a2a47e857a46b537d7a039fa8b20a2d9d3a638 100644 GIT binary patch delta 2821 zcmZ{me{56N6~}Y!*z14+Uhm*ls6SiH5g$&p&1RU z^-NUv=?A>=*qAqU(1<1z<|9R|<;*f)uhg0I$D%WT4VVUAH`i1}Y|2~E7wE<6%Cf9P z`=`KB;B5*HyJ@!ita1U(x9F9cN#`4o3E&anO{%Qj#Lm-Xtyl0#PpSFc+9+c`BX^yL zoukgW>SY*FRd@*DzW{y-{0O*|LnFgW>4my;?w^acn#+F$^DDqRz%-@nKV=tb)Z=3p z%_lt~^=0~J!+>%b-VbDfvBpnEe}g6yP;LAa^hw}(7#!S!mL0Z3{TA2<90ooBP6Fs? z)VcJrVgm zQB1l(h=QC7o2#gzn7=1ir^h$V9P<{N+)X!??5fa`<|X=^>k`J3n;};MJ7VQUw3HF$ z$Kd)Qa2{4iDr}5LgPK03MYtX2N#GoSTKI9`UEoy#OBstN$EVW#BAse3X}bdZN5C%N z{}%8k;SCf-wQwXDiRnCy;6KuA^Q+3AA*boZmUQ(eke>>uc|2=|Aqe~hI0^if#KO^z z)+duv>M)-ni*S1t#hm=)ZMda-xI1cMII=FV4eL>7u$!2I|T^pM* zPpr$ev77W2l9q+sVp0D%Y1zO9@bk7`vL(= z*&7}gb@7F;IPZk>TS)h1bj;&!Xe@W2NY}(I4yI#=G=3UZ+&6V0chLIwa>pX{mUXyj zce}~T$l0-*{OzTyvPR(+*~$ZSkfucl4561NHgqG%Cf^`Y7l&*HY$yS)(*|>vYYDeZxTKLrhUW&m=02d&qJGZzp z{ETp@g}fRGv(-YO%D|#nB9$?Mk+2aC?oDz%Z1B5##V3%k6tO)}06npJ6RV-in`@ZE zyt(;(`@QO2{|*FwQ=mZHwREl!O3q?N|Jbe;%OhdCJvcRVZ&Ut&U@sl+jx^SY3^>t- zmWarUs21~DWRBh&7vU_ncr=a=GOJs+XBkJgKLQLDgpEr^1m) zEHS}tbgZ|(xe}>70;d_Tf|k>|TlN-|jpszkQCJbP{YPPkR?<`b6;#uAp9{J9YM@m> zE#r9<=v&e~x3%&#-G_h&L=LOaNKR=9oLp{)F&FRw*be?OunNt;K{Z2F(i?p%9P)6q zpxsKdef3V6_wML{rL??fG5PyjoDGO+1mrx{(%1W+v29@Vl&8dO9oTKNB^J{0o!?*| zQQgqi`VIv8ff)>VMZn4zPh{9IxTWlmr8D6;_rjG=&kqf5yxDw2hG6nV~pA9 zJfZ%3YPMjd-f&2_ulY%TpT$a%`Aq#Jp9VA}z7qUi^E1;nKcK@XT`MmTd1B0~1> zhx7K^GGMmuX=KZ<3DaqNHo-;&o|+dkOh-p&To1v#OW;n|5i)|0vNd!o_?UAIoTESx z2$?5Bi^qE!IglCwkpmVb~&YXVRT8L@5%D zvlzV_UE|s|&l!_Wvm$msvn9S}c1$+0GF{jL%2ZI?mPvjVbG37w9-Z>B1id!3lWn9$ z@xdcFwE<@$tZR{AD$K=y@gpFeU4>1;hZiUn507hBfw;Zt12ORmx1-`DhP(oG43NK@ z@be{5Xz*|%ol2%PJ}cT*!8Yw+7w6(hkVi!>a-(p_B@-VJ9;d5um35O#Z(~WbSNF3c zI4zcv9Gld}4a?PcKufF|+P($f&Mo+yrL&ucc z`J-b7Y8?_j3>*ONp=-uAM;W9WsG!b_zib7hyhZp#X1@^|=-JE*tleC{Kg#|K#aX$P delta 2750 zcmZ{mdu&uy9>@EeX)m?YmQvbImll>sDZPD7n?C3wrL?rjqtBrfm{O)g=h7KEk8)-P z#TN^k&9Y%P`^Rrhl$ZrJM#T6CxzPv;xaex4f{KVbYXn^IwcAxmNLJm7=X<8u#;pD0 z)8F~M@9&&*?;QA&9{rMR;f##5B>A`N*KNS>^@T$< zmDN>_h(BsnjCzJfJi|uB+>=(HPcHMh`9aEhK_(CK5+5v{pPLY| zei_&c{GG%3b{;D}roDva8GdBZ_N*5nhJfD!f8#kNchG6xR^pIsPR}tPFYyt*!ZSKClD0AGin{0uD>WQ^K*RAw*ot zvi2bK|KKMaFK2%QQK>Dr)O)Me(mQ;vs)#<~it=(g&vUDDCDGKH>QiK!GD4nNGv57^ zXWfJ%cF~W_n}JFHvskLRtB1z$<0)QaH0l$-f$16GG!NDm>^=_hJn(1WE#L`>xVBXu ziIIqSO)Y|k7&e4%OEiBOURMA#@$-eRN~#>P_538k}Fdfi1o5}`4P(D^ybYg|6kOP0kU`wGN@YUFm4U{L#j>Pny8xa z<)@lgP##}z?yi^&P8PN35knFhkS8Iht%j)F(m33*hYHNETgphon1r3@xBh{~`RUfZ zwkd(UwC%pc@C%V>Hh_nArG;Wax7vV+$cOe9z%0Jnc7}?~BP+Y6%=%~NqNj=+6rTxX z1L~X*YSSUC&Sl#xhZa7j&%EK1Pa4j&^t}i)Gcg zX51AuLSA)c^$f8Hosae28pn%<6cR@?dv95%21D*3Ls* znZ!{N3m|u*qPnjSN@=wMBAGjTW_3*NojRLy z;m{!Cqg>qae>9WA_X{R4D`=k%>9TMnOQ;1Wt)mWWRqHlm(rRK&HN z{z%Ld5Du6$=DuD!$Dj4}+a{x0%+3w_i7Xu7xMbQ|EFGw%Ib%|F)S5`p2FJrweEN9j zmdn{2px!8PE7Zk4_wT8JueyWQ~Cgfec0ehBaa2A~2kPd!ug zLa`ob1=K*2A$0+2N8 zhqQuwhaaXD{Pl3ReKi!TByK(Q3Mhtoqc5QOq&Q^d4+rx3V_#wRnkil|iD5I#zkn<| z-ZSgA*HCUi>Rj3g-sIcGF+8+Y1o*y@Y6|kxBkQS+Qv$tBIIym)kSAz(-J>2M|I1H* zBr%Sa(iWd4jM0E+$cU%P8ydOOFTcLa(Rv6aFY|+eImKVebv$*gv8zo8`R-2~4VWuY zbz(##{9!<+cGiN86f#?bEkr&1yU<*x+6Wwx#BQijs{#9=Q$x>(R1f%og@7Lg${}rs zq(QO)G2+JZLTci?u$kW^Z91*gt-b2imiPu)#CPVE@T19e7w?PKSDr=`ejp@%L8xoA z1Uc^nb^`eDxqhi$%$yOM#ae8UO}$j{4G;y~5NpXTf~f8W-f4-uzKs7A`>Umict(1j Jxq4?0{Q!}WoZbKc diff --git a/vllm/model_executor/models/__pycache__/qwen3.cpython-310.pyc b/vllm/model_executor/models/__pycache__/qwen3.cpython-310.pyc index 11f7142085e092126de42ce5ebf3fa097badafe4..58765bcf884f20df71c15c1bace36ffecac9c111 100644 GIT binary patch delta 1520 zcmZ`&O>7%g5YBV_zw2O#yLZ6aNXU{~p!k&Uti>)hy`MvOJK=82Fx21T@ z3whyI|FUmABrPh=Uc~G7{H?&cDtuz3DCvy>{;Ei=9dPW5>GD&8^BEZY4bx}}b6K|y zegx*%1?1Ih7H{gjs1@o(y&WxBHP(hv_y;XlR=rHL3iT&<1$Dm5!~nK ze!Lp*&7Mv?`)R({DBQDtUV+L4Q~_(S26ycNufb_Y@i;EgzQN1N70^839lAZ3m{|dp z73pAC0SX`pKxcRX&<)n<2W&<9d2sGPQP6xuw80Qx%&PH=;+*xjBWBI6yP8>a_#({= zJ!A&`HFQbfn|rdkZXcn}20E1(2zm@K1vn1)PvgGcbF8WPx?yC*aHzSut6$6RqGu+H;z>Z9k_2HhWhv7=}F-5t^m#DX-h z)QlUh=2~k;?P>jiu`f@_Zr{KQYQ@rvTGKE~W!K5}cM|vjH{xx*Xz-nHBlsq<@zYPu z&xP?@!z;MzSptuK9Z$^51sKEiZ9o$6KEMZ%I}!lf1nfF|4xLPY#2orIJ}6NTo=CDH-I*9q$)Rx&r`vSN7U7fa5cc!Gvuk34^J6D*l#+-Ti8vvGCI+{mq%moFKyChN0n28+*qdy;&fAwi zSSKKkRjW#K;TR+JTvd^J=2WSuQdPAok|j=@D)qpj_wwc~!X^|SK7Vg!zIijV^M07A z&qS?gw9UhRdq3STdwz`m5+a48XQ2@?GN0M9X~wiP)y$a2YNoo!%2s7!bbKsh8%#e} zRkd}sq}y;hGEAmmF7hY&7gB8oeBE|67dZ?&Qk~Q!M>_O7;k5wgVaIdW<`5_3gzLT= z-dadlBs@D2$LIL#ftt)?WN4RC@hHvlsu}^iY8s4Q;+$TFD^l0=6;2B$?pSn3rA4Kp zGGkk(pP>I^glUA2IHXU|tH`e*%prV+Fb{QUTAD>FAP@gY1Cs2O$q@0A@P9IN$q#c= z+}{W=i)!UYa6zxw7Nrtume3JZ6wOp^ThmQbQQSNt*$jr{kN%SX_NFG0V;(w!novn+ zDr1z&Xez+-b`~rm)nPeyDJV+S;8E;@m`LK*hW;sd8rz7y(?$N|H|LKVd3f4S*HBeL zSVu6>8hkwqARVVVO*FSm0FO&B+Oa4tBV9rG3cl^=$=yOKdQgzvMi65NBEwlw6``5T zodDWa;YG)%r&l>GM0n$Rg&9_be$LNne|G1P40y|q^1!_G6LdZcuIM@SA{cEu&!KCwrXLVNc_ z?AY}-e9=w4n_2j|dy$vj*K>BLS+TlGbNG2Y-UV;+VlS>nBeK4&XsTA$Z90#x3W5b+CbP49oTdq7 z_!o8uERuz&4xtTtI_WtR&7N*dD@1VIb&8@$S;XVYh|NY292;vd+A=^htARHig z5yU$QAbWuD-UZy`ULWyzY<>?cq#Uvdzo#w`kQZ4g9> diff --git a/vllm/model_executor/models/__pycache__/qwen3_moe.cpython-310.pyc b/vllm/model_executor/models/__pycache__/qwen3_moe.cpython-310.pyc index 6aed6f1dc09aa5a79c98337b0391daf226408cff..61a305ef42f6b2335207b611d9d93cab233d365b 100644 GIT binary patch delta 1070 zcmaiy-%pZJ7{@#OM#R*~6hRRckQC9}bY{)U;>N48RpSN;2@rUBIUrVcUC66McROakq zPvi3X8%49Uy3-mB@>br*TcS?taYrpJ!9H)WF&MW7eCMouf7Bb|QalHLp1KBJr2$p^~KyYiYs9RMeq#fJbDmyAEFBp zL&O>E!mvL^JD5t7aGLnjBxaX~9VxzOR79=-QO_{WsGYOa||3vOWL^rA&VeXb7Jb`JZ?J5G#x`cfE9gl17JFLyDQq6eNLmok4PUO9wW8~`mSFgQ=qn%!G=an zhT&snCnMWRs;z22A-905UM07|Y|yKQv8)#H6j6b=4-SKgj6lNBC>cj%0@e*K(Ik_w zsnfwRV~H-4#-Zs$MEf5cMl}Tk##Yr|$AtIBBSx$?%l@|`XfVwdKf``=m=|U9nLWKU4oL@2E{9E+KO08b=A%h?Q5pfl0eAA4$Gd)u0QAFJdP0Oa?`6&U{R5mV6qHq zmN6#gozxkmnG$Kx$@45qSKyuH5E+M`7PCl31O)2pE3_zNM8a;kVEZT85{Zk1nLwca z1bG7M_4drcR_b2hIOT{%ga{!+ND*t$ttul)xL}QtWa_K6T}a+SU6V#JgsYh|Pr}J2 F?=OtU6B7Uc delta 1140 zcma))%TE(g6vn;Nc3S!%MIjXs%Bw)dQV0nKP>d1Tpix62qzlVfN+~Vv^iCOrhKDZ@ z4Tv5UAw*CFMUiMGk%XNaHpZ13(*zU$09a|y$*J9o*q>NA8* zCjBn<>wP=;#!#&-J>~3?s52P$2tjAif8HtfMmxiys`APTr{s@%9ird~2tKc*c(s!$ z#HDPRH@SfjYY@{&V$dI@L8fUpq6Kjl(T<=DuGEe&y&%wbcSwl(WiOR5A|fJ)FoQjn z9zq>OG$VQtGJ{JM3CQ#qQ!x^WkwA>du9S#d38s&$$pHM^JI#37VBt4diqr}#nFsYc z!fly3?w48xUo&gXJG(-C)@b8SlU3W*^cq{}WyE#FRdo4(&PInIEqjgh!>8=yjMl;& zrEcGQ!lX7=Hs8b!U5NOOhF~;zo!o+eb=)+@+(jrv~enJq4pUvhW&sT6fnArzn!Sgc{v=cTuqrsIe^m}z90LE%qg5&Cx- z?8fBF(TE?#LsWR+bP_Rz;FE)I@fGR_ejMx8GjuK z-W4A$!+g8$f2MC{{VdQ>a>X)-?H^;II#C$k*F3D3w2=jBXMzB%lTJiF^0 zr{_4rZavX)JTVeATaEGmMuL%a=3GDI vdxpqGJV&SzI)oOn3T>twG6P*siOeXUokvtef!wNWLqA62mth7PsycrIPTL-- diff --git a/vllm/model_executor/models/__pycache__/registry.cpython-310.pyc b/vllm/model_executor/models/__pycache__/registry.cpython-310.pyc index a3999c81eb7255515b6806914297e3538cc43aca..576a5383dd6e8127e6ff7152ae0e44aa8ae3ec46 100644 GIT binary patch delta 3264 zcmb7GYiu0V6`nggo@~|+*0HmWotT6KiZ`*ne#DOwV_^a!pb%6AA+$7|O!nSgPdq!j zxicH%G~g7w0YNDVmk^+)B!m#0IFNJ+q&xx*QdQIkKPpAlsK5_ep-NT%^hc#us6FRS z$ZpookJ_4V&)jp*x#xW6+uEyIunu~b_0V6ide*>}?d)q-nw7Lpi}dYj4QBQ)II~;MIY-}-a|YOA2K4?#ir_Yt-s{GfO;`ay`KM5gh^E(#;F3Qxn&zwb$S*?b~z=1m=wxSHhVQIr;%j7eQW*zX%C5-~CjJRLZWJJ*XlhuiBdQuBb^5Y^7Gy=d-SP!tLM%7eW7t60 z6|TzYFXbUSBRpiA*&Wmz{;OzP@lbO~D<#P&#`cw%S&=2Kh_tTioq~6N5%jd_d7Mw< zQYs(E!4R}pWj!#duf?|3zOk$6;XjfVF1V1?$XNfc&Up+Sz~dsTl9f=H)Pna_$BWJ}m*Y}aO?I8P+2TZ%b?&Lhjxrqb1oy%kx_ZN+u+_9Vt-y`;|T+#beG(>Ai z$jwwFtz1VAiT|wJXUZI&MHdGU1OV`J#b>3vm~=O9e`@4%xz(x& zsUbR1iS}PzRlniS7yrDfUWG#cV|CX^P-tJXEgNh~i47ZTa=eWnH zVe-_d8xzKwgf4@7r1;#LXlN3h1d$&^cM;2l*gVroG5!<|RJnQE^8Ap^9R3W>#WDn2 z6FWJs%T@^T#eJJxEDa1S^m8~>mZfwO$S$noECU%ZZs_uaY8LUEzwDpE>9_{8GWHig z29RtpZM!m!a#F=`+j6o&B-;+qr4ajA0C=W*b5 zgbEu}+$|oBA02rGwa8D2x^EZ5peqdhsNv*z*0ilXEU3eMV*A=BHwD$?Z=i)-^fi#; zS}A#7!>T1C!7*+*>0E_pd445D&pNTC+!-d%E1mIK9K{+{IPvQ_b944?Ryy`GqM<#t z_A)85!<*3V#C&6p3Qrtqzjys9)Rx=Cu4RLYJ<#!dPTbIO+a2=^8?RyLH(0KbE!ds~ zjF@&1@4mp%@s5%2%yYDKAxEO7vqj$@ShaU<9GPc@cke>E`b&dCjGC@tIS#Zh>=cjv zM4aioXa3p^3waT%5-aorxb_)wd!n=A4&hZ`<7?DP1-qMv(Z^E=cy9(L=VFxPUa3Q= z;*NP0$FTGqFId^;!Mz|GOtzY=XEkb1-iBx+$ok5HoyONU5#B;Li%{AKQj+(?VNleI zMAwhWVR5c&Yzy8K!Sz7oAraSnwX;iZzGO8JXK-daW|sM3_#QD(DswB3g~$+Qp2}tO z!-s^^-9*k6_jg|+z2*lxULqXa+Ah=b_jxR;otTNlew%8g&U-EgtM^XvI&s zE%9OgIND-B{9^v@S8qpA zc1c!z(I1PO_%1J4*){SzN*>$t(@Y)?vKtPI)`6CucW^e+!!IF}a*&ctBs>K5E7)up Za#7r07p;N&$s+h73I9!9E-nr_{{!T#F?9d{ delta 3156 zcmb7Gdu&_P8NcWH+I37EOdBV0(?D1$t(%9F<~bTVqEanFq(v<%U>>)w&q?aWvAyrw zYf{)8mS%qxmC~Mq*eHELOVbu87+M}JP=v%wAb|uDmq}A$>ooT7gv2xrzVF$s!mbKpXJZ(V*Gj0 z!cU78`~`89SRm@Qc7?Q%Hss+i^1==SExYHmY*#if@t2iNkEp;+o#AJ3iL+{xy`q=D z!e8B?iKaupJgnWUO)`vigQ(`OP4=_sO8&a28rH;0$`+SiIb`s2{QM3h+Q%>OH~5=4 zx=}3QZ;j}W=-?AKPHIf!Y=e5jZx?Pc=2yyx1FQWmxEm>ldkF3=d>uIFVw>fm>gzh= zD4Etk;Lm^7MsgNJlIeIX8A&EKM>6BtE$LK8YkOP7N@PV#CKexw4GT;DySj&+l+D3C zR}WJ_axQ@(nr=ooBEJmQ<2n~>8)S9O2FB$?s6kHEH2tFJLB{q~iIkNQ@vJ$T<|1jv zlh&*9)0$g*e?yUgz#_;Il(|+V(=lH3J5MHKa${|?xrK%af~^ED0@@X9Bd8=u5u^#m z35ucBNac}1#aVnT>RGR*>j9>_7Ba{bF4lIl?)%B_0fev%w$oUxK&(tNB`*o8;*sh@ zIT%`@*jToNvI{d%apuTRZT3_7QD~s!_Y_`{@jDvLWlULoM#?bjjl~!@}v*b|5Z{uSH5PX`UdyOil>ou&(Q|Isz*W{(zE9JKf zKT-Ks%fHkQcB-6RMXE~JFJ`40!`qjPjc(?#RezKBF1kBZ)T)sply>-){AAH61Np0l z#{NIx+@3cqvaxIyU=n9x9eztf7j{>9IViPD_*e!)C97oH7t4!_f-+MZ$XAvT2NP&x zyDSW=Nc;br=|K$e1wIz>t@v_zS(U5K0Mh((0wK)od84s0E3v&=*goex#2~%}=%4~G z+h#0r#YHE7{*3z_cnM@k8f}2E!6_ooHM?7lz2MX^m z4!H6Z#M#>;6wa5h@J`9bQgH!0N#M3J$wbz6B}EDzCR<|MIkME~VUOw&CnGw~(F)~Y zQne+SD*lT%glf+!5W|>(0Mnx?RVVLT`q%kSkU6b^tW)E`5xH(zXla>mjR~=YCCs5T zn7PzX`Q0FQFB@xD{OF1q*oPseofdYsH#?Bh_sib!t&yi`u~OGZNpO^)%!d>MvJgJp zbbz$PP?5YJ7duksDD%sMY^{8B`OX2Se((%gs70Q_QP`MC7ss|ib&Ae3a3Y0SmTiGL z>Ml9lBzsDOQL<1T433kOs!|$6wl~+XAvw?-Up|wwYSLOVJ62{(Q&L#+v*y9h6ErRL zsUg8!KBO4OR)&*uW6Mp~U*=dnm!mw_Qs>D#UUp0WfEu@-BmGBDEPTxd0LZC{j zYIKUG&k{UGaGIdlS87BD6COhdNZvNZ9+Tg+jnvUg!Fd-jb@0Q6t+%$pE;-s>-%$*p z4z;h3a*U@(GpqI?85U*Y(R^;>zh0&@n<8F*RNYWXl}Tp-(0_@f5W=9 zu!#&*0aXX6@1F-rraq}uc~xbp8nzqr8nvSSLHfj7ukKA4hnLBmxPi|Jib)9#s}8Cl f-afosb4jrZtD#x%6b|&<&fL298-1btt~d1q^(zwm diff --git a/vllm/model_executor/models/__pycache__/siglip.cpython-310.pyc b/vllm/model_executor/models/__pycache__/siglip.cpython-310.pyc index 186536ae50217fb8b119f890d5a3d2175452ff53..b3c6fe0bd4eceb3e0b2dbd485b9db4d864aa8b7e 100644 GIT binary patch delta 2639 zcmb7GX>3$g6z0BJ+Rh@SJ56U=C@nm@x3pzbD6z!_XrW-+5g1-OkC|a+-kaX{rnMEU z3(!Pk5idr;g@&Ne00NF$QDY!RO;}7c`okChkeImqHU1(J&$%XX%S2agsfk<6suqGVrt%(ll z0ab}dEDu=)rGTBY7YK?y{*ArOM2xs|{!T)=;-Sp#rkrhXrT_Rb{JXsN4->3t2m3Mm z0NKHMat5rsP$99Oa!Rcp6rW;uayF1A)|Ojm&LZiA?ayr`3i~SeaL-nL7NG$^w9ySH z_aMj!odAZQt47+Mu%zpy1%)P1_raF5m-$lIfGx?&hWF(%WW&}g>3xAj zV3vMwSXQXU3SC~JvtgHPAHYL{2v4(HOS7xzP^aV0Fai&T1COl)b^BO_yNv8(Tih=4 z3{&0tWIr2qzvtwfIg*^QmBn3^v+42J`(u)#2ZyEJuzVL+?2FOq6J*Z=uvg;a zJrpxjW&E+Y?h&jDBZH46J*X=57@8gDO70&P0mahb$)kr*x-0K1AN;fSEbgpEIEQc^ zf#*9}Kp&vuWdv^dZnD_@745UazFJZA|2lSp*(;05L^8Jrt$bLGvul;VrNqgqCxRHg zF@GSaL5$v*CVK<2r_@U-);*@&)62q*AtS~6>f3Fi%FHj(%cO6dp*=2)oO z)p`lmp7hjb=mabcGk!5u4b$B;jz_x@?qc<3b-_cBU>cG7h4cK7;M4p+w(+EyJM&B`LJeEoxRLZSwJ~?(Q?NJ8 zzF?p3$yB6>?DIw?3jcMPYBUa;l>5i?iZy1~H29IDYlA^Oz!S}1e#4?g!$I9hqjEGX z^~v-Knx?^TA?RaDb72L!=CkT^kUe>DNnZ#)#!O8bxxxmU$_iG%hS_SnEm(xx4(kKN zA=m^55eWOFsWl%9hQ{!kyjdla)m*=8x@55G4eKV=7lSA7GdwaqrG{|HiwO9iM{#5u zCJmgshRgqaeka+<=9SJ#un}A61vCxBe{XgQ*}OjNk42&?)mtf5DfP4TRh8m(wBfC~ X4<$aRj-rH3%Nvi^5uIc^SN-rW-Hn3n delta 2753 zcmb7GZBSHI80Ow(KUi2nSul~01%$i_EFU68Q>ghd8Gb9~8ZH;OunW6;ch9|`AP9cs zOig5Y`jUcioQ$yywH+;Ma)zeTrheF;e%v2TziR4F{mz-{JZD*V1+{U1Jo}#ayyxqA zpYxtO)qk-+U3EC@DeO0Jb@Xz2qj`C=yH6wTfZ8Dk+yQ^PJ3OHK)KFbjO|@I|>q=!< z?&y`f6)oyFKV`{}H0h=xt8VGB9uvvRA#0EA1=Dcaux;2LX^MW8zQH7TqG_3}g3uD} z&f0Bq?qn-0AeYh{NeI#}b50g-=koyS7)W-q5%%+dPQVTt%+1da!rTYg#z0CV ze6lLkR@DUQ&n{ z4*R2L7fYfrM1NRPlt0AWl9TL4FQ0WYtWAJD)S6c%^w3p#S`pt0@4^7GAHXMb!D@-# z%)2Cv$gshnB#;1XoR(|_2n@DJSw^bnA5_Q@)-uc;zP?Z|=|%T(zz84$7zOwl80M~k zD(n2H9;>Ey=|TA*QPI5vpa70CkTOVX0U9S581{Bq@9=rCmd70N29yvX)LGyaG^!UU z&3y>$2OI#T0a5|kfH~ZPOELgRVh~Li;1DeZ;6p0Q77T{gLc+ATu+aD^yW-RmIEK_=PS(!i?IR*5a zWj&0T>av+45W|#C@h2K$RW;wyc`=^xtn$5<*uA1^`O|YbnZ&YZ0i2UFuv~x^`cwI< zjqfv4GRJay4sIOY<4{5!YNtZH0eL_n_hDf2(c1rEpo^~qNYs!AGcZAmm#+{e?#RQx z{4`_1B#ke61Jj&gAZ5jceNkGyZkTzDG+Eabre`%o-bUCv+{yPIQb~}E!HEo$7XkCc zQTNy%>&~O+Nx+AIj{sa0v*cWW<7EJkd=C~E7zY=c8kJXUO-~X9{bEIa)kEF$DQd1L z5~jEU)>aHzcom$aUswDVH!oK{Hv%q<%znSdPVDW|6t7Q_J9ov{$w|68i5lCC{j~um zFxEPoU&Dl&1r5X`(gVu|NbtBItZI5p2q4q2`kG~p5l+ZO7U;3X*C$h~X{2H+aX}>t z`6TAt1DHqtjVhmI_VKBAx4VNZh^ZY~WVNOZLoNY6fy0vgR>6CMe(P>v<@O)<>b4IM zA?%VIBq;?5np1f1rOJbdd$2U8>11_{FwIgkvk?1@S6qyoq-Se? z`*^ZR7oDkhF1?OEYqz3v$>p#XOE53f*XUpMqr!D|zOuYV=1;ZQZ;NK}c7|nvkRjSd zJNr-)MLNA|{bERi=op)uEDmaKsNJ8C1B7o_HmjX|>{a{>LlR{xArMA*3Na(pq_InI z6V3a++gIp#!xN4xEJj*GK1OJF^p^&Qn9T)|{%kO;5`8@(Dj{8`8Y`;4LkPdDhhU8X WQ26<^Mj}B*M2Cxt(2Ej6TpMlH4!q4`nKlp6 zX_fV?Bh1Rm)KZKW@*)VLyZR5JC9J8kFcFQX9 zXDmKQ*-QrDt>0Tek?FPp9)Ugf*>p{_~9OF#zK1WM(fl~IU;8{jCo z32uSE2lQ;D+uZ5-Mn!J%ZlY0+c)NvES);x67KsYn=L=hLV)da8Px-b5rV#Ie```hX z7VK5K5f6fPFvgbk-|b_FVS!>)$9avsC9GFQQGNvU8|v3MFMjq`52iBx(P%8%cOreb zKhk$RaVn;sW8?9IR##pH#b}tQ8AToymD`JJ?84hyps`Ez6H-Vb~Rvo#r&Ta zW63|g?g{2&Yo(&xsz2WxzxE%ZdG<7QR?Yr1IFIf*ZJ=p88B&V2)I2~{i>Ud~WGk<* zz`?+NTI7+yu9_ZEm&hjBNFsyy3XR%_z!1@8J`ikh>2EZN6;=y+rQOk3Dx1jW)FI|z v2Q6#wf_F%MiiTS73{(I!*aKdGmptsKqY}?-7^jjJ2=y3E`kzqZiT22EhaJO1 delta 818 zcmaKpO-vI}5XYVE+SZmv1loocDAuL4h~27HVBnS$LW+Mj^D#CUL%{bk;N=KbHydtaolk~w9u znAWf_w^V#(erfRbi9;DhOr&CwgqV<{Vmg-{NF}%Xw+6(FoRzkuBeB8ADJi2a8Vks$!}?QKJ4Q;5AQKA6J62%?dFKHrVV~0h7qQ-x1itCj1q+cN*CRzmjIE6QGvPJB^N#QkuK)A)=+wj|& zgaN`G!XV);VUqBtL016o;SSddAa?nian9BVMLgMhgfFrx46JpiA6m-*WjyW`~VvzSt+h=J%o#f-IrP?jc;akrMm`7*(?z(4xCFiMnPVH~s58T-ab-{ZY z?2Dwisi>yvu)yMw4Z&~2eH}Yt5%V1fZO52sgc@TF7=dHI9=KJGS3h9a}B$jMALl8i~!o6{bC9hDgm#ie9c&gPUnj(6^YCG~yheGs0LPZQw< jfhQOUhY7CnGUvBSnguA&at2*& zn9ez3o?yfhktY^7RY+DvT`g*iZQ{GEIy4>*HsZO|jVb>u#PHfb4Ke$}UjZpb4Wf~a zX*!c>LJFVS`XP;pDLzO+C}6593I)5;bs;$D&#(eoJ*!{2E{CQ7 delta 550 zcmaLTOD_Xa6bEo;Vn)-dG-W#VD4Gx&VTcV2uXrTHV<`kRrlZQ3X>U>WCRR4Y*;?8X zGKnw1%F2R7y6_n!EbO?4jfI%x{&MgCo_p@i+z&nsdTg)PoyWiI&EB==MXVoHSJO;2 zZCx`}Gcl(ovnva>)!Nk3tfmtyMq^Ubm$bN%cDz!`4U^8UZyn@W-hfRL8ZpC(NT)@m zPObk^00SROk}!|`@-am5NgnVSR5d}UMBHfzjDoVr=Q)vSR@`7ql$*pdo+wJ2#itQB zYoa7c3==70j9|nFCkKg~Xlhx5u{plPo}vr`0q&&$wPai(li|Lk|qpHg}& z+s509S=hmvP`iKY*XGXmrelYSK}cE7VPyv>2bA>^rBvzpX|s>dRSR%{J=L{=Zl1fK z&{YU75crTl_!RPSqxzz1m(B%*D$wSKPNLu zzo4=tBR_AmFvk=&##@_L@U=1u!~r!IMS+NT5D~rER-lE6F?sSKp@7rN$GMpWs z6TGD6iC2P*ssJfvfhe^B2~Zzi delta 493 zcmZ4Ny4;mJpO=@50SGF$HEiU5z^)OXUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?5(_pJNIeW7Os)e65TEu|NZgB0)qPh=|&3DbT{im^68xP%dNgWF6tz zY|$X`n8{~_-MEuLOmh&CvRO{Vi%~os$iBr|l$e*ET9g42&jb-!lj}vr6|;d%P0k`S zkVr0wum%x%Ai@qr?88Dx;nWJO-_$w^X8;uRon zIYWvWWs~R0N;1|> z-XWX8SU*`&?w))NNLUO+)Pe{m5Wxx}ia|vCWI1_R#*)c4^3jYXn`g+cWa3T$iI;!~ MOP~S5ljD_K0G9-LqyPW_ diff --git a/vllm/model_executor/models/__pycache__/ultravox.cpython-310.pyc b/vllm/model_executor/models/__pycache__/ultravox.cpython-310.pyc index 4c598e6904d303d940ac2da5c387ffefbe42f5ff..199e76a02b3fe0741d6b873a9f793eae8eb6c7f0 100644 GIT binary patch delta 62 zcmbPUHo1&DpO=@50SFA&?%T+%#;)R}Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr$vC;CR=oF@e)ncgiNvU*3sCO^7JhmsACKn zW9l$F5|x=P8(v0q;Cw}ssgn^+aE{G6hgqj2&Rep??Xw@2`TSo5)YzoIoadbLKhO2N zJ$=;EN6BqAn>9iHyhl$QOFouZw85>0BJM~a;!=HLi(hrsgkr5BZ)mGK7-)7!I@Q*; zu=Y#hy_A|FRfZkbgfz0;u#icsxoOYM)Tm8mtRaf>^~|R!#(}KIq zmyx=Qr|rekdCi_q{g`V7Lchy@)F5H9+~Xk8uQ~JjDK7%SI$*s-Jn^ZZPgVWlxUt2j ziro-XpZ071E-L(Yrq~0`3(%O=SS08lCGjHC(+8!`NOCTVG*T=nhD?JP)IM5OLNvg0 z1q$uu^@T4{gwGXb(>{HMp?yUeG^Aw~BcFu4Qnt-uH$Y{*CxhoyZx7G#n}QbM+Ye=1(dDWx82=ep8AO zAaOD_&4Vhb-F`8=64V}0^~|G+Weu2+SwFUML_W@q8fpBf%kx;z!>+q zZm~^B(_t1H;CY|NTov>&|LEFG$F(&TgJi?nM-8G9;hp-S4)7KC&eG$M&HLr4D%)hv zr^s;uZomT!@GG8*WuGrPCt;mL9qWKJhvlh=DZb_@$@@$W8&`G&gP{r~fMqwwRKHRY zQv<=MIKh?PA~$XzZoR)vi3R=l$(*=Z_`+NK^71}G*`@hWOKSSPW%LDq;H{-;zUuwM z@fD`9g?%Bv(iGCGM1}tPu*tZ^7m4`8iad)`Y+4xUV4ni? zy`JH(E34=%Q&n)8ezy9(6v}vukyoWI=a;KOcP|E{9#__A?(&Pa=-;O(3Z%sjBRfbqWta1HT%9<0vioEpV*0QK|-v#1w2^Frw7 zD}4t`pY%MB*E~oUv>P?UM6=rP9b=Sn8d1FtT1Px0A=mvqH`O-NMQy5fFVQ7_sBWbE z2ZTci8$~&6Y*AbSHUUf9n&bR>*TO@8xPFso4sqyZWnDVo5Agn0E;>(Pl%r&Q(3z9^fA72}x4(-g^2dG=`_Fm}l5fk{@iEY3j zpnpB|b2xDAZuUr#apMA}*+jjyF|qwO5XcwE}YGg75ppSYSY zXB?Je&b*fNoK%Y4KnEYlnx|)3WLIQ%!qEln0sa{@lf9YtvBU8c_3&kBQLQ> zhFwBvFMsYRl+LS;RO-W8DVX|I{-Y)di|sBai9X$x(@Qz65Ud9_NW|iw4*E4s4adyQ zeoZ_NG4<#_=k`$kzazy9(7XtZRcng`)o~L05uQ3IeP)tt*`%?;w!)Nd5`+5mnj)fp z{vl7H0p5_mpIZ5JekQT8!qCeFX*8s#7i5`ySSDr;gf)Rg;#FV>2ue5;#A~pJfdjxn zZZ7PgL;O>rkSBhuD44VZ?w!CGkJP87h*4?Zf(==ukr0<@5~KWk(H$hXw)hXrGt$YE znW?El8g+~NPKdKmibV)koMC#4&p2!72(K&=rq)OFy(Jw)N7?M!YI{R!#GBmeDq1vO zcV*j-!aL0~uA69@e{nroYdDM|AI8);kS)<*S3?o4y)mkZfTAj*3KMSw?*J3PBzL)Q zv`U)EIFDPulF zj2rL*KA@jp@p+PGmYm07oj{(%erXQNs)$ecs;?;LBROoiVS6wb@+bjpyQxi66;GQM z2u8)nTv1lwMg3!m_qQl*LG?Zv6SE3`c#A4O-3Lg!ygqVCO>bEVeai2a)zC@4Qudqk z3oKy|`$MYI7&5X%g>m6T~3QQgQSMs zi2nw|<$Auy>#O>1He#02$w79^b483 zgJmrGEl*ZINb~xi)x$(*_2FA5DD5lE8hOw-;!z2?@9(*>rU@@o%}Ye*`Jvj;(hHal zVcIN8VdIG6Jg^B^KGsFft#dD4^oQ#<`7UA}dYRdfF7yMu|EC}0FY9hATJFz!1a1V3 zL}*Vj1}yeu#yL5A(}>f2Al+NAI0s!9B>Ml2hIYqIJs@PpON}Y Fe*qz^qWb^< diff --git a/vllm/model_executor/models/__pycache__/xverse.cpython-310.pyc b/vllm/model_executor/models/__pycache__/xverse.cpython-310.pyc index 71a46f3f655b3aa59ab4a584c2accd2e1d290889..e621a3cb8cf0cf7f8a4e567eff35b644afbbbc61 100644 GIT binary patch delta 789 zcmajdOK%cU6bEoGEwtfb0l^U{r6RULLkNklCYl(v)o3Gj;Uh*NwDK4`54en_plwa? zRimx;xbq_zjm^ZwZZyU(AX^r0-1r^bc>iDx3lnFOU(WpJoSAzw^Ci8NcIYmbeTO(w zZ$E81CT+2ENkc6s%W^qkKAipb!JNRML zOW-nC2G_s}=q^xHZ6>#^O0G^*fg&r@yMV!T+84YaZ0+)y&0vkO8vP0#8pSI3>NXd7 z9_2JR04kIo{y5gzXXjcMVcV+exAF=PpV1gDtjb) z6F%er=d$U&&qsSk4vsy=$iV+LNG-2K_eYkcXPsAKroTJW+4~y#BN?_%Mr6YKyyxaR zy4TFlks)T$BJ^!^X7T}|8|dldGpHYen?1oJ1etD-Lj4%9p5O@;_P&w`aS4QR@6Sit zAWyW!h#JxT-s2)4WX=I68|<7GW`2n7WG7x=Cc} Snr0*R!(zi%;Z2$w&-?}{UADCV delta 797 zcmaKpOHUI~7=}GlIwie8ErEv8GEgyC6RnMx#FY&O7eXY&NKC=jDIMCeGoAL#P#o{6 z_aKNpuJ{iu%tWJcW!&n@UAJ!d2f9+v+tP$Y<1C(h^PKlP*AH`_=6psV;61=U``v># zzG?BuY;x74NzGW6wWOxzlU3U)8I_aAQzw$9YAMI6@^V=&DyCzJX)nn*Z-cueSmqPZ z5}*Mp+X+cTcfN-FE>dHyK{ZI>SAYdTXP1XQlN&4?z7VZK)HpI;&7g9w&ezVU%SKr diff --git a/vllm/model_executor/models/internvl.py b/vllm/model_executor/models/internvl.py index 9024831..203badb 100644 --- a/vllm/model_executor/models/internvl.py +++ b/vllm/model_executor/models/internvl.py @@ -4,7 +4,7 @@ # Copyright (c) 2023 OpenGVLab # Licensed under The MIT License [see LICENSE for details] # -------------------------------------------------------- -import re +import regex as re from functools import cached_property, partial from typing import (Iterable, List, Literal, Mapping, Optional, Tuple, TypedDict, Union) diff --git a/vllm/model_executor/models/minicpmv.py b/vllm/model_executor/models/minicpmv.py index 9ee4dd0..0236fc4 100644 --- a/vllm/model_executor/models/minicpmv.py +++ b/vllm/model_executor/models/minicpmv.py @@ -22,7 +22,7 @@ # limitations under the License. """Inference-only MiniCPM-V model compatible with HuggingFace weights.""" import math -import re +import regex as re from functools import partial from typing import (Any, Callable, Iterable, List, Literal, Mapping, Optional, Tuple, TypedDict, Union) diff --git a/vllm/model_executor/models/molmo.py b/vllm/model_executor/models/molmo.py index ccfee16..2ff4e04 100644 --- a/vllm/model_executor/models/molmo.py +++ b/vllm/model_executor/models/molmo.py @@ -1,6 +1,6 @@ import logging import math -import re +import regex as re from array import array from dataclasses import dataclass from functools import lru_cache, partial diff --git a/vllm/model_executor/models/phi3v.py b/vllm/model_executor/models/phi3v.py index 00a04da..523375f 100644 --- a/vllm/model_executor/models/phi3v.py +++ b/vllm/model_executor/models/phi3v.py @@ -14,7 +14,7 @@ # See the License for the specific language governing permissions and # limitations under the License. import itertools -import re +import regex as re from functools import cached_property, lru_cache from typing import (Any, Dict, Iterable, List, Literal, Mapping, Optional, Tuple, TypedDict, Union) diff --git a/vllm/model_executor/models/qwen.py b/vllm/model_executor/models/qwen.py index fd8a27e..3c94173 100644 --- a/vllm/model_executor/models/qwen.py +++ b/vllm/model_executor/models/qwen.py @@ -6,7 +6,7 @@ """Inference-only QWen model compatible with HuggingFace weights.""" import math -import re +import regex as re from functools import partial from typing import (Any, Callable, Dict, Iterable, List, Literal, Mapping, Optional, Tuple, TypedDict, Union) diff --git a/vllm/model_executor/models/qwen2_5_vl.py b/vllm/model_executor/models/qwen2_5_vl.py new file mode 100644 index 0000000..bae5e54 --- /dev/null +++ b/vllm/model_executor/models/qwen2_5_vl.py @@ -0,0 +1,1213 @@ +# coding=utf-8 +# Adapted from +# https://github.com/huggingface/transformers/blob/19e6e80e10118f855137b90740936c0b11ac397f/src/transformers/models/qwen2_vl/modeling_qwen2_vl.py +# Copyright 2024 The Qwen team. +# Copyright 2023 The vLLM team. +# Copyright 2022 EleutherAI and the HuggingFace Inc. team. All rights reserved. +# +# This code is based on EleutherAI's GPT-NeoX library and the GPT-NeoX +# and OPT implementations in this library. It has been modified from its +# original forms to accommodate minor architectural differences compared +# to GPT-NeoX and OPT used by the Meta AI team that trained the model. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +"""Inference-only Qwen2.5-VL model compatible with HuggingFace weights.""" +from functools import lru_cache, partial +from typing import (Any, Callable, Iterable, List, Literal, Mapping, Optional, + Tuple, Type, TypedDict, Union) + +import torch +import torch.nn as nn +import torch.nn.functional as F +from einops import rearrange, repeat +from PIL import Image +from transformers.image_utils import (get_image_size, + infer_channel_dimension_format, + to_numpy_array) +from transformers.models.qwen2_vl.image_processing_qwen2_vl import (make_batched_videos, smart_resize) +from transformers.models.emu3.image_processing_emu3 import make_batched_images + +import vllm.envs as envs +from vllm.attention import AttentionMetadata +from vllm.attention.selector import (_Backend, backend_name_to_enum, + get_global_forced_attn_backend) +from vllm.config import CacheConfig, MultiModalConfig +from vllm.distributed import get_pp_group, parallel_state, tensor_model_parallel_all_gather +from vllm.distributed import utils as dist_utils +from vllm.inputs import INPUT_REGISTRY, InputContext, LLMInputs +from vllm.logger import init_logger +from vllm.model_executor import SamplingMetadata +from vllm.model_executor.layers.layernorm import RMSNorm +from vllm.model_executor.layers.linear import (ColumnParallelLinear, + RowParallelLinear) +from vllm.model_executor.layers.logits_processor import LogitsProcessor +from vllm.model_executor.layers.quantization import QuantizationConfig +from vllm.model_executor.layers.sampler import Sampler, SamplerOutput +from vllm.model_executor.layers.vocab_parallel_embedding import ParallelLMHead +from vllm.model_executor.model_loader.weight_utils import default_weight_loader +from vllm.model_executor.models.qwen2 import Qwen2Model +from vllm.multimodal import (MULTIMODAL_REGISTRY, MultiModalDataDict, + MultiModalInputs) +from vllm.multimodal.base import MultiModalData +from vllm.multimodal.image import cached_get_image_processor +from vllm.platforms import current_platform +from vllm.sequence import IntermediateTensors, SequenceData +from transformers.models.qwen2_5_vl.configuration_qwen2_5_vl import ( + Qwen2_5_VLConfig, Qwen2_5_VLVisionConfig) +from vllm.transformers_utils.processor import get_processor +from vllm.utils import is_cpu + +from .interfaces import SupportsMultiModal, SupportsPP +from .utils import (PPMissingLayer, is_pp_missing_parameter, + make_empty_intermediate_tensors_factory) + +logger = init_logger(__name__) + +# === Vision Inputs === # + + +class Qwen2_5_VLImagePixelInputs(TypedDict): + type: Literal["pixel_values"] + data: torch.Tensor + """Shape: + `(num_patches, num_channels * patch_size * patch_size)` + """ + + image_grid_thw: torch.Tensor + """Shape: `(num_images, 3)` + This should be in `(grid_t, grid_h, grid_w)` format. + """ + + +class Qwen2_5_VLImageEmbeddingInputs(TypedDict): + type: Literal["image_embeds"] + data: torch.Tensor + """Shape: `(batch_size * num_images, image_feature_size, hidden_size)` + `hidden_size` must match the hidden size of language model backbone. + """ + + +Qwen2_5_VLImageInputs = Union[Qwen2_5_VLImagePixelInputs, + Qwen2_5_VLImageEmbeddingInputs] + + +class Qwen2_5_VLVideoInputs(TypedDict): + pixel_values_videos: torch.Tensor + """Shape: + `(num_patches, + num_channels * temporal_patch_size * patch_size * patch_size)` + """ + + video_grid_thw: torch.Tensor + """Shape: `(num_videos, 3)` + + This should be in `(grid_t, grid_h, grid_w)` format. + """ + + +# === Vision Encoder === # + + +class Qwen2_5_VisionMLP(nn.Module): + + def __init__( + self, + in_features: int, + hidden_features: int = None, + bias: bool = False, + act_layer: Callable[[torch.Tensor], torch.Tensor] = F.silu, + quant_config: Optional[QuantizationConfig] = None, + ): + super().__init__() + self.gate_proj = ColumnParallelLinear(in_features, + hidden_features, + bias=bias, + quant_config=quant_config) + self.up_proj = ColumnParallelLinear(in_features, + hidden_features, + bias=bias, + quant_config=quant_config) + self.down_proj = RowParallelLinear(hidden_features, + in_features, + bias=bias, + quant_config=quant_config) + self.act = act_layer + + def forward(self, x: torch.Tensor) -> torch.Tensor: + x_gate, _ = self.gate_proj(x) + x_gate = self.act(x_gate) + x_up, _ = self.up_proj(x) + x_down, _ = self.down_proj(x_gate * x_up) + return x_down + + +def rotate_half(x: torch.Tensor, interleaved: bool = False) -> torch.Tensor: + if not interleaved: + x1, x2 = x.chunk(2, dim=-1) + return torch.cat((-x2, x1), dim=-1) + else: + x1, x2 = x[..., ::2], x[..., 1::2] + return rearrange(torch.stack((-x2, x1), dim=-1), + "... d two -> ... (d two)", + two=2) + + +def apply_rotary_emb_torch(x: torch.Tensor, + cos: torch.Tensor, + sin: torch.Tensor, + interleaved: bool = False) -> torch.Tensor: + """ + x: (batch_size, seqlen, nheads, headdim) + cos, sin: (seqlen, rotary_dim / 2) or (batch_size, seqlen, rotary_dim / 2) + """ + ro_dim = cos.shape[-1] * 2 + assert ro_dim <= x.shape[-1] + cos = repeat( + cos, + "... d -> ... 1 (2 d)" if not interleaved else "... d -> ... 1 (d 2)") + sin = repeat( + sin, + "... d -> ... 1 (2 d)" if not interleaved else "... d -> ... 1 (d 2)") + return torch.cat( + [ + x[..., :ro_dim] * cos + + rotate_half(x[..., :ro_dim], interleaved) * sin, x[..., ro_dim:] + ], + dim=-1, + ) + + +def apply_rotary_pos_emb_vision(t: torch.Tensor, + freqs: torch.Tensor) -> torch.Tensor: + t_ = t.float() + cos = freqs.cos() + sin = freqs.sin() + output = apply_rotary_emb_torch(t_, cos, sin).type_as(t) + return output + + +class Qwen2_5_VisionAttention(nn.Module): + + def __init__( + self, + embed_dim: Optional[int] = None, + num_heads: Optional[int] = None, + projection_size: Optional[int] = None, + quant_config: Optional[QuantizationConfig] = None, + ) -> None: + super().__init__() + # Per attention head and per partition values. + self.tp_size = parallel_state.get_tensor_model_parallel_world_size() + self.hidden_size_per_attention_head = dist_utils.divide( + projection_size, num_heads) + self.num_attention_heads_per_partition = dist_utils.divide( + num_heads, self.tp_size) + + self.qkv = ColumnParallelLinear(input_size=embed_dim, + output_size=3 * projection_size, + quant_config=quant_config) + self.proj = RowParallelLinear(input_size=projection_size, + output_size=embed_dim, + quant_config=quant_config) + + # Detect attention implementation. + selected_backend: Optional[_Backend] = get_global_forced_attn_backend() + if selected_backend is None: + backend_by_env_var: Optional[str] = envs.VLLM_ATTENTION_BACKEND + if backend_by_env_var is not None: + selected_backend = backend_name_to_enum(backend_by_env_var) + if selected_backend is None: + # For Volta and Turing GPUs, use xformers instead. + device_available = current_platform.has_device_capability(80) + if device_available: + from transformers.utils import is_flash_attn_2_available + + if is_flash_attn_2_available(): + self._use_flash_attn = True + else: + logger.warning( + "Current Qwen2-VL implementation has a bug with " + "`vllm-flash-attn` inside vision module, so we use " + "xformers backend instead. You can run `pip install " + "flash-attn to use flash-attention backend.") + self._use_flash_attn = False + else: + self._use_flash_attn = False + else: + if selected_backend == _Backend.FLASH_ATTN: + self._use_flash_attn = True + elif selected_backend == _Backend.XFORMERS: + self._use_flash_attn = False + else: + raise RuntimeError( + f"Qwen2-5-VL does not support {selected_backend} backend now." + ) + def split_qkv(self, qkv: torch.Tensor) -> tuple[torch.Tensor, ...]: + # [s, b, 3 * head * head_dim] + seq_len, bs, _ = qkv.shape + if self.tp_size > 1: + qkv = tensor_model_parallel_all_gather(qkv) + + # [s, b, 3 * head * head_dim] -> 3 * [s, b, head * head_dim] + q, k, v = qkv.chunk(3, dim=2) + + # 3 * [s, b, head * head_dim] + if self.tp_size > 1: + splitter = partial(dist_utils.split_tensor_along_last_dim, + num_partitions=self.tp_size) + q = splitter(q)[self.tp_rank] + k = splitter(k)[self.tp_rank] + v = splitter(v)[self.tp_rank] + + # 3 * [s, b, head * head_dim] -> 3 * [s, b, head, head_dim] + new_shape = (seq_len, bs, self.num_attention_heads_per_partition, + self.hidden_size_per_attention_head) + q, k, v = (x.view(*new_shape) for x in (q, k, v)) + return q, k, v + + def forward( + self, + x: torch.Tensor, + cu_seqlens: torch.Tensor, + rotary_pos_emb: torch.Tensor = None, + ) -> torch.Tensor: + # [s, b, c] --> [s, b, head * 3 * head_dim] + x, _ = self.qkv(x) + + # [s, b, 3 * head * head_dim] -> 3 * [s, b, head, head_dim] + q, k, v = self.split_qkv(x) + batch_size = q.shape[1] + + q, k, v = [ + rearrange(x, "s b ... -> b s ...").contiguous() for x in (q, k, v) + ] + if rotary_pos_emb is not None: + q = apply_rotary_pos_emb_vision(q, rotary_pos_emb) + k = apply_rotary_pos_emb_vision(k, rotary_pos_emb) + + from ixformer.contrib.xformers import ops as xops + from xformers.ops.fmha.attn_bias import (AttentionBias, + BlockDiagonalMask,) + + seqlens = (cu_seqlens[1:] - cu_seqlens[:-1]).tolist() + attn_bias = BlockDiagonalMask.from_seqlens(q_seqlen=seqlens, + kv_seqlen=None) + context_layer = xops.memory_efficient_attention_forward( + q, k, v, attn_bias=attn_bias, p=0, scale=None, op=xops.fmha.flash.FwOp()) + context_layer = rearrange(context_layer, + "b s h d -> s b (h d)").contiguous() + + output, _ = self.proj(context_layer) + return output + + +class Qwen2_5_VisionBlock(nn.Module): + + def __init__( + self, + dim: int, + num_heads: int, + mlp_hidden_dim: int, + act_layer: Callable[[torch.Tensor], torch.Tensor] = F.silu, + norm_layer: Type[nn.Module] = None, + quant_config: Optional[QuantizationConfig] = None, + ) -> None: + super().__init__() + if norm_layer is None: + norm_layer = partial(nn.LayerNorm, eps=1e-6) + self.norm1 = norm_layer(dim) + self.norm2 = norm_layer(dim) + + + self.attn = Qwen2_5_VisionAttention(embed_dim=dim, + num_heads=num_heads, + projection_size=dim, + quant_config=quant_config) + self.mlp = Qwen2_5_VisionMLP(in_features=dim, + hidden_features=mlp_hidden_dim, + bias=True, + act_layer=act_layer, + quant_config=quant_config) + + def forward(self, x: torch.Tensor, cu_seqlens: torch.Tensor, + rotary_pos_emb: torch.Tensor) -> torch.Tensor: + x = x + self.attn(self.norm1(x), + cu_seqlens=cu_seqlens, + rotary_pos_emb=rotary_pos_emb) + x = x + self.mlp(self.norm2(x)) + return x + + +class Qwen2_5_VisionPatchEmbed(nn.Module): + + def __init__( + self, + patch_size: int = 14, + temporal_patch_size: int = 2, + in_chans: int = 3, + hidden_size: int = 1152, + ) -> None: + super().__init__() + self.patch_size = patch_size + self.temporal_patch_size = temporal_patch_size + self.hidden_size = hidden_size + + kernel_size = [temporal_patch_size, patch_size, patch_size] + self.proj = nn.Conv3d(in_chans, + hidden_size, + kernel_size=kernel_size, + stride=kernel_size, + bias=False) + + def forward(self, x: torch.Tensor) -> torch.Tensor: + L, C = x.shape + x = x.view(L, -1, self.temporal_patch_size, self.patch_size, + self.patch_size) + x = self.proj(x).view(L, self.hidden_size) + return x + + +class Qwen2_5_VisionPatchMerger(nn.Module): + + def __init__( + self, + d_model: int, + context_dim: int, + norm_layer: Type[nn.Module] = None, + spatial_merge_size: int = 2, + quant_config: Optional[QuantizationConfig] = None, + ) -> None: + super().__init__() + self.hidden_size = context_dim * (spatial_merge_size**2) + if norm_layer is None: + norm_layer = partial(nn.LayerNorm, eps=1e-6) + self.ln_q = norm_layer(context_dim) + self.mlp = nn.ModuleList([ + ColumnParallelLinear(self.hidden_size, + self.hidden_size, + bias=True, + quant_config=quant_config), + nn.GELU(), + RowParallelLinear(self.hidden_size, + d_model, + bias=True, + quant_config=quant_config), + ]) + + def forward(self, x: torch.Tensor) -> torch.Tensor: + x = self.ln_q(x) + x = x.view(-1, self.hidden_size) + + mlp_fc1, mlp_act, mlp_fc2 = self.mlp + x_parallel, _ = mlp_fc1(x) + x_parallel = mlp_act(x_parallel) + out, _ = mlp_fc2(x_parallel) + return out + + +class Qwen2_5_VisionRotaryEmbedding(nn.Module): + + def __init__(self, dim: int, theta: float = 10000.0) -> None: + super().__init__() + self.dim = dim + self.theta = theta + inv_freq = 1.0 / (theta + **(torch.arange(0, dim, 2, dtype=torch.float) / dim)) + self.register_buffer("inv_freq", inv_freq, persistent=False) + self._seq_len_cached = 0 + self._freqs_cached = None + + def update_freqs_cache(self, seqlen: int) -> None: + if seqlen > self._seq_len_cached: + seqlen *= 2 + self._seq_len_cached = seqlen + self.inv_freq = 1.0 / (self.theta**(torch.arange( + 0, self.dim, 2, dtype=torch.float, device=self.inv_freq.device) + / self.dim)) + seq = torch.arange(seqlen, + device=self.inv_freq.device, + dtype=self.inv_freq.dtype) + freqs = torch.outer(seq, self.inv_freq) + self._freqs_cached = freqs + + def forward(self, seqlen: int) -> torch.Tensor: + self.update_freqs_cache(seqlen) + return self._freqs_cached[:seqlen] + + +class Qwen2_5_VisionTransformer(nn.Module): + + def __init__( + self, + vision_config: Qwen2_5_VLVisionConfig, + norm_eps: float = 1e-6, + quant_config: Optional[QuantizationConfig] = None, + ) -> None: + super().__init__() + + patch_size: int = vision_config.patch_size + temporal_patch_size: int = vision_config.temporal_patch_size + spatial_merge_size: int = vision_config.spatial_merge_size + in_channels: int = vision_config.in_channels + hidden_size: int = vision_config.hidden_size + depth: int = vision_config.depth + num_heads: int = vision_config.num_heads + self.spatial_merge_size = spatial_merge_size + self.window_size = vision_config.window_size + self.patch_size = patch_size + self.spatial_merge_unit = self.spatial_merge_size**2 + self.fullatt_block_indexes = vision_config.fullatt_block_indexes + + self.patch_embed = Qwen2_5_VisionPatchEmbed( + patch_size=patch_size, + temporal_patch_size=temporal_patch_size, + in_chans=in_channels, + hidden_size=hidden_size, + ) + norm_layer = partial(RMSNorm, eps=norm_eps) + head_dim = hidden_size // num_heads + self.rotary_pos_emb = Qwen2_5_VisionRotaryEmbedding(head_dim // 2) + + self.blocks = nn.ModuleList([ + Qwen2_5_VisionBlock( + dim=hidden_size, + num_heads=num_heads, + mlp_hidden_dim=vision_config.intermediate_size, + norm_layer=norm_layer, + quant_config=quant_config, + ) for layer_idx in range(depth) + ]) + self.merger = Qwen2_5_VisionPatchMerger( + d_model=vision_config.out_hidden_size, + context_dim=hidden_size, + norm_layer=norm_layer, + spatial_merge_size=self.spatial_merge_size, + quant_config=quant_config, + ) + + @property + def dtype(self) -> torch.dtype: + return self.patch_embed.proj.weight.dtype + + @property + def device(self) -> torch.device: + return self.patch_embed.proj.weight.device + + def rot_pos_emb(self, grid_thw: torch.Tensor) -> torch.Tensor: + pos_ids = [] + for t, h, w in grid_thw: + hpos_ids = torch.arange(h).unsqueeze(1).expand(-1, w) + wpos_ids = torch.arange(w).unsqueeze(0).expand(h, -1) + hpos_ids = hpos_ids.reshape( + h // self.spatial_merge_size, + self.spatial_merge_size, + w // self.spatial_merge_size, + self.spatial_merge_size, + ).permute(0, 2, 1, 3).flatten() + wpos_ids = wpos_ids.reshape( + h // self.spatial_merge_size, + self.spatial_merge_size, + w // self.spatial_merge_size, + self.spatial_merge_size, + ).permute(0, 2, 1, 3).flatten() + pos_ids.append( + torch.stack([hpos_ids, wpos_ids], dim=-1).repeat(t, 1)) + pos_ids = torch.cat(pos_ids, dim=0) + max_grid_size = grid_thw[:, 1:].max() + rotary_pos_emb_full = self.rotary_pos_emb(max_grid_size) + rotary_pos_emb = rotary_pos_emb_full[pos_ids].flatten(1) + return rotary_pos_emb + + def get_window_index(self, grid_thw): + window_index: list = [] + cu_window_seqlens: list = [0] + window_index_id = 0 + vit_merger_window_size = (self.window_size // + self.spatial_merge_size // self.patch_size) + + for grid_t, grid_h, grid_w in grid_thw: + llm_grid_h = grid_h // self.spatial_merge_size + llm_grid_w = grid_w // self.spatial_merge_size + index = torch.arange(grid_t * llm_grid_h * llm_grid_w).reshape( + grid_t, llm_grid_h, llm_grid_w) + pad_h = vit_merger_window_size - llm_grid_h % vit_merger_window_size + pad_w = vit_merger_window_size - llm_grid_w % vit_merger_window_size + num_windows_h = (llm_grid_h + pad_h) // vit_merger_window_size + num_windows_w = (llm_grid_w + pad_w) // vit_merger_window_size + index_padded = F.pad(index, (0, pad_w, 0, pad_h), 'constant', -100) + index_padded = index_padded.reshape(grid_t, num_windows_h, + vit_merger_window_size, + num_windows_w, + vit_merger_window_size) + index_padded = index_padded.permute(0, 1, 3, 2, 4).reshape( + grid_t, num_windows_h * num_windows_w, vit_merger_window_size, + vit_merger_window_size) + seqlens = (index_padded != -100).sum([2, 3]).reshape(-1) + index_padded = index_padded.reshape(-1) + index_new = index_padded[index_padded != -100] + window_index.append(index_new + window_index_id) + cu_seqlens_tmp = seqlens.cumsum( + 0) * self.spatial_merge_unit + cu_window_seqlens[-1] + cu_window_seqlens.extend(cu_seqlens_tmp.tolist()) + window_index_id += (grid_t * llm_grid_h * llm_grid_w).item() + window_index = torch.cat(window_index, dim=0) + return window_index, cu_window_seqlens + + def forward( + self, + x: torch.Tensor, + grid_thw: torch.Tensor, + ) -> torch.Tensor: + # patchify + hidden_states = x.to(device=self.device, dtype=self.dtype) + hidden_states = self.patch_embed(hidden_states) + + # compute position embedding + rotary_pos_emb = self.rot_pos_emb(grid_thw) + + # windows attention + window_index, cu_window_seqlens = self.get_window_index(grid_thw) + cu_window_seqlens = torch.tensor( + cu_window_seqlens, + device=hidden_states.device, + dtype=grid_thw.dtype if torch.jit.is_tracing() else torch.int32) + cu_window_seqlens = torch.unique_consecutive(cu_window_seqlens) + seq_len, _ = hidden_states.size() + hidden_states = hidden_states.reshape( + seq_len // self.spatial_merge_unit, self.spatial_merge_unit, -1) + hidden_states = hidden_states[window_index, :, :] + hidden_states = hidden_states.reshape(seq_len, -1) + rotary_pos_emb = rotary_pos_emb.reshape( + seq_len // self.spatial_merge_unit, self.spatial_merge_unit, -1) + rotary_pos_emb = rotary_pos_emb[window_index, :, :] + rotary_pos_emb = rotary_pos_emb.reshape(seq_len, -1) + # compute cu_seqlens + cu_seqlens = torch.repeat_interleave(grid_thw[:, 1] * grid_thw[:, 2], + grid_thw[:, 0]).cumsum( + dim=0, dtype=torch.int32) + cu_seqlens = F.pad(cu_seqlens, (1, 0), "constant", 0) + + # transformers + hidden_states = hidden_states.unsqueeze(1) + for layer_num, blk in enumerate(self.blocks): + if layer_num in self.fullatt_block_indexes: + cu_seqlens_now = cu_seqlens + else: + cu_seqlens_now = cu_window_seqlens + hidden_states = blk(hidden_states, + cu_seqlens=cu_seqlens_now, + rotary_pos_emb=rotary_pos_emb) + + # adapter + hidden_states = self.merger(hidden_states) + reverse_indices = torch.argsort(window_index) + hidden_states = hidden_states[reverse_indices, :] + return hidden_states + + +# === Vision input helpers === # + +cached_get_processor = lru_cache(get_processor) + + +def mm_input_mapper_for_qwen2_5_vl( + ctx: InputContext, + data: MultiModalData[object], + data_type_key: str, +) -> MultiModalInputs: + """Input mapper for Qwen2-VL.""" + if data_type_key == "image" and isinstance(data, dict): + return MultiModalInputs({ + "image_embeds": data.get("image_embeds"), + "image_grid_thw": data.get("image_grid_thw"), + }) + model_config = ctx.model_config + image_processor = cached_get_image_processor( + model_config.model, trust_remote_code=model_config.trust_remote_code) + if image_processor is None: + raise RuntimeError("No HuggingFace processor is available " + "to process the image object") + + images = None + videos = None + if data_type_key == "image": + images = data + else: + assert data_type_key == "video" + videos = data + + try: + batch_data = image_processor \ + .preprocess(images=images, videos=videos, return_tensors="pt") \ + .data + except Exception: + logger.error("Failed to process image (%s)", data) + raise + + return MultiModalInputs(batch_data) + + +image_input_mapper_for_qwen2_5_vl = partial(mm_input_mapper_for_qwen2_5_vl, + data_type_key="image") +video_input_mapper_for_qwen2_5_vl = partial(mm_input_mapper_for_qwen2_5_vl, + data_type_key="video") + + +def _get_vision_info( + image_processor, + height: int, + width: int, + min_pixels: int, + max_pixels: int, + do_resize: bool = True, + data_type_key: str = "image", + mm_count: int = 1, +): + """Get information (resized height / width and number of vision tokens) + of input image / video frame.""" + + if do_resize: + resized_height, resized_width = smart_resize( + height=height, + width=width, + factor=image_processor.patch_size * image_processor.merge_size, + min_pixels=min_pixels, + max_pixels=max_pixels, + ) + else: + resized_height, resized_width = height, width + + if data_type_key == "image": + grid_t = mm_count + else: + assert data_type_key == "video" + grid_t = max(mm_count // image_processor.temporal_patch_size, 1) + + grid_h = resized_height // image_processor.patch_size + grid_w = resized_width // image_processor.patch_size + vision_tokens = grid_t * grid_h * grid_w + llm_num_vision_tokens = (vision_tokens // image_processor.merge_size // + image_processor.merge_size) + + return resized_height, resized_width, llm_num_vision_tokens + + +def _get_max_image_info( + image_processor, + data_type_key: str = "image", + mm_count: int = 1, +): + return _get_vision_info( + image_processor, + height=9999999, + width=9999999, + + # Limit min / max pixels. + min_pixels=max(image_processor.min_pixels, 28 * 28), + max_pixels=min(image_processor.max_pixels, 1280 * 28 * 28), + data_type_key=data_type_key, + mm_count=mm_count, + ) + + +def get_max_qwen2_5_vl_mm_tokens(ctx: InputContext, data_type_key: str) -> int: + image_processor = cached_get_image_processor(ctx.model_config.model) + max_resized_height, max_resized_width, max_llm_image_tokens = \ + _get_max_image_info(image_processor, data_type_key=data_type_key, + mm_count=1) + return max_llm_image_tokens + + +get_max_qwen2_5_vl_image_tokens = partial(get_max_qwen2_5_vl_mm_tokens, + data_type_key="image") +get_max_qwen2_5_vl_video_tokens = partial(get_max_qwen2_5_vl_mm_tokens, + data_type_key="video") + + +def dummy_data_for_qwen2_5_vl( + ctx: InputContext, seq_len: int, mm_counts: Mapping[str, int] +) -> Tuple[SequenceData, Optional[MultiModalDataDict]]: + image_processor = cached_get_image_processor(ctx.model_config.model) + + num_images = mm_counts["image"] + max_resized_height, max_resized_width, max_llm_image_tokens = \ + _get_max_image_info(image_processor, data_type_key="image", + mm_count=num_images) + if seq_len - max_llm_image_tokens - 2 < 0: + raise RuntimeError( + f"Qwen2-VL cannot process {num_images} images in a prompt, " + "please increase max_model_len or reduce image limit by " + "--limit-mm-per-prompt.") + + # Check video counts. + num_videos = mm_counts["video"] + max_resized_height, max_resized_width, max_llm_video_tokens = \ + _get_max_image_info(image_processor, data_type_key="video", + mm_count=num_videos) + if seq_len - max_llm_video_tokens - 2 < 0: + raise RuntimeError( + f"Qwen2-VL cannot process {num_images} videos in a prompt, " + "please increase max_model_len or reduce video limit by " + "--limit-mm-per-prompt.") + + hf_config = ctx.get_hf_config(Qwen2_5_VLConfig) + + dummy_seqdata = SequenceData.from_token_counts( + (hf_config.vision_start_token_id, 1), + (hf_config.image_token_id, max_llm_image_tokens), + (hf_config.vision_end_token_id, 1), + (0, seq_len - max_llm_image_tokens - 2), + ) + + dummy_image = Image.new("RGB", (max_resized_width, max_resized_height), + color=0) + + return dummy_seqdata, { + "image": dummy_image if num_images == 1 else [dummy_image] * num_images + } + + +def _get_llm_num_vision_tokens( + mm_inputs: list, + data_type_key: str, + image_processor, +): + """Get number of vision tokens of multimodal inputs. + + This method is derived from `transformers.models.qwen2_vl. + image_processing_qwen2_vl.Qwen2_5_VLImageProcessor._preprocess`. + """ + image = to_numpy_array(mm_inputs[0]) + input_data_format = infer_channel_dimension_format(image) + height, width = get_image_size(image, channel_dim=input_data_format) + _, _, llm_num_vision_tokens = _get_vision_info( + image_processor, + height=height, + width=width, + min_pixels=image_processor.min_pixels, + max_pixels=image_processor.max_pixels, + do_resize=image_processor.do_resize, + data_type_key=data_type_key, + mm_count=len(mm_inputs), + ) + return llm_num_vision_tokens + + +def _expand_pad_tokens(inputs: list, token_id: int, make_batched_fn: Callable, + data_type_key: str, image_processor: Any, + prompt_token_ids: List[int]) -> List[int]: + """ + Expand pad tokens for multi-modal inputs (e.g., images or videos). + + Args: + inputs (list): The multi-modal inputs (e.g., images or videos). + token_id (int): The token ID used to represent the multi-modal input. + make_batched_fn (Callable): A function to batch the inputs. + data_type_key (str): The type of the multi-modal input. + image_processor (Any): The image processor used to process the inputs. + prompt_token_ids (List[int]): The list of token IDs in the prompt. + + Returns: + List[int]: The list of token IDs for the multi-modal inputs. + """ + indices = [ + idx for idx, token in enumerate(prompt_token_ids) if token == token_id + ] + inputs = make_batched_fn(inputs) + assert len(indices) == len(inputs) + + prompt_token_ids_with_data = [] + for cnt, data in enumerate(inputs): + num_tokens = _get_llm_num_vision_tokens( + [data] if data_type_key == "image" else data, + data_type_key=data_type_key, + image_processor=image_processor, + ) + if cnt == 0: + end_idx = indices[cnt] + non_data_tokens = prompt_token_ids[:end_idx] + else: + non_data_tokens = prompt_token_ids[indices[cnt - 1] + + 1:indices[cnt]] + prompt_token_ids_with_data.extend(non_data_tokens) + prompt_token_ids_with_data.extend(token_id for _ in range(num_tokens)) + prompt_token_ids_with_data.extend(prompt_token_ids[indices[-1] + 1:]) + return prompt_token_ids_with_data + + +def input_processor_for_qwen2_5_vl(ctx: InputContext, + llm_inputs: LLMInputs) -> LLMInputs: + multi_modal_data = llm_inputs.get("multi_modal_data", None) + if multi_modal_data is None: + return llm_inputs + + image_inputs = multi_modal_data.get("image", None) + video_inputs = multi_modal_data.get("video", None) + + processor = cached_get_processor(ctx.model_config.model) + image_processor = processor.image_processor + hf_config = ctx.get_hf_config(Qwen2_5_VLConfig) + + # To avoid redundant processing of vision objects (resize, rescale, etc.), + # we extract code of calculating number of vision tokens from + # `transformers.models.qwen2_vl.processing_qwen2_vl.Qwen2_5_VLProcessor`. + # + # The following code is equivalent to: + # prompt = llm_inputs["prompt"] + # inputs = processor(text=[prompt], + # images=image_inputs, + # videos=video_inputs, + # padding=True, + # return_tensors="pt") + # prompt_token_ids = inputs["input_ids"][0].tolist() + + prompt_token_ids = llm_inputs.get("prompt_token_ids", None) + if prompt_token_ids is None: + prompt = llm_inputs["prompt"] + prompt_token_ids = processor.tokenizer( + prompt, + padding=True, + return_tensors=None, + )["input_ids"] + + # Expand image pad tokens. + + if image_inputs is not None: + if isinstance(image_inputs, dict): + prompt_token_ids_with_image = [] + image_indices = [ + idx for idx, token in enumerate(prompt_token_ids) + if token == hf_config.image_token_id + ] + image_cnt = len(image_indices) + embed_dim = image_inputs.get('image_embeds').size(0) + assert embed_dim % image_cnt == 0 + num_pad_tokens = embed_dim // image_cnt + for idx, token in enumerate(prompt_token_ids): + if idx in image_indices: + prompt_token_ids_with_image.extend([token] * + num_pad_tokens) + else: + prompt_token_ids_with_image.append(token) + prompt_token_ids = prompt_token_ids_with_image + else: + prompt_token_ids = _expand_pad_tokens(image_inputs, + hf_config.image_token_id, + make_batched_images, "image", + image_processor, + prompt_token_ids) + + if video_inputs is not None: + prompt_token_ids = _expand_pad_tokens(video_inputs, + hf_config.video_token_id, + make_batched_videos, "video", + image_processor, + prompt_token_ids) + + return LLMInputs( + prompt_token_ids=prompt_token_ids, + prompt=llm_inputs["prompt"], + multi_modal_data=multi_modal_data, + ) + + +@MULTIMODAL_REGISTRY.register_image_input_mapper( + image_input_mapper_for_qwen2_5_vl) +@MULTIMODAL_REGISTRY.register_input_mapper("video", + video_input_mapper_for_qwen2_5_vl) +@MULTIMODAL_REGISTRY.register_max_image_tokens(get_max_qwen2_5_vl_image_tokens) +@MULTIMODAL_REGISTRY.register_max_multimodal_tokens( + "video", get_max_qwen2_5_vl_video_tokens) +@INPUT_REGISTRY.register_dummy_data(dummy_data_for_qwen2_5_vl) +@INPUT_REGISTRY.register_input_processor(input_processor_for_qwen2_5_vl) +class Qwen2_5_VLForConditionalGeneration(nn.Module, SupportsMultiModal, + SupportsPP): + + def __init__(self, + config: Qwen2_5_VLConfig, + multimodal_config: MultiModalConfig, + cache_config: Optional[CacheConfig] = None, + quant_config: Optional[QuantizationConfig] = None) -> None: + super().__init__() + + assert not cache_config.enable_prefix_caching, \ + "Qwen2-VL currently does not support prefix caching" + + self.config = config + self.multimodal_config = multimodal_config + + self.visual = Qwen2_5_VisionTransformer( + config.vision_config, + norm_eps=getattr(config, "rms_norm_eps", 1e-6), + + # NOTE: Qwen2-5-VL vision encoder does not support any + # quantization method now. + quant_config=None, + ) + + self.model = Qwen2Model(config, cache_config, quant_config) + + if get_pp_group().is_last_rank: + if config.tie_word_embeddings: + self.lm_head = self.model.embed_tokens + else: + self.lm_head = ParallelLMHead(config.vocab_size, + config.hidden_size, + quant_config=quant_config) + else: + self.lm_head = PPMissingLayer() + + self.logits_processor = LogitsProcessor(config.vocab_size) + self.sampler = Sampler() + self.make_empty_intermediate_tensors = ( + make_empty_intermediate_tensors_factory( + ["hidden_states", "residual"], config.hidden_size)) + + def _validate_and_reshape_mm_tensor(self, + mm_input: Union[torch.Tensor, + List[torch.Tensor]], + name: str) -> torch.Tensor: + if not isinstance(mm_input, (torch.Tensor, list)): + raise ValueError(f"Incorrect type of {name}. " + f"Got type: {type(mm_input)}") + if isinstance(mm_input, torch.Tensor): + if mm_input.ndim == 2: + return mm_input + if mm_input.ndim != 3: + raise ValueError(f"{name} should be 2D or batched 3D tensor. " + f"Got ndim: {mm_input.ndim}") + return torch.concat(list(mm_input)) + else: + return torch.concat(mm_input) + + def _parse_and_validate_image_input( + self, **kwargs: object) -> Optional[Qwen2_5_VLImageInputs]: + pixel_values = kwargs.pop("pixel_values", None) + image_embeds = kwargs.pop("image_embeds", None) + image_grid_thw = kwargs.pop("image_grid_thw", None) + + if pixel_values is None and image_embeds is None: + return None + + if pixel_values is not None: + pixel_values = self._validate_and_reshape_mm_tensor( + pixel_values, "image pixel values") + image_grid_thw = self._validate_and_reshape_mm_tensor( + image_grid_thw, "image grid_thw") + + if not isinstance(pixel_values, (torch.Tensor, list)): + raise ValueError("Incorrect type of image pixel values. " + f"Got type: {type(pixel_values)}") + + return Qwen2_5_VLImagePixelInputs(type="pixel_values", + data=pixel_values, + image_grid_thw=image_grid_thw) + + if image_embeds is not None: + image_embeds = self._validate_and_reshape_mm_tensor( + image_embeds, "image embeds") + + if not isinstance(image_embeds, torch.Tensor): + raise ValueError("Incorrect type of image embeddings. " + f"Got type: {type(image_embeds)}") + return Qwen2_5_VLImageEmbeddingInputs(type="image_embeds", + data=image_embeds) + + def _parse_and_validate_video_input( + self, **kwargs: object) -> Optional[Qwen2_5_VLVideoInputs]: + pixel_values_videos = kwargs.pop("pixel_values_videos", None) + video_grid_thw = kwargs.pop("video_grid_thw", None) + + if pixel_values_videos is None: + return None + + pixel_values_videos = self._validate_and_reshape_mm_tensor( + pixel_values_videos, "video pixel values") + video_grid_thw = self._validate_and_reshape_mm_tensor( + video_grid_thw, "video grid_thw") + + return Qwen2_5_VLVideoInputs( + pixel_values_videos=pixel_values_videos, + video_grid_thw=video_grid_thw, + ) + + def _process_image_input(self, + image_input: Qwen2_5_VLImageInputs) -> torch.Tensor: + if image_input["type"] == "image_embeds": + return image_input["data"].type(self.visual.dtype) + + pixel_values = image_input["data"].type(self.visual.dtype) + image_embeds = self.visual(pixel_values, + grid_thw=image_input["image_grid_thw"]) + return image_embeds + + def _process_video_input(self, + video_input: Qwen2_5_VLVideoInputs) -> torch.Tensor: + pixel_values_videos = video_input["pixel_values_videos"].type( + self.visual.dtype) + video_embeds = self.visual(pixel_values_videos, + grid_thw=video_input["video_grid_thw"]) + return video_embeds + + def _merge_multimodal_embeddings( + self, + input_ids: torch.Tensor, + inputs_embeds: torch.Tensor, + multimodal_embeddings: torch.Tensor, + placeholder_token_id: int, + ) -> torch.Tensor: + mask = (input_ids == placeholder_token_id) + inputs_embeds[mask, :] = multimodal_embeddings + return inputs_embeds + + def forward( + self, + input_ids: torch.Tensor, + positions: torch.Tensor, + kv_caches: List[torch.Tensor], + attn_metadata: AttentionMetadata, + intermediate_tensors: Optional[IntermediateTensors] = None, + **kwargs: object, + ) -> Union[torch.Tensor, IntermediateTensors]: + """Run forward pass for Qwen2-VL. + + Args: + input_ids: Flattened (concatenated) input_ids corresponding to a + batch. + positions: Flattened (concatenated) position ids corresponding to a + batch. + **NOTE**: If mrope is enabled (default setting for Qwen2-VL + opensource models), the shape will be `(3, seq_len)`, + otherwise it will be `(seq_len,). + pixel_values: Pixel values to be fed to a model. + `None` if no images are passed. + image_grid_thw: Tensor `(n_images, 3)` of image 3D grid in LLM. + `None` if no images are passed. + pixel_values_videos: Pixel values of videos to be fed to a model. + `None` if no videos are passed. + video_grid_thw: Tensor `(n_videos, 3)` of video 3D grid in LLM. + `None` if no videos are passed. + """ + if intermediate_tensors is not None: + input_ids = None + inputs_embeds = None + else: + image_input = self._parse_and_validate_image_input(**kwargs) + video_input = self._parse_and_validate_video_input(**kwargs) + + if image_input is None and video_input is None: + inputs_embeds = None + else: + rope_scaling = getattr(self.config, "rope_scaling", {}) + if rope_scaling.get("type", None) == "mrope": + assert positions.ndim == 2 and positions.size(0) == 3, ( + "multimodal section rotary embedding requires " + f"(3, seq_len) positions, but got {positions.size()}") + + inputs_embeds = self.model.embed_tokens(input_ids) + + if image_input is not None: + image_embeds = self._process_image_input(image_input) + inputs_embeds = self._merge_multimodal_embeddings( + input_ids, + inputs_embeds, + image_embeds, + placeholder_token_id=self.config.image_token_id, + ) + + if video_input is not None: + video_embeds = self._process_video_input(video_input) + inputs_embeds = self._merge_multimodal_embeddings( + input_ids, + inputs_embeds, + video_embeds, + placeholder_token_id=self.config.video_token_id, + ) + + input_ids = None + + hidden_states = self.model( + input_ids=input_ids, + positions=positions, + kv_caches=kv_caches, + attn_metadata=attn_metadata, + intermediate_tensors=intermediate_tensors, + inputs_embeds=inputs_embeds, + ) + return hidden_states + + def compute_logits(self, hidden_states: torch.Tensor, + sampling_metadata: SamplingMetadata) -> torch.Tensor: + logits = self.logits_processor(self.lm_head, hidden_states, + sampling_metadata) + return logits + + def sample( + self, + logits: torch.Tensor, + sampling_metadata: SamplingMetadata, + ) -> Optional[SamplerOutput]: + next_tokens = self.sampler(logits, sampling_metadata) + return next_tokens + + def load_weights(self, weights: Iterable[Tuple[str, torch.Tensor]]): + stacked_params_mapping = [ + # (param_name, shard_name, shard_id) + ("qkv_proj", "q_proj", "q"), + ("qkv_proj", "k_proj", "k"), + ("qkv_proj", "v_proj", "v"), + ("gate_up_proj", "up_proj", 1), + ("gate_up_proj", "gate_proj", 0), + ] + + params_dict = dict(self.named_parameters(remove_duplicate=False)) + for name, loaded_weight in weights: + if "rotary_emb.inv_freq" in name: + continue + if self.config.tie_word_embeddings and "lm_head.weight" in name: + continue + is_visual_gate_up = "visual" in name and ("gate_proj" in name or "up_proj" in name) + if is_visual_gate_up: + if name not in params_dict: + continue + param = params_dict[name] + weight_loader = getattr(param, "weight_loader", default_weight_loader) + weight_loader(param, loaded_weight) + continue + for (param_name, weight_name, shard_id) in stacked_params_mapping: + if weight_name not in name: + continue + name = name.replace(weight_name, param_name) + # Skip loading extra bias for GPTQ models. + if name.endswith(".bias") and name not in params_dict: + continue + if is_pp_missing_parameter(name, self): + continue + param = params_dict[name] + weight_loader = param.weight_loader + weight_loader(param, loaded_weight, shard_id) + break + else: + try: + # Skip loading extra bias for GPTQ models. + if name.endswith(".bias") and name not in params_dict: + continue + if is_pp_missing_parameter(name, self): + continue + param = params_dict[name] + except KeyError: + raise ValueError(f"Unexpected weight: {name}") from None + + weight_loader = getattr(param, "weight_loader", + default_weight_loader) + weight_loader(param, loaded_weight) diff --git a/vllm/model_executor/models/qwen3.py b/vllm/model_executor/models/qwen3.py index 87a08b2..3f63c5f 100644 --- a/vllm/model_executor/models/qwen3.py +++ b/vllm/model_executor/models/qwen3.py @@ -136,11 +136,11 @@ class Qwen3Attention(nn.Module): # Add qk-norm q_by_head = q.view(*q.shape[:-1], q.shape[-1] // self.head_dim, self.head_dim) - q_by_head = self.q_norm.forward_native(q_by_head) + q_by_head = self.q_norm.forward_cuda(q_by_head.contiguous()) q = q_by_head.view(q.shape) k_by_head = k.view(*k.shape[:-1], k.shape[-1] // self.head_dim, self.head_dim) - k_by_head = self.k_norm.forward_native(k_by_head) + k_by_head = self.k_norm.forward_cuda(k_by_head.contiguous()) k = k_by_head.view(k.shape) q, k = self.rotary_emb(positions, q, k) attn_output = self.attn(q, k, v, kv_cache, attn_metadata) diff --git a/vllm/model_executor/models/registry.py b/vllm/model_executor/models/registry.py index 73ae906..a2d063c 100644 --- a/vllm/model_executor/models/registry.py +++ b/vllm/model_executor/models/registry.py @@ -114,6 +114,7 @@ _MULTIMODAL_MODELS = { "PixtralForConditionalGeneration": ("pixtral", "PixtralForConditionalGeneration"), # noqa: E501 "QWenLMHeadModel": ("qwen", "QWenLMHeadModel"), "Qwen2VLForConditionalGeneration": ("qwen2_vl", "Qwen2VLForConditionalGeneration"), # noqa: E501 + "Qwen2_5_VLForConditionalGeneration": ("qwen2_5_vl", "Qwen2_5_VLForConditionalGeneration"), # noqa: E501 "UltravoxModel": ("ultravox", "UltravoxModel"), # [Encoder-decoder] "MllamaForConditionalGeneration": ("mllama", "MllamaForConditionalGeneration"), # noqa: E501 diff --git a/vllm/multimodal/__pycache__/__init__.cpython-310.pyc b/vllm/multimodal/__pycache__/__init__.cpython-310.pyc index 6add128971af6bb7c4aab892a664c9b161d61799..ab4b7072d4c5709fe27f4a23cda488f300713be9 100644 GIT binary patch delta 61 zcmaFM{F0eFpO=@50SFA&?%T-S$f#nkUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS PUrsvR{NdpO=@50SFA&?%T+{gh|Clza+OnzaX*D$wSKPNLu Qzo4=tBR_BRb*3D408)??xc~qF delta 66 zcmdlla#(~rpO=@50SGF$HEiTw!ldD#Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5GE)va0HoIy$p8QV diff --git a/vllm/multimodal/__pycache__/registry.cpython-310.pyc b/vllm/multimodal/__pycache__/registry.cpython-310.pyc index 98fe724af55632c1335842f48d34cc09a98dff1a..350ec50266d4144632ebaa98ffbd28477decfb6b 100644 GIT binary patch delta 62 zcmZ4Hw8)7&pO=@50SFA&?%T+Hms!PLza+OnzaX*D$wSKPNLu Qzo4=tBR_Am0E?I`0AUmq6951J delta 66 zcmZ4Fw9JV+pO=@50SGF$HEiU*%dFw7Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(_heb>l0JPT?BLDyZ diff --git a/vllm/multimodal/__pycache__/utils.cpython-310.pyc b/vllm/multimodal/__pycache__/utils.cpython-310.pyc index 9e3b55cc5eadf536683a21082321605323ad1862..d04d3df17638203eeb5c1b1c4f4accbdb976ffb7 100644 GIT binary patch delta 62 zcmX@?wBLz4pO=@50SFA&?%T+{hDF6jza+OnzaX*D$wSKPNLu Qzo4=tBR_BReU=m%0BQjhHUIzs delta 66 zcmdn*bl8bIpO=@50SGF$HEiTw!=mA!Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5HcN^O0KMQAMgRZ+ diff --git a/vllm/multimodal/__pycache__/video.cpython-310.pyc b/vllm/multimodal/__pycache__/video.cpython-310.pyc index 6a318a232381ccc5c72ab044c7e7d00f81b024a4..e2d31636a6aed91d1a03653dcd6e67b12aae9325 100644 GIT binary patch delta 62 zcmew;{8pGdpO=@50SFA&?%T+Hj!DHvza+OnzaX*D$wSKPNLu Qzo4=tBR_95Bl8C~0Br6Q>i_@% delta 66 zcmaDW{85-YpO=@50SGF$HEiTQ$E4w)Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5FVhD$0L4NU`Tzg` diff --git a/vllm/platforms/__pycache__/__init__.cpython-310.pyc b/vllm/platforms/__pycache__/__init__.cpython-310.pyc index 07fb96c44b6e9b379b810d697b37305667da5273..0b50dc419131ff82cbc52614604ab580326d0e5b 100644 GIT binary patch delta 61 zcmZ3_wVI1NpO=@50SFA&?%T-i#iC-TUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS PUr0I5|KdH?_b diff --git a/vllm/platforms/__pycache__/cuda.cpython-310.pyc b/vllm/platforms/__pycache__/cuda.cpython-310.pyc index 559a358171f8d3d66464165cc3d96a60bc6eae4d..6c4935a6f8ce118502a4f5c3e01d3c11d27b62ff 100644 GIT binary patch delta 62 zcmeyO{z08PpO=@50SFA&?%T+{jYY*uza+OnzaX*D$wSKPNLu Qzo4=tBR_BROBQZ^0Cj>D4gdfE delta 66 zcmeyM{zaWTpO=@50SGF$HEiVG#-d@TUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5DGN700Ln2I9smFU diff --git a/vllm/platforms/__pycache__/interface.cpython-310.pyc b/vllm/platforms/__pycache__/interface.cpython-310.pyc index 9e971de57e34331e7118f4e80f55db9d0244a105..053ec4f9802a47e18cc68889cf75bf35f2f67fb8 100644 GIT binary patch delta 62 zcmbQDI6;v+pO=@50SFA&?%T-S&!}RrUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr*D$wSKPNLu Qzo4=tBR_AmB(oqh07^X*n*aa+ delta 66 zcmZ3+vx UlB!#fn4F!Mo?5(Flv$7&0Gxajs{jB1 diff --git a/vllm/platforms/__pycache__/tpu.cpython-310.pyc b/vllm/platforms/__pycache__/tpu.cpython-310.pyc index 84d31fe6af19c4f2fce7142a035fa7c82a7527a7..142ab4db2d453885090f12bb14f30a910a5c9676 100644 GIT binary patch delta 62 zcmZ3(wStQ~pO=@50SFA&?%T+%&!l3hUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr*D$wSKPNLu Qzo4=tBR_AmEYkrd0AlGBt^fc4 delta 66 zcmcb~d6$zrpO=@50SGF$HEiU5#i(JcUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(FlIZ{w0Jg9dz5oCK diff --git a/vllm/plugins/__pycache__/__init__.cpython-310.pyc b/vllm/plugins/__pycache__/__init__.cpython-310.pyc index fb5aa1d9370a61813559b3a807a69e68da8e0255..01e729b56d0559f0a6aca199393714c11262fc5f 100644 GIT binary patch delta 384 zcmcb}cb1PkpO=@50SFA&?%T+1!ps;o*@1bJrWjDrXu;t{H%IXvLJPGAOfKS%#xTK&Z@7R(;)svWOUzA;k1yf}DUt*cQj_noNomT1m>{Qu S9aW?OVrha13_mHd>i_`W(@V<$ diff --git a/vllm/prompt_adapter/__pycache__/__init__.cpython-310.pyc b/vllm/prompt_adapter/__pycache__/__init__.cpython-310.pyc index b77191e9a1a6494222a7c620985173b5f4d2ed45..a0d7d61e7b7d6cefdb8d03bc4a0b63efa94651bf 100644 GIT binary patch delta 59 zcmZ3&xPXy6pO=@50SFA&?wiPMqvEVzl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEohz6ae=F69@nR delta 63 zcmZ3$xP*~ApO=@50SGF$HB98T(QwxiX8i-CiY?LQkM%l|6d$&K1t Kn~#aw$^rneXdR#c delta 116 zcmZonYfj_N=jG*M0D{VG4I8;-nKfMXON)#2bMliDbM$jElk^KJOEU8FjP(o+^ouh~ zQgsUwld}`kQ;RqIFyChu-~sAnV_;)qV`Tcv!pQc2vn9JfA0G!$l&OJ>fsIk*D$wSKPNLu Qzo4=tBR_AmIuj2w08vL1#sB~S delta 66 zcmZ3_wV8`MpO=@50SGF$HEiVm!l>b UlB!#fn4F!Mo?5(FnTdxP0HhKW)&Kwi diff --git a/vllm/prompt_adapter/__pycache__/utils.cpython-310.pyc b/vllm/prompt_adapter/__pycache__/utils.cpython-310.pyc index a143fd4bf20608b32f6233f3a23e8aff8f44aab9..0e78e38433c5c1f0e19506d60d780b54edf41169 100644 GIT binary patch delta 138 zcmaDO^h1a@pO=@50SFA&?#nRW$h(qJ#X-L$w?Mxjvp}~bu_!&YMAtmGG$YqAw_HCb zGfBUovLquvZ}L6HY{rhwUQ7*)tjsBbz08}>GJj^0Ws2g-O)QAd$xlu!$;{7-;wewf qOwTAOj?d4_soZ>?&6JT@Ku~BhJBK_o%YUB9njF52T$9T=z5)PS(k&GL delta 152 zcmew%^hSs`pO=@50SGF$HDsu4L(gX2D*j&8L|^Gx0M<@#H2J#DjE~Waj5>zRhOJ ysLCfO@}G%`=^qCR8>1K#A0v=t1d%*U9E?1STr5nCO#k^Nn{xOva!hXK_zD0Gaw;_d diff --git a/vllm/prompt_adapter/__pycache__/worker_manager.cpython-310.pyc b/vllm/prompt_adapter/__pycache__/worker_manager.cpython-310.pyc index 3cc1bba275d0a96c79343382bd9f154af083c975..24b2c337d7a7b787fe778398c94eb19ba8d77879 100644 GIT binary patch delta 62 zcmZ2tyug?{pO=@50SFA&?%T-S&Z^?6Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr*D$wSKPNLu ozo4=tBR_BQPcBmdkS;a`CPofMrvGe=RW_3wr6o5 xlB!#fn4F!Mo?1NlE0?Jd4^Sf;0}~?~Bhx=1`M=6$asZ3O*D$wSKPNLu izo4=tBR_BRRgS-0OnDreuLujVGjlL=Y mlB!#fn4F!Mo?5*5BFA4Yrox?@F9-{ diff --git a/vllm/spec_decode/__pycache__/interfaces.cpython-310.pyc b/vllm/spec_decode/__pycache__/interfaces.cpython-310.pyc index ed509147eb71aa9e1ec46aa1885b6714617a4cd8..9a5a06525556a5686f05554ff96066a10e6ff2dc 100644 GIT binary patch delta 62 zcmca2c0r6gpO=@50SFA&?%T*M!>r<@Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr*D$wSKPNLu Qzo4=tBR_Am5py>m0A+;~u>b%7 delta 66 zcmdm~yjPh!pO=@50SGF$HEiVm&!pk0Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(FkGY!<0J)?U!2kdN diff --git a/vllm/spec_decode/__pycache__/metrics.cpython-310.pyc b/vllm/spec_decode/__pycache__/metrics.cpython-310.pyc index f37fc633498402c4408c9908cd88c803d7a5cd81..9518ee31e0843c7940171a0a2680b4759bf8cbdb 100644 GIT binary patch delta 62 zcmbQMK2x1LpO=@50SFA&?%T+n&!l3nUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr$|pO=@50SGF$HEiT=*D$wSKPNLu zzo4=tBR_AmESoq7Qy$}HGrlEUihL|wf0>xr{xLCgu`vB(VPyFaWHEF7XJTYw2IBur Kn}19E69xclLLhPg delta 113 zcmeww`7@F`pO=@50SGF$HEiU5#j4?}Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?5(Fl1-e0sZeRN5#JInMIIKOzf4SQ|CpFLSXlnCFtYpyvY2`PGcmF- PGchv#XW9H+;-4@8`ZOV) diff --git a/vllm/spec_decode/__pycache__/ngram_worker.cpython-310.pyc b/vllm/spec_decode/__pycache__/ngram_worker.cpython-310.pyc index 0da7d4e121b2b2efd1f1b334012b0df776158c85..dfc4758401b41c5fda4cd84d9f9c0a541f10af47 100644 GIT binary patch delta 114 zcmdn3wq1=opO=@50SFA&?%T-S%B delta 138 zcmdn4wp)!mpO=@50SGF$HEiT=W!CV}FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` zN!2Y#OwLYBPc7cOg}IT1sc`pZa}G;p##@^UxqmS+x^2$kD_|722bx!82qbQ?WT#dZ jYckzp(laP>oZQGFyqQg4B_p>hNC5|kaNE2~u$B=3rRgZi diff --git a/vllm/spec_decode/__pycache__/proposer_worker_base.cpython-310.pyc b/vllm/spec_decode/__pycache__/proposer_worker_base.cpython-310.pyc index 2b3eb515628dbcf52d6bd7eba3c82d264fd0d59e..6d326eb8f3076dd770d3dc042a54faac66f1ff5d 100644 GIT binary patch delta 62 zcmew(@pO=@50SFA&?%T-S&!pm`Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr0KoAUZvX%Q diff --git a/vllm/spec_decode/__pycache__/smaller_tp_proposer_worker.cpython-310.pyc b/vllm/spec_decode/__pycache__/smaller_tp_proposer_worker.cpython-310.pyc index c47e835bee8712373b89839b8e60fb9aeeb037b7..c8bd07f2fc44a85acc02b23e02b27c250f406e49 100644 GIT binary patch delta 62 zcmeCz>(=AW=jG*M00P6c`!;fmv#A8>m*f`c7i1RbmLwLXri_@% delta 66 zcmeCy>(}GX=jG*M0D{VG4I8<|*)+oRON)#2bMliDbM$jElk^KJOEU8FjP(o+^ouh~ UQgsUwld}`kQ;Rpdu^klv0DvqM`v3p{ diff --git a/vllm/spec_decode/__pycache__/spec_decode_worker.cpython-310.pyc b/vllm/spec_decode/__pycache__/spec_decode_worker.cpython-310.pyc index a4e914a409659815416c0a6b762582da66bf4cf7..dae197d24fe340d459f465afe1805f9ebc55e453 100644 GIT binary patch delta 618 zcmezRlkx3OM(%uGUM>b8FkHKDBlk>B6)*jg+yecA%mUq##G>@n5?%A$(u`cg+;aV# z%q0DS%94!yyv=7gd-xf*O^%eD$iniUg=zB#$vK?N9L!9c`;{kX^MTA`V_;+AVdVM8 z#5b+$&^#QTw0Es?kAmhd4hw<^^AU#Eea3vreD;bNP zOb$;d;{|h=iog~W$5AQ%Mu*)w`zM2@#b`QkAx!Ej9Ox#yn$+V~{hH?Vy}wJJ4zrdCDT&uTKu`6zEW5|#&AnurQA-+D*W zdTz^2M_bog?^IO02Z}thYa>l^f7?ED3dVCe+U6QG#SQL7`-5^KB<^9O8Tbgy@Q7<0 zvr6)ly3M@g?)QSCXH{&NM2TD4`+}Gm)`Zs%$L87gdUH;>5se4jnoBt4zhN=|uj?Sx zkOJ#UEMT<=d;+}te1`I_w>tafZ!F>$ap=kep-R9D;H9rt@fGB2!0YiEy|OVLjh!&3 zu~U$Z9mX1~qG6PHPyE*UKP_rqDe->jxcnNQC-V(rZ)GvDn`nu*CBs(5fnDI{ eubTnCtUb5Y2>-z5G2jpo1u!i7fHI%FF!&p{ro^`Z diff --git a/vllm/spec_decode/__pycache__/target_model_runner.cpython-310.pyc b/vllm/spec_decode/__pycache__/target_model_runner.cpython-310.pyc index af40176d589346fcc49a8da21dbbfc34e70289c0..dcefa2f62c7b6240729c9f9a81071689d73d97f1 100644 GIT binary patch delta 62 zcmew^@>zsCpO=@50SFA&?%T*ck4?o}za+OnzaX*D$wSKPNLu Qzo4=tBR_BRMYd(k0By$=VgLXD delta 66 zcmew?@?C^GpO=@50SGF$HEiUb$EM-0Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5EZZ_>0KwuGasU7T diff --git a/vllm/spec_decode/__pycache__/top1_proposer.cpython-310.pyc b/vllm/spec_decode/__pycache__/top1_proposer.cpython-310.pyc index 0e72f46275d37867503b0a6688ae7cd088d3d381..d1f72a3492b52ef9efe8e3d79cf5c57d9e7c5810 100644 GIT binary patch delta 123 zcmX@Fb5w^rpO=@50SFA&?%T+HomItEza+OnzaX*D$wSKPNLu zzo4=tBR_957n?1+oEA_Q3pWcR3!?xd7c&Z$pHfL XENuT-m?oDBr~ny4lAGrXY+wZd^N}7O delta 133 zcmX@Ab6$r#pO=@50SGF$HEiU*&Z^<5Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?5(_jm?%_K?kUlg`0(ug;9W!i_if}hWl^!wFUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E zFQ_cZ$j{rH!BW90A^_CI#=ynO!Nl^5kCBa$KymlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} zr0NzVCTAz6rxtHcVX0sh69VdFW8h+CV`BQr!pO(S#>n!I?f>QvocThGw*D$wSKPNLu Pzo4=tBR_BQRYqR`Cy*2t delta 65 zcmbQovWSH{pO=@50SGF$HEiTw#Hit|Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> TlB!#fn4F!Mo?1NlBBL(=cV87I diff --git a/vllm/transformers_utils/__pycache__/config.cpython-310.pyc b/vllm/transformers_utils/__pycache__/config.cpython-310.pyc index 852d8f10c2976c282d19ae5e9a728ca253c8951a..532911ccecf37ef8553efc8f55b9d56891dbce00 100644 GIT binary patch delta 118 zcmccMa>|7}pO=@50SFA&?%T*+#HQk^Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUr0c=pO=@50SGF$HEiTAV$<-{FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` zN!2Y#OwLYBPc7cOkWH7Fsc_@u3!HL5YV!xq5EjN|lU@0;*_i$VAi_@% diff --git a/vllm/transformers_utils/__pycache__/tokenizer.cpython-310.pyc b/vllm/transformers_utils/__pycache__/tokenizer.cpython-310.pyc index 60b447301888452a9a962c767fd237c5028cff44..191d2845193e4e4ee7e5d5a4b111b285d83428be 100644 GIT binary patch delta 80 zcmcbwb6tl!pO=@50SFA&?%T+Ho<+q&za+OnzaX*D$wSKPNLu jzo4=tBR_956YFAL#)iqugp%2K7 rlB!#fn4F!Mo?5*5AIoB1#+J#8gp#?q7@7WaF){sPVcyIw?86KI1d1F; diff --git a/vllm/transformers_utils/__pycache__/utils.cpython-310.pyc b/vllm/transformers_utils/__pycache__/utils.cpython-310.pyc index 77fb60c3369a82920c245f7da79ca9858f22366f..4dc959c4b373cad3965555fd293480acd3005e1f 100644 GIT binary patch delta 61 zcmeBVZDr-o=jG*M00P6c`!;gVVpMU_FUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E PFQ_cZ$j_U6mT?aN8r2j+ delta 65 zcmZo=?PTT7=jG*M0D{VG4I8;} Tr0NzVCTAz6rxs5>$+!mqX}A?q diff --git a/vllm/transformers_utils/configs/__pycache__/__init__.cpython-310.pyc b/vllm/transformers_utils/configs/__pycache__/__init__.cpython-310.pyc index 400b5e3771174c53bd187fd02fa5fbf97f042be2..52a9ae47b6fe78741ea1561776cc7183c637d02b 100644 GIT binary patch delta 61 zcmeyy{fV19pO=@50SFA&?%T+n#H!-2Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS PUr0HGWesQ>@~ diff --git a/vllm/transformers_utils/configs/__pycache__/chatglm.cpython-310.pyc b/vllm/transformers_utils/configs/__pycache__/chatglm.cpython-310.pyc index 5b934d3f1f894b1e28279128e678c5e3b6b45491..b8baa1b961ad824451626c64513be3a9b99bb34b 100644 GIT binary patch delta 62 zcmeyx`;C`7pO=@50SFA&?%T-ykwwK%za+OnzaX*D$wSKPNLu Qzo4=tBR_Am3hOmS0C)WrE&u=k delta 66 zcmeyy`-_)5pO=@50SGF$HEiVm$f6OXUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(Ff%O_A0L@4iJ^%m! diff --git a/vllm/transformers_utils/configs/__pycache__/dbrx.cpython-310.pyc b/vllm/transformers_utils/configs/__pycache__/dbrx.cpython-310.pyc index 2f8b67a8b2ca0debe7e777c951b36b6edc41ac66..f014576ae9581b7e046af7a57164411b21f1dc20 100644 GIT binary patch delta 134 zcmX@*xzCe3pO=@50SFA&?%T+%#-`$}Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUrAuJ{Ar}4rUHUrvH3QEKHlfa_rzFq~^TP GZ$SWwr69Hd delta 146 zcmdnzdCHSJpO=@50SGF$HEiToW7F{0FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` zN!2Y#OwLYBPc7aY%2vgsqz2T<#lphG#K`iWiIM9+9}5Q~8#B{?4ko65Jj_ggSy(r} O<=DYVjJm@@zXbt?wk5&< diff --git a/vllm/transformers_utils/configs/__pycache__/eagle.cpython-310.pyc b/vllm/transformers_utils/configs/__pycache__/eagle.cpython-310.pyc index 39a4a5038f399be995f83e348b6b9813d930e979..be8b08a204428a3f41d1d6abccba42322c32f34a 100644 GIT binary patch delta 70 zcmbQuGo6P!pO=@50SFA&?%T+1#;oF_Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS YUr};OKXU{V03%rzNB{r; diff --git a/vllm/transformers_utils/configs/__pycache__/exaone.cpython-310.pyc b/vllm/transformers_utils/configs/__pycache__/exaone.cpython-310.pyc index 161adbcd4450a5c7fa0e7d891139b62661e3aabc..c39474db12480bde04e275923e14c5ba2d9aaca2 100644 GIT binary patch delta 62 zcmca&alwK+pO=@50SFA&?%T*cSyIJUza+OnzaX*D$wSKPNLu Qzo4=tBR_BRG08qA0B>{^T>t<8 delta 66 zcmca$am9i=pO=@50SGF$HEiUbEU6KwUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5kYpbd0K>l)Z2$lO diff --git a/vllm/transformers_utils/configs/__pycache__/falcon.cpython-310.pyc b/vllm/transformers_utils/configs/__pycache__/falcon.cpython-310.pyc index aab95b571a55ac957b98a592012cb6b9ee3bb8a6..49f16255ab79795029dc378bcea2dd6c9bc413b8 100644 GIT binary patch delta 62 zcmey#_mz)3pO=@50SFA&?%T*6z@p--Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr*D$wSKPNLu zzo4=tBR_AmzSK!(J|CbiE*2I>9wt6UCdSDeax!WhOdLQa2(tWV`Om=& zlB!#fn4F!Mo?5(FTk0fpLtF*E&TVqpS`vixWH&%umC{Lf|=Ic_EZ+xaM9 diff --git a/vllm/transformers_utils/configs/__pycache__/medusa.cpython-310.pyc b/vllm/transformers_utils/configs/__pycache__/medusa.cpython-310.pyc index dd4229281e14a094426b93de5497406f3f52f74c..ad40fe5b9c0987369b66ae86b9ed2272cc6bda67 100644 GIT binary patch delta 62 zcmZ20uu_0KpO=@50SFA&?%T*M%B*D$wSKPNLu Qzo4=tBR_BRclOz>% delta 66 zcmZ1{yh)flpO=@50SGF$HEiTQ!mbgiUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5*5Gy85v0H`b$Q2+n{ diff --git a/vllm/transformers_utils/configs/__pycache__/mpt.cpython-310.pyc b/vllm/transformers_utils/configs/__pycache__/mpt.cpython-310.pyc index 18a77583714bb30be866f01bf852ff4395814882..07ea9347357104cfcf18a0e89c010a700dae1830 100644 GIT binary patch delta 78 zcmeCtYSZG*=jG*M00P6c`!;e%aHx3cm*f`c7i1RbmLwLXre1rP=jG*M0D{VG4I8;5I5hn9ON)#2bMliDbM$jElk^KJOEU8FjP(o+^ouh~ mQgsUwld}`kQ;RpZb1dRyoHtoZD4C6ek?B7Z)8>gnrAz=aeHrlp diff --git a/vllm/transformers_utils/configs/__pycache__/nemotron.cpython-310.pyc b/vllm/transformers_utils/configs/__pycache__/nemotron.cpython-310.pyc index d8b8e040976bcc91b2235326f784af2d29c54ab8..693b3ca2f9e7a3cbf684cf8ed44033a8212d4060 100644 GIT binary patch delta 105 zcmexv@!o7i-m=ejfshoB+P@}Gy1=|2xF0X8s`i4i0Wg#R`# ImO8@-08RBDd;kCd diff --git a/vllm/transformers_utils/configs/__pycache__/nvlm_d.cpython-310.pyc b/vllm/transformers_utils/configs/__pycache__/nvlm_d.cpython-310.pyc index 3e4678379af25d38ea2f2d9c2ebb60bce1eca241..f9cee42c46843292ce620a2d2ff1b060f9ff4aea 100644 GIT binary patch delta 60 zcmbQsJd>F_pO=@50SFA&?wiQ{T*X(vB)34nAhSTXB(W$xwM5rEw=^TyFt=PkCo@UE Opt2+*KX0-WV>19GiW9E@ delta 64 zcmbQqJeQd}pO=@50SGF$HB97wt`VqTT3n=`lb@WJqo0$Rq+d{3l98WhtY>JTUz}Nz Ss#}nloSm4ST0B{du^9k#z7)Rz diff --git a/vllm/transformers_utils/configs/__pycache__/qwen2vl.cpython-310.pyc b/vllm/transformers_utils/configs/__pycache__/qwen2vl.cpython-310.pyc index 6d53853d08564104e1e28d79c9da65b4e8bbf5b3..32491a113effbffa832f2e983a8e906c4326ed21 100644 GIT binary patch delta 62 zcmdlYx*D$wSKPNLu Qzo4=tBR_95C-Z7{092(EQvd(} delta 66 zcmdlWx UlB!#fn4F!Mo?5(_m3cKg0H=%_if}hkX7-~FUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E zFQ_cZ$j{rHEX%{pX9U#6#lphK!^FqP#5lQLL5h!qi3!MLVr2Obf}2+=++hR&xq=&3 delta 130 zcmezC((1~c&&$ij00foW8a8qp$Z7=WmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} zr0NzVCTAz6rxtIHm*ru$G6U-5VqszAVd7zA`p?9~#K^+L@{i>|9}6F&03!*D$wSKPNLu Qzo4=tBR_Am5py9k08w-lJ^%m! delta 66 zcmbQwyO@_dpO=@50SGF$HEiVm&!iEpUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> UlB!#fn4F!Mo?5(FkGYT;0Hj+LP5=M^ diff --git a/vllm/transformers_utils/tokenizer_group/__pycache__/base_tokenizer_group.cpython-310.pyc b/vllm/transformers_utils/tokenizer_group/__pycache__/base_tokenizer_group.cpython-310.pyc index 63750e8441972b57d487a067a7872a0f7ef860f9..e1077282911162fe6fab53efc99f711c0563a05f 100644 GIT binary patch delta 62 zcmdlcyh)flpO=@50SFA&?%T+HfJr4;za+OnzaX*D$wSKPNLu Qzo4=tBR_BRXQsn!09X UlB!#fn4F!Mo?5*5J=0+}0IKyCVgLXD diff --git a/vllm/transformers_utils/tokenizer_group/__pycache__/ray_tokenizer_group.cpython-310.pyc b/vllm/transformers_utils/tokenizer_group/__pycache__/ray_tokenizer_group.cpython-310.pyc index 43c7d5fae27a663a94b3759b321537c07870774c..5c3bbcc5f6f77c2093be461fbab0848be12b14af 100644 GIT binary patch delta 62 zcmX?QdCZbKpO=@50SFA&?%T-S&Z?56Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUr_ig0<&a4urUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrz>% diff --git a/vllm/transformers_utils/tokenizers/__pycache__/__init__.cpython-310.pyc b/vllm/transformers_utils/tokenizers/__pycache__/__init__.cpython-310.pyc index e4bba79a27f214ee668aa8ce9c15f0cfba157503..1e6b3a2cac5965c0dc5df971374e1d54b792715b 100644 GIT binary patch delta 59 zcmey#_?3}6pO=@50SFA&?wiQnpc15Cl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEq%{8vrX@6j}fP delta 63 zcmey$_>+-4pO=@50SGF$HB97g&0zg diff --git a/vllm/transformers_utils/tokenizers/__pycache__/mistral.cpython-310.pyc b/vllm/transformers_utils/tokenizers/__pycache__/mistral.cpython-310.pyc index 27bceffae2a0594de845f4aab4a32a1902242178..c3399cc7fe7be6f37b66c89366641d0567398798 100644 GIT binary patch delta 282 zcmaFm^xBCxpO=@50SFA&?#pnU$ZH_Sl){k0l*63M62-#E0Aw@gu;#Kwv4PnvITPbW z>vMUdc)?uO9KKxsDE?f5C;>2^Ek`g{C`t&-W(Tr`qeQ@LjvUcku_!Sxn=?l|S0YLx zS29YHks+0%$PZ`*SB_M!bd)rZ&*ILI!kxm?!jQt#%+$;nC6mIN%AG1J$&kjB!k5C| z!V)Ft&dZP@kRk|FBG}9nCA{&^WJZ-h{gT`Q{esK_-IBzj^wbhv^W4&mT*KUQ{hZ7s z{esGpjQqUK+nJ7w@PYiw#=ykL!^rfXjd63IcsK{Ie31iC^cHJTYI99+*%8~ALW*r@Q&L!YbtR9w zqJv%N%7J!CxX1l9;r@!PDD3c{aEsjzxn(@$(OQQ+xzXUU+=y2UlGmRNJ-p5yXH_Q3 z(NJV!a+6IL^KtobdVJE)W|MhwG#!rahj+!SuGvR3@#X&}VbrDUmr?WY>0*<&&+7N| Pz&7`*T&DGRZ%O|FKy65e diff --git a/vllm/transformers_utils/tokenizers/mistral.py b/vllm/transformers_utils/tokenizers/mistral.py index aae10d3..b7e33ae 100644 --- a/vllm/transformers_utils/tokenizers/mistral.py +++ b/vllm/transformers_utils/tokenizers/mistral.py @@ -1,5 +1,5 @@ import os -import re +import regex as re from dataclasses import dataclass from pathlib import Path from typing import TYPE_CHECKING, Any, Dict, List, Optional, Union diff --git a/vllm/triton_utils/__init__.py b/vllm/triton_utils/__init__.py index 4e19581..80f7a32 100644 --- a/vllm/triton_utils/__init__.py +++ b/vllm/triton_utils/__init__.py @@ -2,8 +2,8 @@ from vllm.triton_utils.importing import HAS_TRITON __all__ = ["HAS_TRITON"] -#from vllm.triton_utils.custom_cache_manager import ( -# maybe_set_triton_cache_manager) -#from vllm.triton_utils.libentry import libentry +from vllm.triton_utils.custom_cache_manager import ( + maybe_set_triton_cache_manager) +from vllm.triton_utils.libentry import libentry __all__ += ["maybe_set_triton_cache_manager", "libentry"] diff --git a/vllm/triton_utils/__pycache__/__init__.cpython-310.pyc b/vllm/triton_utils/__pycache__/__init__.cpython-310.pyc index 9be72bcbf7409ee1eb3a5b81adb82dca57ee866d..1ddb7112f1770e107aef8ec0038e1eee53ab2db4 100644 GIT binary patch delta 61 zcmZ3+yoi}QpO=@50SFA&?%T+1!KmV>Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS PUr*D$wSKPNLu hzo4=tBR_BR2Sx)99uA-`HU mlB!#fn4F!Mo?5*54Wj`EA4n@310NI9KNd!||C=?qn%Mz!PZ?qW diff --git a/vllm/usage/__pycache__/__init__.cpython-310.pyc b/vllm/usage/__pycache__/__init__.cpython-310.pyc index 9320f07bf3dae4d1927cdb1e914ab152bc4c6f05..2ebb66338b879e3aec1c275882658fed4799782c 100644 GIT binary patch delta 59 zcmbQuIGvF@pO=@50SFA&?wiPMqhh6Bl3So(kXfKxl30|UTB2*7Tbhw;m|L!&lbNJn NP+5|ZpEogI2LSPh6662? delta 63 zcmbQvIGd3>pO=@50SGF$HB98T(Xi7mEiTf}$xlwq(a*_D(l4ki$;i($)-yEFFU~AU R)h$R&&Q45EEuNUI0{}gu6Z8N8 diff --git a/vllm/usage/__pycache__/usage_lib.cpython-310.pyc b/vllm/usage/__pycache__/usage_lib.cpython-310.pyc index 4c0bd297b9b47b8789f72d070b60cf898920155e..b7990bfe8df7e93ed79373dc420a58af55f406f5 100644 GIT binary patch delta 62 zcmZ2xvdDxxpO=@50SFA&?%T-C#H?biUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrE QFQ_cZ$j{p>&z8jw07SSG>i_@% delta 66 zcmZpb?v&=v=jG*M0D{VG4I8=NuxdE#mlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} Ur0NzVCTAz6rxtIPX3Js+0G6K=`v3p{ diff --git a/vllm/worker/__pycache__/cpu_enc_dec_model_runner.cpython-310.pyc b/vllm/worker/__pycache__/cpu_enc_dec_model_runner.cpython-310.pyc index 29b091e8443fbb7278b7afb65abc8c865a93df54..b6a4074f5ed9051e86cb497f28998dd6cc4eaf9a 100644 GIT binary patch delta 130 zcmX?Yf83rspO=@50SFA&?%T-S&!Xb3Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUr12KxYsRw8-ZJitoYf!^Qy?+*D$wSKPNLu zzo4=tBR_BRQ+8cJp){Z_4h{}RE@mD^4o0T`d`z3wB*VBFYbMvKcye$tGBL9JXJXlW ZLFE=VW7Ou=1}u!s9E>cRHyKW21pvm7B3l3e delta 130 zcmX?*cOs8FpO=@50SGF$HEiVG#IE73Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?5*5A-k@iNCr?R2L}fu7c&$##@^g8?Z1kvoW%5US&9q6#x~ZCC>l= diff --git a/vllm/worker/__pycache__/model_runner.cpython-310.pyc b/vllm/worker/__pycache__/model_runner.cpython-310.pyc index a8cef0115090758148acbc29f05f31cbbdd54a27..b85fb28f12bc42b8edce049d83ae1ab2df53dd6e 100644 GIT binary patch delta 826 zcmXAl?@Lor7{~8(ce`%$Zth3AN!B#QSYSiTEQBP)S7m8oKYZb3xur9=U2k`YaL__} zBUZ+F6_jq8mP#}|P6^72uq0D6%NPC&1yMl|r0bmPf&1lip6~ab=RBwHJOAe!pBc4S z%p6^%Pv@sHqo$%NpB7epN=PZu{Ax>3E2#*_TEnH`PG5WIicjg%TB8v%YUw;$(NEfkxeNiJ6hJC}RMWJuUQi z*^G>o3v{+16XgQ|R<|NEx^9w*E=L(i`3=#+=|Cr5fG=q>9 zLDJ;MKuf<@3OCjjpH~ zYLUayK(JlD8dW>}YCzUP;h_48x|?D&rYSLPGb0oUgqnlb)kWNK)`=esnfQMkemvCe zpmzn-n|Q~FiE9RRD(*p zzf0Xm`>L#;x{SpMFRZiaN%h1*fEgT_tmVG~zEPAz)+cKP@j1(V#>L6Iut8>%vf%l| WDh=$63ru>L^fH-YlEOz)8~*__Cjn&u delta 803 zcmXAlT}V@59LCT8?0B5}a&GBXO_v7df}Hk61eFlwMXR*PP>8kWTC?Hi*>*8HWFX!| zAIkr#sJUfH%OdsFB|&KfhGpvdFj#cawSnM8H#!zuDGs>KlX77ngl&F~&NQ-`a+Sh* zxrlO2JM#^)hH|aq7t318yA?LdI?DSME|K+=8x%Il2FgbjHp|77U4E{PZnQx*(#0ud zP%4*DZjEm2VHIVviLTtr#3Gw1`_O53KsRZ%uL7uvtMWscN&_Ok~0gTAG^-Dvd@YY4-~7T|dcPPu65$Zz^&$l;?qlBGLC2$l<{o zxe`7v{Nt%F^1>P~h$;hd+`J{gD4Fcvse?&ezHf&S)FuwW6dp^&;1#|}^ipmdD7Q=l z$K}LOEEP(Ao~6P7b67EWRy#*~q&-Z&W47OnI2hs=0H1HQkj)SE z^p@vw`=c>StN*1ii1LR9Zmo&=LJ4J7$456pp*489X=SG%m8tM<$P%%#(XV zZ~5ve#$!wf6Sk3~cs=%s8OkxfVsE+{7V&A?Q9i@mVJdB+HqajAm#N~}+s$JMk0 zz7X4!0{|1)HhdhGupwn7)59)7e90o8(KK=!zL5tbZo!^q&KdT53zKdpJxs=#WN^#G F(tp9B`#t~w diff --git a/vllm/worker/__pycache__/model_runner_base.cpython-310.pyc b/vllm/worker/__pycache__/model_runner_base.cpython-310.pyc index 370603046a1710e6fee45af8ca7c25a7102b4760..41fe8a49cffc39ef3b0ff5a687fec5f1853f8601 100644 GIT binary patch delta 82 zcmZ4LJ>Q!t<8 diff --git a/vllm/worker/__pycache__/multi_step_model_runner.cpython-310.pyc b/vllm/worker/__pycache__/multi_step_model_runner.cpython-310.pyc index 6a57eb8d25aa8eddcdf6599102014a11863cc4cc..b05eb7921051223be7d894fb810fa52447ac2649 100644 GIT binary patch delta 84 zcmdnCigD8_M(%uGUM>b8FkHKDBX=RIikE&#Zh?M5W`S-=Vo`c(iLQBWX-2MLZn=I= nW|DqEWl2VU-sUB&{Hk0$oIL-T7&-n|$xeb8sNB}Dk-Lyp!%x4oxJW-IKRGc+KPNLuzo4=tBR|hr&(J`> rII|>Gw;(Y&J25@Ac=G~QepN0mPQL$4j2!=~WG5HeiEcipm7)az-0~c! diff --git a/vllm/worker/__pycache__/multi_step_tpu_worker.cpython-310.pyc b/vllm/worker/__pycache__/multi_step_tpu_worker.cpython-310.pyc index 1ef4b4500051a0e2a11bbe9168af835c4f55ba12..fabe7d26906593e1ca833c2b56d760c29f196dc6 100644 GIT binary patch delta 62 zcmaDXa$kfypO=@50SFA&?%T-i#iZh)Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrqmBpO=@50SGF$HEiVeV$$%@FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` UN!2Y#OwLYBPc7bD$@GjJ0Hxm*+W-In diff --git a/vllm/worker/__pycache__/multi_step_worker.cpython-310.pyc b/vllm/worker/__pycache__/multi_step_worker.cpython-310.pyc index c55ecd058856d333f332be4692e780464ea4fa44..614441315574ed921b6dd82989dea1b78ea68898 100644 GIT binary patch delta 62 zcmZ3Yx~783vf delta 75 zcmZ4Ew!w`%pO=@50SGF$HEiV8W7Y7|FD)+8&&f|t%+b%uOwuo?EXl~vGuAUS&@av` dN!2Y#OwLYBPc7aY%j(0y%*M>Nc@1xaC;(%;7asrs diff --git a/vllm/worker/__pycache__/neuron_worker.cpython-310.pyc b/vllm/worker/__pycache__/neuron_worker.cpython-310.pyc index 5fac9ad7e3668493175f6445688d16ac51249598..9a00b6b8a20643972f9bbb38eca114afed95a77e 100644 GIT binary patch delta 62 zcmbQEG((9ypO=@50SFA&?%T*6#H!+;Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS QUrtF*E&TVwrqixQ>sFne9Id T6B{Gbf3|;2^EXF|TxSCS^&lf* diff --git a/vllm/worker/__pycache__/openvino_worker.cpython-310.pyc b/vllm/worker/__pycache__/openvino_worker.cpython-310.pyc index f6fa42e62d45d739c288c43d7f3fe265fe7c61b1..87ac044dbde79c49eb675618df5c76efdb9a6e8e 100644 GIT binary patch delta 109 zcmexW@u`A4pO=@50SFA&?%T+n&!OU^Uy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUr|L4NwywCmSOOaxw8R@-gzUZGOg~ug{ngD9flne&poY1IMTDW2wT88ZA&Vo6Gn=)@ERS{a9nmbNJl@S7Vr%sQ DO(-8D delta 105 zcmey^&G@yOkvpH4mx}=iDz`OkEFQ_cZ$j>v@Gc?dI z&MZmQEl5nxPE1cN-kiXmz$Z~?UBg_%BEnG1TEkkykj0V3nax^cR%ku>hG-U3VdZ8Q Hv90ITQ~>i_@% diff --git a/vllm/worker/__pycache__/utils.cpython-310.pyc b/vllm/worker/__pycache__/utils.cpython-310.pyc index a32a86afe93752d185436fc77fc68712acb206ac..6e964660335dced909561b2c3a8c38967739143d 100644 GIT binary patch delta 62 zcmZqYZsz9B=jG*M00P6c`!;fWv8Y(+m*f`c7i1RbmLwLXr*D$wSKPNLu zzo4=tBR_BQEk0Go36uDZIa&U5FflQ*{Aby0$A4K=MFD6K8xt23A0rnd3s4x9CC13| MkA-owrK*}301bm5_W%F@ delta 134 zcmcawcE5}}pO=@50SGF$HEiTw&Zl9kUs_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?1Nl8lNiTq{)ByjJcWqGyUgaW@2Re&$iiu|FWot3eY?@CN3r(pb!@m U3nL4VL}!aJas1n?uc{^n03IDB{r~^~ diff --git a/vllm/worker/__pycache__/worker_base.cpython-310.pyc b/vllm/worker/__pycache__/worker_base.cpython-310.pyc index b3bdfef68f53db7a922a235845895539b076d109..a1aec6a207a71c5191ec61b880c0f975b36776c5 100644 GIT binary patch delta 113 zcmdmAv9p3ZpO=@50SFA&?%T-yfmOv$za+OnzaX*D$wSKPNLu zzo4=tBR_AmGTSB<#)8S$v@Dsqn0O`&X>0RwFmW(40U^hK7M3cl$?sKVC*N1(*j%KY N$OKZe`I>Gf9{~HTA_4#a delta 101 zcmdm4vA=>lpO=@50SGF$HEiVmz^dV-Us_zGpOc@Qn4_PQnWSG(S(1^TXRK#vpkJI> zlB!#fn4F!Mo?5(Fo^6u~W6|VGT9(WlOnj61w6)pTn3(=?FmJZip1=eW+k8PclMeui Cz8>HJ diff --git a/vllm/worker/__pycache__/xpu_model_runner.cpython-310.pyc b/vllm/worker/__pycache__/xpu_model_runner.cpython-310.pyc index 8130605ff25d50a0e7f2d4a67f12d5cd8dc86f91..ee9897b6c218b4605f8450c1a73c84666af4de77 100644 GIT binary patch delta 87 zcmbPG*j31#&&$ij00f3>_if~6W>az2FUc*?FUTy=ElDg&Pc6|k&n?Z!HOwv7&&f>E pFQ_cZ$j{qs#`a2vnTLgCv$8Uy0AtK#RpVe54kjkX&2`2?tN?rw7_$HX delta 93 zcmeAwoKVP}&&$ij00foW8a8q>vuU{NmlhZ4=j10R=IG~SCg~ScmSp7T8S5Du=oe>} vr0NzVCTAz6rxtHEVtXaS%*DdCSzeh@fH7{eqH!=A8xzw%Cg#l*#zL$BAMYBu diff --git a/vllm/worker/__pycache__/xpu_worker.cpython-310.pyc b/vllm/worker/__pycache__/xpu_worker.cpython-310.pyc index 7b6f4180f589e608378e5cae24844e6391411bc4..c4cc9e5fe8405052f400833db9e8c675cbebf376 100644 GIT binary patch delta 104 zcmX@0zek@tpO=@50SFA&?%T-C$f07ZUy@s(Uyxa#Tas9mo?4=7o?DucYnWTEpOcxS zUrGB&Ah_r7#ZCs-x0aW?E^HZ$QDGnZr&rhgptv6a-w)V E0DKQ0tN;K2 delta 108 zcmdm^e?Xr*pO=@50SGF$HEiT&G>&78vL7#Te#-w?UV?F%%l$QDGnZQdcegptu} Ia;$hf01SU2EdT%j