Upgrade to vllm 0.17.0 corex v4.1 overlay
This commit is contained in:
@@ -311,8 +311,9 @@ class AutoWeightsLoader:
|
||||
|
||||
continue
|
||||
|
||||
named_parameters = module.named_parameters(recurse=True)
|
||||
desc_param_keys = {
|
||||
base_prefix + k for k, _ in module.named_parameters(recurse=True)
|
||||
maybe_prefix(base_prefix, k) for k, _ in named_parameters
|
||||
}
|
||||
msg = (
|
||||
f"There is no module or parameter named {prefix!r} "
|
||||
@@ -874,16 +875,3 @@ def get_layer_index(feature_layer_index: int, num_hidden_layers: int) -> int:
|
||||
if feature_layer_index < 0:
|
||||
return num_hidden_layers + feature_layer_index + 1
|
||||
return feature_layer_index
|
||||
|
||||
|
||||
from vllm.model_executor.layers.quantization.compressed_tensors.utils import should_ignore_layer
|
||||
|
||||
def reparse_quant_config(prefix: str, quant_config):
    """Return the quantization config to use for the layer named ``prefix``.

    The config is handed back unchanged when it exposes no ``ignore``
    attribute or when that attribute is falsy (``None``, empty, ...).
    Otherwise ``prefix`` is checked against the ignore entries with
    ``should_ignore_layer``: a match yields ``None``, anything else yields
    the original ``quant_config``.
    """
    ignored_layers = getattr(quant_config, "ignore", None)
    # Short-circuit: should_ignore_layer is only consulted when the config
    # actually lists something to ignore.
    if ignored_layers and should_ignore_layer(prefix, ignored_layers):
        return None
    return quant_config
|
||||
Reference in New Issue
Block a user