[Model] Support Meituan LongCat-Flash && LongCat-Flash-MTP (#9824)
This commit is contained in:
@@ -307,7 +307,10 @@ class ModelRunner:
|
||||
model_num_layers = (
|
||||
self.model_config.num_nextn_predict_layers
|
||||
if self.is_draft_worker and model_has_mtp_layers
|
||||
- else self.model_config.num_hidden_layers
|
||||
+ else max(
|
||||
+ self.model_config.num_hidden_layers,
|
||||
+ self.model_config.num_attention_layers,
|
||||
+ )
|
||||
)
|
||||
self.start_layer = getattr(self.model, "start_layer", 0)
|
||||
self.end_layer = getattr(self.model, "end_layer", model_num_layers)
|
||||
|
||||
Reference in New Issue
Block a user