From 5ae24d0620bd79582a35252adeabe96353efad4f Mon Sep 17 00:00:00 2001 From: ai-modelscope Date: Wed, 23 Apr 2025 21:11:53 +0800 Subject: [PATCH] Add supports_gradient_checkpointing --- README.md | 1 + 1 file changed, 1 insertion(+) diff --git a/README.md b/README.md index cdd5c6f..25fc446 100644 --- a/README.md +++ b/README.md @@ -138,6 +138,7 @@ def split_model(model_name): device_map['language_model.model.embed_tokens'] = 0 device_map['language_model.output'] = 0 device_map['language_model.model.norm'] = 0 + device_map['language_model.model.rotary_emb'] = 0 device_map['language_model.lm_head'] = 0 device_map[f'language_model.model.layers.{num_layers - 1}'] = 0