THUDM
/

glm-10b-chinese

Feature Extraction

Model card · Files and versions · Community

Support accelerate for GLM

#2

by larrylawl - opened Apr 5, 2023

base: refs/heads/main

←

from: refs/pr/2

Discussion Files changed

Files changed (1) hide show

modeling_glm.py +1 -0

modeling_glm.py CHANGED Viewed

@@ -625,6 +625,7 @@ class GLMPreTrainedModel(PreTrainedModel):
     base_model_prefix = "glm"
     supports_gradient_checkpointing = True
     _keys_to_ignore_on_load_missing = [r"position_ids"]
     def _init_weights(self, module):
         """ Initialize the weights """

     base_model_prefix = "glm"
     supports_gradient_checkpointing = True
     _keys_to_ignore_on_load_missing = [r"position_ids"]
+    _no_split_modules = ["GLMBlock"]
     def _init_weights(self, module):
         """ Initialize the weights """