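Support accelerate for GLM
#2, opened by larrylawl
This change adds one class attribute, `_no_split_modules = ["GLMBlock"]`, to `GLMPreTrainedModel` in modeling_glm.py.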
Files changed: modeling_glm.py (+1 -0)
@@ -625,6 +625,7 @@ class GLMPreTrainedModel(PreTrainedModel):
|
|
625 |
base_model_prefix = "glm"
|
626 |
supports_gradient_checkpointing = True
|
627 |
_keys_to_ignore_on_load_missing = [r"position_ids"]
|
|
|
628 |
|
629 |
def _init_weights(self, module):
|
630 |
""" Initialize the weights """
|
|
|
625 |
base_model_prefix = "glm"
|
626 |
supports_gradient_checkpointing = True
|
627 |
_keys_to_ignore_on_load_missing = [r"position_ids"]
|
628 |
+
_no_split_modules = ["GLMBlock"]
|
629 |
|
630 |
def _init_weights(self, module):
|
631 |
""" Initialize the weights """
|