Support Accelerate for GLM
#2 opened by larrylawl
- modeling_glm.py +1 -0
modeling_glm.py
CHANGED
|
@@ -625,6 +625,7 @@ class GLMPreTrainedModel(PreTrainedModel):
|
|
| 625 |
base_model_prefix = "glm"
|
| 626 |
supports_gradient_checkpointing = True
|
| 627 |
_keys_to_ignore_on_load_missing = [r"position_ids"]
|
|
|
|
| 628 |
|
| 629 |
def _init_weights(self, module):
|
| 630 |
""" Initialize the weights """
|
|
|
|
| 625 |
base_model_prefix = "glm"
|
| 626 |
supports_gradient_checkpointing = True
|
| 627 |
_keys_to_ignore_on_load_missing = [r"position_ids"]
|
| 628 |
+
_no_split_modules = ["GLMBlock"]
|
| 629 |
|
| 630 |
def _init_weights(self, module):
|
| 631 |
""" Initialize the weights """
|