duzx16
committed on
Commit
·
047c657
1
Parent(s):
27f8067
Fix past_key_values
Browse files- modeling_chatglm.py +2 -1
modeling_chatglm.py
CHANGED
|
@@ -932,9 +932,10 @@ class ChatGLMForConditionalGeneration(ChatGLMPreTrainedModel):
|
|
| 932 |
standardize_cache_format: bool = False,
|
| 933 |
) -> Dict[str, Any]:
|
| 934 |
# update past_key_values
|
| 935 |
-
|
| 936 |
outputs, standardize_cache_format=standardize_cache_format
|
| 937 |
)
|
|
|
|
| 938 |
|
| 939 |
# update attention mask
|
| 940 |
if "attention_mask" in model_kwargs:
|
|
|
|
| 932 |
standardize_cache_format: bool = False,
|
| 933 |
) -> Dict[str, Any]:
|
| 934 |
# update past_key_values
|
| 935 |
+
cache_name, cache = self._extract_past_from_model_output(
|
| 936 |
outputs, standardize_cache_format=standardize_cache_format
|
| 937 |
)
|
| 938 |
+
model_kwargs[cache_name] = cache
|
| 939 |
|
| 940 |
# update attention mask
|
| 941 |
if "attention_mask" in model_kwargs:
|