THUDM/cogvlm2-video-llama3-chat

Text Generation

Model card Files Files and versions Community

zR committed on Jul 24

Commit

f375ead

•

1 Parent(s): ca14f13

update

Files changed (3) hide show

config.json +1 -1
generation_config.json +1 -1
modeling_cogvlm.py +3 -1

config.json CHANGED Viewed

@@ -21,7 +21,7 @@
   "template_version": "base",
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.41.0",
   "use_cache": true,
   "vision_config": {
     "dropout_prob": 0.0,

   "template_version": "base",
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
+  "transformers_version": "4.43.1",
   "use_cache": true,
   "vision_config": {
     "dropout_prob": 0.0,

generation_config.json CHANGED Viewed

@@ -7,5 +7,5 @@
   "max_length": 2048,
   "top_p": 0.1,
   "top_k": 1,
-  "transformers_version": "4.41.0"
 }

   "max_length": 2048,
   "top_p": 0.1,
   "top_k": 1,
+  "transformers_version": "4.43.1"
 }

modeling_cogvlm.py CHANGED Viewed

@@ -723,9 +723,11 @@ class CogVLMVideoForCausalLM(CogVLMPreTrainedModel):
             standardize_cache_format: bool = False,
     ) -> Dict[str, Any]:
         # update past_key_values
-        model_kwargs["past_key_values"] = self._extract_past_from_model_output(
             outputs, standardize_cache_format=standardize_cache_format
         )
         if getattr(outputs, "state", None) is not None:
             model_kwargs["state"] = outputs.state

             standardize_cache_format: bool = False,
     ) -> Dict[str, Any]:
         # update past_key_values
+        cache_name, cache = self._extract_past_from_model_output(
             outputs, standardize_cache_format=standardize_cache_format
         )
+        model_kwargs[cache_name] = cache
         if getattr(outputs, "state", None) is not None:
             model_kwargs["state"] = outputs.state