allenai
/

Molmo-7B-D-0924

Image-Text-to-Text

text-generation

Model card Files and versions Community

soldni committed on Sep 25

Commit

f75a7cd

•

1 Parent(s): 27a76be

Update modeling_molmo.py

Files changed (1) hide show

modeling_molmo.py +3 -3

modeling_molmo.py CHANGED Viewed

@@ -2509,7 +2509,6 @@ class MOLMoForCausalLM(PreTrainedModel):
         outputs: ModelOutput,
         model_kwargs: Dict[str, Any],
         is_encoder_decoder: bool = False,
-        standardize_cache_format: bool = False,
         num_new_tokens: int = 1,
     ) -> Dict[str, Any]:
         if self.config.use_position_ids:
@@ -2520,8 +2519,9 @@ class MOLMoForCausalLM(PreTrainedModel):
                 del model_kwargs["images"]
                 del model_kwargs["image_masks"]
                 del model_kwargs["image_input_idx"]
-        model_kwargs = super()._update_model_kwargs_for_generation(
-            outputs, model_kwargs, is_encoder_decoder, standardize_cache_format, num_new_tokens)
         return model_kwargs
     # TODO: these are required to make the implementation complete.

         outputs: ModelOutput,
         model_kwargs: Dict[str, Any],
         is_encoder_decoder: bool = False,
         num_new_tokens: int = 1,
     ) -> Dict[str, Any]:
         if self.config.use_position_ids:
                 del model_kwargs["images"]
                 del model_kwargs["image_masks"]
                 del model_kwargs["image_input_idx"]
+        cache_name, cache = super()._extract_past_from_model_output(outputs)
+        model_kwargs[cache_name] = cache
+        model_kwargs["cache_position"] = model_kwargs["cache_position"][-1:] + num_new_tokens
         return model_kwargs
     # TODO: these are required to make the implementation complete.