specsGuy
/

Deepseek-ocr

Image-Text-to-Text

feature-extraction

vision-language

Model card Files Files and versions

specsGuy committed on Nov 14, 2025

Commit

a50cbc5

·

verified ·

1 Parent(s): 8ae2e57

Update modeling_deepseekocr.py

Files changed (1) hide show

modeling_deepseekocr.py +1 -1

modeling_deepseekocr.py CHANGED Viewed

@@ -620,7 +620,7 @@ class DeepseekOCRForCausalLM(DeepseekV2ForCausalLM):
         if past_key_values is not None:
             if isinstance(past_key_values, Cache):
                 cache_length = past_key_values.get_seq_length()
-                past_length = past_key_values.seen_tokens
                 max_cache_length = past_key_values.get_max_length()
             else:
                 cache_length = past_length = past_key_values[0][0].shape[2]

         if past_key_values is not None:
             if isinstance(past_key_values, Cache):
                 cache_length = past_key_values.get_seq_length()
+                past_length = getattr(past_key_values, "seen_tokens", cache_length)
                 max_cache_length = past_key_values.get_max_length()
             else:
                 cache_length = past_length = past_key_values[0][0].shape[2]