Upload folder using huggingface_hub
Browse files- README.md +2 -1
- model-00001-of-000001.safetensors +3 -0
- model.safetensors.index.json +0 -0
- modeling_deepseekocr.py +2 -2
README.md
CHANGED
|
@@ -16,7 +16,7 @@ license: mit
|
|
| 16 |
|
| 17 |
<div>
|
| 18 |
<p style="margin-top: 0;margin-bottom: 0;">
|
| 19 |
-
<em><a href="https://docs.unsloth.ai/
|
| 20 |
</p>
|
| 21 |
<div style="display: flex; gap: 5px; align-items: center; ">
|
| 22 |
<a href="https://github.com/unslothai/unsloth/">
|
|
@@ -32,6 +32,7 @@ license: mit
|
|
| 32 |
<h1 style="margin-top: 0rem;">✨ Read our DeepSeek-OCR Guide <a href="https://docs.unsloth.ai/new/deepseek-ocr">here</a>!</h1>
|
| 33 |
</div>
|
| 34 |
|
|
|
|
| 35 |
- Fine-tune DeepSeek-OCR for free using our [Google Colab notebook](https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Deepseek_OCR_(3B).ipynb)
|
| 36 |
- View the rest of our notebooks in our [docs here](https://docs.unsloth.ai/get-started/unsloth-notebooks).
|
| 37 |
|
|
|
|
| 16 |
|
| 17 |
<div>
|
| 18 |
<p style="margin-top: 0;margin-bottom: 0;">
|
| 19 |
+
<em>This DeepSeek-OCR upload was edited to enable inference & fine-tuning on the latest transformers (no accuracy change). <a href="https://docs.unsloth.ai/new/deepseek-ocr-run-and-fine-tune#fine-tuning-deepseek-ocr">Read more</a></em>
|
| 20 |
</p>
|
| 21 |
<div style="display: flex; gap: 5px; align-items: center; ">
|
| 22 |
<a href="https://github.com/unslothai/unsloth/">
|
|
|
|
| 32 |
<h1 style="margin-top: 0rem;">✨ Read our DeepSeek-OCR Guide <a href="https://docs.unsloth.ai/new/deepseek-ocr">here</a>!</h1>
|
| 33 |
</div>
|
| 34 |
|
| 35 |
+
- Thanks to [Prithiv's](https://huggingface.co/prithivMLmods/DeepSeek-OCR-Latest-BF16.I64) model modifications, which enable DeepSeek-OCR fine-tuning.
|
| 36 |
- Fine-tune DeepSeek-OCR for free using our [Google Colab notebook](https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Deepseek_OCR_(3B).ipynb)
|
| 37 |
- View the rest of our notebooks in our [docs here](https://docs.unsloth.ai/get-started/unsloth-notebooks).
|
| 38 |
|
model-00001-of-000001.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1169e7cdc28ff2fb6186556acb2175db148ad26a62097df4c45a17e523180d3f
|
| 3 |
+
size 6672547120
|
model.safetensors.index.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
modeling_deepseekocr.py
CHANGED
|
@@ -370,7 +370,7 @@ def decoder_layer_init(self, config: DeepseekV2Config, layer_idx: int):
|
|
| 370 |
DeepseekV2DecoderLayer.__init__ = decoder_layer_init
|
| 371 |
|
| 372 |
class DeepseekOCRConfig(DeepseekV2Config):
|
| 373 |
-
model_type = "
|
| 374 |
|
| 375 |
class DeepseekOCRModel(DeepseekV2Model):
|
| 376 |
config_class = DeepseekOCRConfig
|
|
@@ -1040,4 +1040,4 @@ class DeepseekOCRForCausalLM(DeepseekV2ForCausalLM):
|
|
| 1040 |
plt.savefig(f'{output_path}/geo.jpg')
|
| 1041 |
plt.close()
|
| 1042 |
|
| 1043 |
-
result.save(f"{output_path}/result_with_boxes.jpg")
|
|
|
|
| 370 |
DeepseekV2DecoderLayer.__init__ = decoder_layer_init
|
| 371 |
|
| 372 |
class DeepseekOCRConfig(DeepseekV2Config):
|
| 373 |
+
model_type = "deepseek_ocr"
|
| 374 |
|
| 375 |
class DeepseekOCRModel(DeepseekV2Model):
|
| 376 |
config_class = DeepseekOCRConfig
|
|
|
|
| 1040 |
plt.savefig(f'{output_path}/geo.jpg')
|
| 1041 |
plt.close()
|
| 1042 |
|
| 1043 |
+
result.save(f"{output_path}/result_with_boxes.jpg")
|