Add technical report link and text improvements
#2
by
nlivathinos
- opened
README.md
CHANGED
|
@@ -2,19 +2,16 @@
|
|
| 2 |
license: apache-2.0
|
| 3 |
---
|
| 4 |
|
| 5 |
-
|
| 6 |
|
|
|
|
| 7 |
|
| 8 |
-
|
| 9 |
|
| 10 |
-
|
| 11 |
|
| 12 |
-
The model has been trained from scratch on a mix of document datasets.
|
| 13 |
|
| 14 |
-
|
| 15 |
-
|
| 16 |
-
|
| 17 |
-
# Inference code example
|
| 18 |
|
| 19 |
Prerequisites:
|
| 20 |
|
|
@@ -85,9 +82,19 @@ for result in results:
|
|
| 85 |
```
|
| 86 |
|
| 87 |
|
| 88 |
-
|
| 89 |
|
| 90 |
```
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 91 |
@techreport{Docling,
|
| 92 |
author = {Deep Search Team},
|
| 93 |
month = {8},
|
|
@@ -98,16 +105,5 @@ for result in results:
|
|
| 98 |
version = {1.0.0},
|
| 99 |
year = {2024}
|
| 100 |
}
|
| 101 |
-
|
| 102 |
-
@misc{lv2024rtdetrv2improvedbaselinebagoffreebies,
|
| 103 |
-
title={RT-DETRv2: Improved Baseline with Bag-of-Freebies for Real-Time Detection Transformer},
|
| 104 |
-
author={Wenyu Lv and Yian Zhao and Qinyao Chang and Kui Huang and Guanzhong Wang and Yi Liu},
|
| 105 |
-
year={2024},
|
| 106 |
-
eprint={2407.17140},
|
| 107 |
-
archivePrefix={arXiv},
|
| 108 |
-
primaryClass={cs.CV},
|
| 109 |
-
url={https://arxiv.org/abs/2407.17140},
|
| 110 |
-
}
|
| 111 |
-
|
| 112 |
```
|
| 113 |
|
|
|
|
| 2 |
license: apache-2.0
|
| 3 |
---
|
| 4 |
|
| 5 |
+
# Document Layout Analysis "heron-101"
|
| 6 |
|
| 7 |
+
**`heron-101`** is a Document Layout Analysis Model used in the [Docling project](https://github.com/docling-project/docling).
|
| 8 |
|
| 9 |
+
For an in-depth description of the **model architecture**, **training datasets**, and **evaluation methodology**, please refer to our technical report:
|
| 10 |
|
| 11 |
+
For an in-depth description of the model architecture, training datasets, and evaluation methodology, please refer to our technical report: **"Advanced Layout Analysis Models for Docling"**, Nikolaos Livathinos *et al.*, [arXiv:2509.11720](https://arxiv.org/abs/2509.11720).
|
| 12 |
|
|
|
|
| 13 |
|
| 14 |
+
## Inference code example
|
|
|
|
|
|
|
|
|
|
| 15 |
|
| 16 |
Prerequisites:
|
| 17 |
|
|
|
|
| 82 |
```
|
| 83 |
|
| 84 |
|
| 85 |
+
## References
|
| 86 |
|
| 87 |
```
|
| 88 |
+
@misc{livathinos2025advancedlayoutanalysismodels,
|
| 89 |
+
title={Advanced Layout Analysis Models for {Docling}},
|
| 90 |
+
author={Nikolaos Livathinos and Christoph Auer and Ahmed Nassar and Rafael Teixeira de Lima and Maksym Lysak and Brown Ebouky and Cesar Berrospi and Michele Dolfi and Panagiotis Vagenas and Matteo Omenetti and Kasper Dinkla and Yusik Kim and Valery Weber and Lucas Morin and Ingmar Meijer and Viktor Kuropiatnyk and Tim Strohmeyer and A. Said Gurbuz and Peter W. J. Staar},
|
| 91 |
+
year={2025},
|
| 92 |
+
eprint={2509.11720},
|
| 93 |
+
archivePrefix={arXiv},
|
| 94 |
+
primaryClass={cs.CV},
|
| 95 |
+
url={https://arxiv.org/abs/2509.11720},
|
| 96 |
+
}
|
| 97 |
+
|
| 98 |
@techreport{Docling,
|
| 99 |
author = {Deep Search Team},
|
| 100 |
month = {8},
|
|
|
|
| 105 |
version = {1.0.0},
|
| 106 |
year = {2024}
|
| 107 |
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 108 |
```
|
| 109 |
|