File size: 1,955 Bytes
ffe59ba
 
 
 
 
4e0f10e
ffe59ba
 
 
 
 
 
 
 
 
 
 
 
 
 
4e0f10e
ffe59ba
 
 
 
 
 
 
 
 
 
 
 
 
 
4e0f10e
ffe59ba
 
 
 
 
 
 
 
 
 
 
4e0f10e
 
 
 
ffe59ba
4e0f10e
 
 
 
 
 
ffe59ba
 
 
4e0f10e
 
 
 
ffe59ba
4e0f10e
ffe59ba
4e0f10e
 
ffe59ba
 
 
4e0f10e
 
 
 
ffe59ba
4e0f10e
ffe59ba
4e0f10e
 
 
 
ffe59ba
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
[
  {
    "id": "receipt",
    "filename": "receipt.png",
    "label": "Grocery receipt",
    "description": "Printed receipt with line items, subtotal, tax, total. Donut on CORD reads this end-to-end.",
    "labels": [
      "merchant",
      "date",
      "line_item",
      "subtotal",
      "tax",
      "total",
      "payment_method"
    ]
  },
  {
    "id": "invoice",
    "filename": "invoice.png",
    "label": "Vendor invoice",
    "description": "Multi-column invoice with billing party, line items, subtotal, tax, total.",
    "labels": [
      "vendor",
      "invoice_number",
      "date",
      "due_date",
      "billing_party",
      "line_item",
      "total"
    ]
  },
  {
    "id": "business-card",
    "filename": "business-card.png",
    "label": "Business card",
    "description": "Tight layout, mixed text sizes, multiple contact fields. Good NER showcase.",
    "labels": [
      "company",
      "person",
      "role",
      "email",
      "phone",
      "address",
      "website"
    ]
  },
  {
    "id": "event-poster",
    "filename": "event-poster.png",
    "label": "Event poster",
    "description": "Large-text poster with title, date, artists, ticket info. Florence-2 OCR's home turf.",
    "labels": [
      "event",
      "date",
      "venue",
      "artist",
      "price",
      "organization"
    ]
  },
  {
    "id": "slide",
    "filename": "slide.png",
    "label": "Presentation slide",
    "description": "Roadmap slide with title and three numbered items. Clean printed text on a single background.",
    "labels": [
      "initiative",
      "person",
      "date",
      "quarter"
    ]
  },
  {
    "id": "letter",
    "filename": "letter.png",
    "label": "Business letter",
    "description": "Short printed business letter with sender, date, recipient, body, and signature.",
    "labels": [
      "company",
      "person",
      "address",
      "date",
      "amount",
      "phone"
    ]
  }
]