runninglsy committed on
Commit
5a7a90f
·
verified ·
1 Parent(s): 6407cfd

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -66,7 +66,7 @@ class OvisOCRParser:
66
  gpu_memory_utilization=0.8,
67
  )
68
 
69
- prompt = 'Extract all readable content from the image in natural human reading order and output the result as a single Markdown document. For charts or images, represent them using an HTML image tag: <img src="images/bbox_{left}_{top}_{right}_{bottom}.jpg" />, where left, top, right, bottom are bounding box coordinates scaled to [0, 1000). Format formulas as LaTeX. Format tables as HTML: <table>...</table>. Transcribe all other text as standard Markdown. Preserve the original text without translation or paraphrasing.'
70
  self.prompt = self.model.get_tokenizer().apply_chat_template(
71
  [{"role": "user", "content": f"<image>\n{prompt}"}],
72
  tokenize=False,
 
66
  gpu_memory_utilization=0.8,
67
  )
68
 
69
+ prompt = 'Extract all readable content from the image in natural human reading order and output the result as a single Markdown document. For charts or images, represent them using an HTML image tag: <' + 'img src="images/bbox_{left}_{top}_{right}_{bottom}.jpg" />, where left, top, right, bottom are bounding box coordinates scaled to [0, 1000). Format formulas as LaTeX. Format tables as HTML: <table>...</table>. Transcribe all other text as standard Markdown. Preserve the original text without translation or paraphrasing.'
70
  self.prompt = self.model.get_tokenizer().apply_chat_template(
71
  [{"role": "user", "content": f"<image>\n{prompt}"}],
72
  tokenize=False,