Spaces: Runtime error
Commit
·
71b2a17
1
Parent(s):
c749499
Add cumulative token count
Browse files
Files changed: tapas_visualizer.py (+7 -3)
tapas_visualizer.py
CHANGED
|
@@ -115,7 +115,7 @@ class TapasVisualizer:
|
|
| 115 |
token_text = self.tokenizer._convert_id_to_token(input_id)
|
| 116 |
cell_tokens[(row_id, col_id)].append(token_text)
|
| 117 |
|
| 118 |
-
|
| 119 |
header_row_html = ""
|
| 120 |
header_row_token_cnt = 0
|
| 121 |
for col_id, col in enumerate(table.columns, start=1):
|
|
@@ -124,7 +124,9 @@ class TapasVisualizer:
|
|
| 124 |
cell_html = "".join(span_htmls)
|
| 125 |
header_row_html += f"<th>{cell_html}</th>"
|
| 126 |
header_row_token_cnt += len(cur_cell_tokens)
|
| 127 |
-
|
|
|
|
|
|
|
| 128 |
header_row_html = f'<tr>{header_row_html}</tr>'
|
| 129 |
|
| 130 |
table_vals = table.values
|
|
@@ -140,7 +142,9 @@ class TapasVisualizer:
|
|
| 140 |
cell_html = "".join(span_htmls)
|
| 141 |
row_html += f"<td>{cell_html}</td>"
|
| 142 |
row_token_cnt += len(cur_cell_tokens)
|
| 143 |
-
|
|
|
|
|
|
|
| 144 |
table_html += f'<tr>{row_html}</tr>'
|
| 145 |
|
| 146 |
table_html = f'<table>{table_html}</table>'
|
|
|
|
| 115 |
token_text = self.tokenizer._convert_id_to_token(input_id)
|
| 116 |
cell_tokens[(row_id, col_id)].append(token_text)
|
| 117 |
|
| 118 |
+
cumulative_cnt = 0
|
| 119 |
header_row_html = ""
|
| 120 |
header_row_token_cnt = 0
|
| 121 |
for col_id, col in enumerate(table.columns, start=1):
|
|
|
|
| 124 |
cell_html = "".join(span_htmls)
|
| 125 |
header_row_html += f"<th>{cell_html}</th>"
|
| 126 |
header_row_token_cnt += len(cur_cell_tokens)
|
| 127 |
+
cumulative_cnt += header_row_token_cnt
|
| 128 |
+
cnt_str = f'{header_row_token_cnt} | {cumulative_cnt}'
|
| 129 |
+
header_row_html += f'<th style="border: none;">{self.style_span(cnt_str, ["non-token", "count"])}</th>'
|
| 130 |
header_row_html = f'<tr>{header_row_html}</tr>'
|
| 131 |
|
| 132 |
table_vals = table.values
|
|
|
|
| 142 |
cell_html = "".join(span_htmls)
|
| 143 |
row_html += f"<td>{cell_html}</td>"
|
| 144 |
row_token_cnt += len(cur_cell_tokens)
|
| 145 |
+
cumulative_cnt += row_token_cnt
|
| 146 |
+
cnt_str = f'{row_token_cnt} | {cumulative_cnt}'
|
| 147 |
+
row_html += f'<td style="border: none;">{self.style_span(cnt_str, ["non-token", "count"])}</td>'
|
| 148 |
table_html += f'<tr>{row_html}</tr>'
|
| 149 |
|
| 150 |
table_html = f'<table>{table_html}</table>'
|