Spaces:
				
			
			
	
			
			
		Runtime error
		
	
	
	
			
			
	
	
	
	
		
		
		Runtime error
		
	Commit · 71b2a17
	
1
								Parent(s): c749499
								
Add cumulative token count
Browse files
- tapas_visualizer.py (+7 -3)
    	
        tapas_visualizer.py
    CHANGED
    
    | @@ -115,7 +115,7 @@ class TapasVisualizer: | |
| 115 | 
             
                        token_text = self.tokenizer._convert_id_to_token(input_id)
         | 
| 116 | 
             
                        cell_tokens[(row_id, col_id)].append(token_text)
         | 
| 117 |  | 
| 118 | 
            -
                     | 
| 119 | 
             
                    header_row_html = ""
         | 
| 120 | 
             
                    header_row_token_cnt = 0
         | 
| 121 | 
             
                    for col_id, col in enumerate(table.columns, start=1):
         | 
| @@ -124,7 +124,9 @@ class TapasVisualizer: | |
| 124 | 
             
                        cell_html = "".join(span_htmls)
         | 
| 125 | 
             
                        header_row_html += f"<th>{cell_html}</th>"
         | 
| 126 | 
             
                        header_row_token_cnt += len(cur_cell_tokens)
         | 
| 127 | 
            -
                     | 
|  | |
|  | |
| 128 | 
             
                    header_row_html = f'<tr>{header_row_html}</tr>'
         | 
| 129 |  | 
| 130 | 
             
                    table_vals = table.values
         | 
| @@ -140,7 +142,9 @@ class TapasVisualizer: | |
| 140 | 
             
                            cell_html = "".join(span_htmls)
         | 
| 141 | 
             
                            row_html += f"<td>{cell_html}</td>"
         | 
| 142 | 
             
                            row_token_cnt += len(cur_cell_tokens)
         | 
| 143 | 
            -
                         | 
|  | |
|  | |
| 144 | 
             
                        table_html += f'<tr>{row_html}</tr>'
         | 
| 145 |  | 
| 146 | 
             
                    table_html = f'<table>{table_html}</table>'
         | 
|  | |
| 115 | 
             
                        token_text = self.tokenizer._convert_id_to_token(input_id)
         | 
| 116 | 
             
                        cell_tokens[(row_id, col_id)].append(token_text)
         | 
| 117 |  | 
| 118 | 
            +
                    cumulative_cnt = 0
         | 
| 119 | 
             
                    header_row_html = ""
         | 
| 120 | 
             
                    header_row_token_cnt = 0
         | 
| 121 | 
             
                    for col_id, col in enumerate(table.columns, start=1):
         | 
|  | |
| 124 | 
             
                        cell_html = "".join(span_htmls)
         | 
| 125 | 
             
                        header_row_html += f"<th>{cell_html}</th>"
         | 
| 126 | 
             
                        header_row_token_cnt += len(cur_cell_tokens)
         | 
| 127 | 
            +
                    cumulative_cnt += header_row_token_cnt
         | 
| 128 | 
            +
                    cnt_str = f'{header_row_token_cnt} | {cumulative_cnt}'
         | 
| 129 | 
            +
                    header_row_html += f'<th style="border: none;">{self.style_span(cnt_str, ["non-token", "count"])}</th>'
         | 
| 130 | 
             
                    header_row_html = f'<tr>{header_row_html}</tr>'
         | 
| 131 |  | 
| 132 | 
             
                    table_vals = table.values
         | 
|  | |
| 142 | 
             
                            cell_html = "".join(span_htmls)
         | 
| 143 | 
             
                            row_html += f"<td>{cell_html}</td>"
         | 
| 144 | 
             
                            row_token_cnt += len(cur_cell_tokens)
         | 
| 145 | 
            +
                        cumulative_cnt += row_token_cnt
         | 
| 146 | 
            +
                        cnt_str = f'{row_token_cnt} | {cumulative_cnt}'
         | 
| 147 | 
            +
                        row_html += f'<td style="border: none;">{self.style_span(cnt_str, ["non-token", "count"])}</td>'
         | 
| 148 | 
             
                        table_html += f'<tr>{row_html}</tr>'
         | 
| 149 |  | 
| 150 | 
             
                    table_html = f'<table>{table_html}</table>'
         |