Spaces:

dejanseo
/

linkbert

Running

dejanseo committed on May 2

Commit

266743a

•

1 Parent(s): d598c67

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -87,20 +87,22 @@ def process_text(inputs: str, confidence_threshold: float):
         for word_start in sorted(word_info.keys()):
             word_data = word_info[word_start]
             for subtoken_start, subtoken_end, subtoken_text in word_data['subtokens']:
                 if last_end < subtoken_start:
                     reconstructed_text += chunk[last_end:subtoken_start]
                 if word_data['prediction'] == 1:
-                    reconstructed_text += f"<span style='background-color: rgba(0, 255, 0); display: inline;'>{subtoken_text.replace('$', '\\$')}</span>"
                 else:
-                    reconstructed_text += subtoken_text.replace('$', '\\$')
                 last_end = subtoken_end
-                df_data['Word'].append(subtoken_text.replace('$', '\\$'))
                 df_data['Prediction'].append(word_data['prediction'])
                 df_data['Confidence'].append(word_info[word_start]['confidence'])
                 df_data['Start'].append(subtoken_start + original_position_offset)
                 df_data['End'].append(subtoken_end + original_position_offset)
             original_position_offset += len(chunk) + 1
         reconstructed_text += chunk[last_end:].replace('$', '\\$')

         for word_start in sorted(word_info.keys()):
             word_data = word_info[word_start]
             for subtoken_start, subtoken_end, subtoken_text in word_data['subtokens']:
+                escaped_subtoken_text = subtoken_text.replace('$', '\\$')  # Perform replacement outside f-string
                 if last_end < subtoken_start:
                     reconstructed_text += chunk[last_end:subtoken_start]
                 if word_data['prediction'] == 1:
+                    reconstructed_text += f"<span style='background-color: rgba(0, 255, 0); display: inline;'>{escaped_subtoken_text}</span>"
                 else:
+                    reconstructed_text += escaped_subtoken_text
                 last_end = subtoken_end
+                df_data['Word'].append(escaped_subtoken_text)
                 df_data['Prediction'].append(word_data['prediction'])
                 df_data['Confidence'].append(word_info[word_start]['confidence'])
                 df_data['Start'].append(subtoken_start + original_position_offset)
                 df_data['End'].append(subtoken_end + original_position_offset)
             original_position_offset += len(chunk) + 1
         reconstructed_text += chunk[last_end:].replace('$', '\\$')