anamargarida committed on
Commit
7538da0
·
verified ·
1 Parent(s): 2cbd71b

Rename app_25.py to app_26.py

Browse files
Files changed (1) hide show
  1. app_25.py → app_26.py +39 -2
app_25.py → app_26.py RENAMED
@@ -294,12 +294,49 @@ def extract_arguments(text, tokenizer, model, beam_search=True):
294
 
295
  return annotated_text
296
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
297
 
298
 
299
 
300
  # Apply the tags to the sentence tokens
301
- tagged_sentence1 = add_tags_offset(input_text, start_cause1, end_cause1, start_effect1, end_effect1, start_signal, end_signal)
302
- tagged_sentence2 = add_tags_offset(input_text, start_cause2, end_cause2, start_effect2, end_effect2, start_signal, end_signal)
303
  return tagged_sentence1, tagged_sentence2
304
 
305
 
 
294
 
295
  return annotated_text
296
 
297
def add_tags_offset_2(text, start_cause, end_cause, start_effect, end_effect, start_signal, end_signal, mapping=None):
    """
    Insert <ARG0>/<ARG1>/<SIG0> tags into the original text based on token offsets.

    Args:
        text (str): The original input text.
        start_cause (int): Start token index of the cause span.
        end_cause (int): End token index of the cause span.
        start_effect (int): Start token index of the effect span.
        end_effect (int): End token index of the effect span.
        start_signal (int or None): Start token index of the signal span.
        end_signal (int or None): End token index of the signal span.
        mapping (list of (int, int) tuples, optional): Maps token indices to
            character spans. When omitted, falls back to the ``offset_mapping``
            variable from the enclosing scope (this function is defined inside
            ``extract_arguments``), preserving the original behaviour.

    Returns:
        str: The modified text with annotated spans.
    """
    # Backward-compatible fallback: the original implementation read
    # ``offset_mapping`` straight from the enclosing function's scope even
    # though the docstring listed it as an argument. Accepting it explicitly
    # makes the function self-contained and testable.
    if mapping is None:
        mapping = offset_mapping

    # Convert token indices to character indices for the spans to annotate.
    spans = [
        (mapping[start_cause][0], mapping[end_cause][1], "<ARG0>", "</ARG0>"),
        (mapping[start_effect][0], mapping[end_effect][1], "<ARG1>", "</ARG1>"),
    ]

    # Include signal tags only when a signal span was detected.
    if start_signal is not None and end_signal is not None:
        spans.append((mapping[start_signal][0], mapping[end_signal][1], "<SIG0>", "</SIG0>"))

    # Insert from right to left so earlier character offsets remain valid
    # after each insertion.
    spans.sort(reverse=True, key=lambda x: x[0])

    for start, end, open_tag, close_tag in spans:
        text = text[:start] + open_tag + text[start:end] + close_tag + text[end:]

    return text
334
 
335
 
336
 
337
  # Apply the tags to the sentence tokens
338
+ tagged_sentence1 = add_tags_offset_2(input_text, start_cause1, end_cause1, start_effect1, end_effect1, start_signal, end_signal)
339
+ tagged_sentence2 = add_tags_offset_2(input_text, start_cause2, end_cause2, start_effect2, end_effect2, start_signal, end_signal)
340
  return tagged_sentence1, tagged_sentence2
341
 
342