Spaces:

shroom-semeval25
/

cogumelo-visualizer

Sleeping

App Files Files Community

acmc committed on Nov 14, 2024

Commit

a85555b

verified ·

1 Parent(s): 82a1f36

Update visualize.py

Browse files

Files changed (1) hide show

visualize.py +193 -37

visualize.py CHANGED Viewed

@@ -91,31 +91,22 @@ def show_hallucinations(element):
     ]
-prediction_model = transformers.AutoModelForTokenClassification.from_pretrained(
     "shroom-semeval25/cogumelo-hallucinations-detector-roberta-base"
 )
-prediction_tokenizer = transformers.AutoTokenizer.from_pretrained(
     "shroom-semeval25/cogumelo-hallucinations-detector-roberta-base"
 )
-def predict_hallucinations(hallucinated_text: str):
-    """The model will return 0 if it's not a hallucination, 1 if it is the beginning of a hallucination, and 2 if it's the continuation of a hallucination"""
-    hallucinated_tokens = prediction_tokenizer(
-        hallucinated_text,
-        return_offsets_mapping=True,
-        add_special_tokens=True,
-        return_tensors="pt",
     )
-    inputs = {
-        "input_ids": hallucinated_tokens["input_ids"],
-        "attention_mask": hallucinated_tokens["attention_mask"],
-    }
-    with torch.no_grad():
-        outputs = prediction_model(**inputs)
     # Get the highest value for each token
-    predictions = outputs.logits.argmax(dim=-1).squeeze(0).tolist()
     entities = []
     current_entity = None
     for i, prediction in enumerate(predictions):
@@ -129,20 +120,18 @@ def predict_hallucinations(hallucinated_text: str):
                 entities.append(current_entity)
             current_entity = {
                 "entity": "hal",
-                "start": hallucinated_tokens["offset_mapping"][0][i][0],
-                "end": hallucinated_tokens["offset_mapping"][0][i][1] + 1,
             }
         if prediction == 2:
             if current_entity is None:
                 current_entity = {
                     "entity": "hal",
-                    "start": hallucinated_tokens["offset_mapping"][0][i][0],
-                    "end": hallucinated_tokens["offset_mapping"][0][i][1] + 1,
                 }
             else:
-                current_entity["end"] = (
-                    hallucinated_tokens["offset_mapping"][0][i][1] + 1
-                )
     if current_entity is not None:
         entities.append(current_entity)
     return {
@@ -157,14 +146,150 @@ def update_selection(evt: gr.SelectData):
     # Run the two functions
     json_example, original_text, highlighted_text = show_hallucinations(element)
     try:
-        highlighted_text_predicted = predict_hallucinations(
-            element["hallucinated_answer_generated"]
         )
     except Exception as e:
         logging.exception(f"An error occurred: {e}")
         gr.Error(f"An error occurred: {e}")
-        highlighted_text_predicted = {"text": "", "entities": []}
-    return json_example, original_text, highlighted_text, highlighted_text_predicted
 with gr.Blocks(title="Hallucinations Explorer") as demo:
@@ -186,8 +311,13 @@ _SHROOM '25: Detection of Hallucinated Content_
         color_map={"+": "red", "-": "blue", "hal": "red"},
         combine_adjacent=True,
     )
-    highlighted_text_predicted = gr.HighlightedText(
-        label="Predicted Hallucinations",
         color_map={"+": "red", "-": "blue", "hal": "red"},
         combine_adjacent=True,
     )
@@ -200,7 +330,8 @@ _SHROOM '25: Detection of Hallucinated Content_
             json_example,
             original_text,
             highlighted_text,
-            highlighted_text_predicted,
         ],
     )
@@ -213,15 +344,40 @@ _SHROOM '25: Detection of Hallucinated Content_
             type="text",
         )
-        manual_input_highlighted_text = gr.HighlightedText(
-            label="Predicted Hallucinations",
             color_map={"+": "red", "-": "blue", "hal": "red"},
             combine_adjacent=True,
         )
         model_manual_input.change(
-            predict_hallucinations,
-            inputs=[model_manual_input],
-            outputs=[manual_input_highlighted_text],
         )
 demo.launch(show_error=True)

     ]
+# Token-classification model used on the answer text alone.
+roberta_base_predictor = transformers.AutoModelForTokenClassification.from_pretrained(
     "shroom-semeval25/cogumelo-hallucinations-detector-roberta-base"
 )
+# Tokenizer loaded from the same checkpoint as the base predictor. The visible
+# code also uses it to encode the (question, answer) pairs fed to the large QA
+# model below.
+roberta_base_tokenizer = transformers.AutoTokenizer.from_pretrained(
     "shroom-semeval25/cogumelo-hallucinations-detector-roberta-base"
 )
+# Token-classification model that receives the question and the answer as a pair.
+# NOTE(review): no dedicated tokenizer is loaded for this checkpoint here --
+# confirm that it shares its vocabulary with roberta_base_tokenizer.
+roberta_large_qa_predictor = (
+    transformers.AutoModelForTokenClassification.from_pretrained(
+        "shroom-semeval25/cogumelo-hallucinations-detector-roberta-large-qa-15000"
     )
+)
+def mark_hallucinations(logits, hallucinated_text, offsets):
     # Get the highest value for each token
+    predictions = logits.argmax(dim=-1).squeeze(0).tolist()
     entities = []
     current_entity = None
     for i, prediction in enumerate(predictions):
                 entities.append(current_entity)
             current_entity = {
                 "entity": "hal",
+                "start": offsets[i][0],
+                "end": offsets[i][1] + 1,
             }
         if prediction == 2:
             if current_entity is None:
                 current_entity = {
                     "entity": "hal",
+                    "start": offsets[i][0],
+                    "end": offsets[i][1] + 1,
                 }
             else:
+                current_entity["end"] = offsets[i][1] + 1
     if current_entity is not None:
         entities.append(current_entity)
     return {
     # Run the two functions
     json_example, original_text, highlighted_text = show_hallucinations(element)
     try:
+        hallucinated_tokens = roberta_base_tokenizer(
+            text=element["hallucinated_answer_generated"],
+            return_offsets_mapping=True,
+            add_special_tokens=True,
+            return_tensors="pt",
+            return_special_tokens_mask=True,
+        )
+        q_a_tokens = roberta_base_tokenizer(
+            # We have to batch into a single-example batch, because otherwise the tokenizer will interpret that the second element of the pair is example #2 of the batch (while actually it is the second part of the pair of example #1)
+            text=[(element["question"], element["hallucinated_answer_generated"])],
+            return_offsets_mapping=True,
+            add_special_tokens=True,
+            return_tensors="pt",
+            return_special_tokens_mask=True,
+        )
+        with torch.no_grad():
+            outputs_roberta_base = roberta_base_predictor(
+                input_ids=hallucinated_tokens.input_ids,
+                attention_mask=hallucinated_tokens.attention_mask,
+            )
+            # Take only the outputs that are NOT special tokens and where the attention mask is 1
+            logits_roberta_base = outputs_roberta_base.logits[
+                ...,
+                (hallucinated_tokens.special_tokens_mask == 0)
+                & (hallucinated_tokens.attention_mask == 1),
+                :,
+            ]
+            outputs_roberta_large_qa = roberta_large_qa_predictor(
+                input_ids=q_a_tokens.input_ids,
+                attention_mask=q_a_tokens.attention_mask,
+            )
+            # Take only the outputs after the first special token and where the attention mask is 1 and the special tokens mask is 0
+            logits_roberta_large_qa = outputs_roberta_large_qa.logits[
+                ...,
+                (q_a_tokens.special_tokens_mask.cumsum(dim=-1) > 1)
+                & (q_a_tokens.attention_mask == 1)
+                & (q_a_tokens.special_tokens_mask == 0),
+                :,
+            ]
+        highlighted_text_predicted_roberta_base = mark_hallucinations(
+            hallucinated_text=element["hallucinated_answer_generated"],
+            logits=logits_roberta_base,
+            # Discard the first token, which is the BOS token
+            offsets=hallucinated_tokens["offset_mapping"][0][1:],
+        )
+        # How much should we remove from the offset_mapping?
+        # The length of the tokens before the first special token
+        number_of_offsets_to_remove = (
+            q_a_tokens.special_tokens_mask.cumsum(dim=-1) <= 1
+        ).sum()
+        highlighted_text_predicted_roberta_large_qa = mark_hallucinations(
+            hallucinated_text=element["hallucinated_answer_generated"],
+            logits=logits_roberta_large_qa,
+            # Discard the first two tokens, which are the separators between the question and the answer
+            offsets=q_a_tokens["offset_mapping"][0][number_of_offsets_to_remove + 2 :],
         )
     except Exception as e:
         logging.exception(f"An error occurred: {e}")
         gr.Error(f"An error occurred: {e}")
+        highlighted_text_predicted_roberta_base = {"text": "", "entities": []}
+        highlighted_text_predicted_roberta_large_qa = {"text": "", "entities": []}
+    return (
+        json_example,
+        original_text,
+        highlighted_text,
+        highlighted_text_predicted_roberta_base,
+        highlighted_text_predicted_roberta_large_qa,
+    )
+def predict_hallucinations_manual_input_roberta_base(text: str):
+    """Highlight predicted hallucinations in free-form text with the base model.
+
+    The text is tokenized on its own, passed through ``roberta_base_predictor``
+    and the logits of the non-special tokens are handed to
+    ``mark_hallucinations`` together with their character offsets.
+
+    Args:
+        text: The answer to analyse.
+
+    Returns:
+        The value produced by ``mark_hallucinations`` for ``text``.
+    """
+    encoding = roberta_base_tokenizer(
+        text=text,
+        return_offsets_mapping=True,
+        add_special_tokens=True,
+        return_tensors="pt",
+        return_special_tokens_mask=True,
+    )
+    # Positions holding real text: not a special token and attended to.
+    is_content_token = (encoding.special_tokens_mask == 0) & (
+        encoding.attention_mask == 1
+    )
+    with torch.no_grad():
+        model_output = roberta_base_predictor(
+            input_ids=encoding.input_ids,
+            attention_mask=encoding.attention_mask,
+        )
+        content_logits = model_output.logits[..., is_content_token, :]
+    # Drop the first offset so the offsets line up with the masked logits
+    # (the first token is the BOS token).
+    content_offsets = encoding["offset_mapping"][0][1:]
+    return mark_hallucinations(
+        hallucinated_text=text,
+        logits=content_logits,
+        offsets=content_offsets,
+    )
+def predict_hallucinations_manual_input_roberta_qa_large(text: str, question: str = ""):
+    """Highlight predicted hallucinations in ``text`` given the ``question`` it answers.
+
+    The question and the answer are encoded as one pair, passed through
+    ``roberta_large_qa_predictor``, and only the logits of the answer tokens
+    are handed to ``mark_hallucinations``.
+
+    Args:
+        text: The answer to analyse.
+        question: The question the answer responds to.
+
+    Returns:
+        The value produced by ``mark_hallucinations`` for ``text``, or an empty
+        highlight (``{"text": "", "entities": []}``) when either input is empty.
+    """
+    # This function is also wired directly to the question textbox, so it must
+    # apply the same rule as predict_hallucinations_manual_input: without both
+    # a question and an answer the QA model is not used.
+    if not text or not question:
+        return {"text": "", "entities": []}
+    q_a_tokens = roberta_base_tokenizer(
+        # A single-example batch: a bare pair would be read as two separate
+        # examples instead of the two halves of one example.
+        text=[(question, text)],
+        return_offsets_mapping=True,
+        add_special_tokens=True,
+        return_tensors="pt",
+        return_special_tokens_mask=True,
+    )
+    # Running count of special tokens seen so far; it is at most 1 up to the
+    # end of the question and greater than 1 from the first separator onwards.
+    special_tokens_seen = q_a_tokens.special_tokens_mask.cumsum(dim=-1)
+    is_answer_token = (
+        (special_tokens_seen > 1)
+        & (q_a_tokens.attention_mask == 1)
+        & (q_a_tokens.special_tokens_mask == 0)
+    )
+    # Number of positions before the first separator, as a plain int so it can
+    # be used in a slice below.
+    number_of_offsets_to_remove = int((special_tokens_seen <= 1).sum())
+    with torch.no_grad():
+        outputs_roberta_large_qa = roberta_large_qa_predictor(
+            input_ids=q_a_tokens.input_ids,
+            attention_mask=q_a_tokens.attention_mask,
+        )
+        logits_roberta_large_qa = outputs_roberta_large_qa.logits[
+            ..., is_answer_token, :
+        ]
+    return mark_hallucinations(
+        hallucinated_text=text,
+        logits=logits_roberta_large_qa,
+        # Skip the question part plus the two separator tokens between the
+        # question and the answer.
+        offsets=q_a_tokens["offset_mapping"][0][number_of_offsets_to_remove + 2 :],
+    )
+def predict_hallucinations_manual_input(text: str, question: str = ""):
+    """Run both detectors on manually entered text.
+
+    Args:
+        text: The answer to analyse.
+        question: The question the answer responds to; only the large QA
+            model uses it.
+
+    Returns:
+        A ``(roberta_base_result, roberta_large_qa_result)`` tuple. Both are
+        empty highlights when ``text`` is empty; the second one is an empty
+        highlight when ``question`` is empty.
+    """
+    no_highlight = {"text": "", "entities": []}
+    if text:
+        # The base model only needs the answer text.
+        base_result = predict_hallucinations_manual_input_roberta_base(text)
+        if question:
+            # The QA model needs the question as well.
+            qa_result = predict_hallucinations_manual_input_roberta_qa_large(
+                text, question
+            )
+        else:
+            qa_result = no_highlight
+        return base_result, qa_result
+    # Nothing to analyse.
+    return no_highlight, no_highlight
 with gr.Blocks(title="Hallucinations Explorer") as demo:
         color_map={"+": "red", "-": "blue", "hal": "red"},
         combine_adjacent=True,
     )
+    highlighted_text_predicted_roberta_base = gr.HighlightedText(
+        label="Predicted Hallucinations (RoBERTa Base)",
+        color_map={"+": "red", "-": "blue", "hal": "red"},
+        combine_adjacent=True,
+    )
+    highlighted_text_predicted_roberta_large_qa = gr.HighlightedText(
+        label="Predicted Hallucinations (RoBERTa Large QA)",
         color_map={"+": "red", "-": "blue", "hal": "red"},
         combine_adjacent=True,
     )
             json_example,
             original_text,
             highlighted_text,
+            highlighted_text_predicted_roberta_base,
+            highlighted_text_predicted_roberta_large_qa,
         ],
     )
             type="text",
         )
+        model_question_input = gr.Textbox(
+            value="",
+            label="Question (only for RoBERTa Large QA)",
+            placeholder="Type the question here",
+            type="text",
+        )
+        manual_input_highlighted_text_roberta_base = gr.HighlightedText(
+            label="Predicted Hallucinations (RoBERTa Base)",
+            color_map={"+": "red", "-": "blue", "hal": "red"},
+            combine_adjacent=True,
+        )
+        manual_input_highlighted_text_roberta_large_qa = gr.HighlightedText(
+            label="Predicted Hallucinations (RoBERTa Large QA)",
             color_map={"+": "red", "-": "blue", "hal": "red"},
             combine_adjacent=True,
         )
         model_manual_input.change(
+            predict_hallucinations_manual_input,
+            inputs=[model_manual_input, model_question_input],
+            outputs=[
+                manual_input_highlighted_text_roberta_base,
+                manual_input_highlighted_text_roberta_large_qa,
+            ],
+        )
+        model_question_input.change(
+            predict_hallucinations_manual_input_roberta_qa_large,
+            inputs=[model_manual_input, model_question_input],
+            outputs=[
+                manual_input_highlighted_text_roberta_large_qa,
+            ],
         )
 demo.launch(show_error=True)