AttnTrace is an efficient context traceback method for long contexts (e.g., full papers). It is over 15× faster than the state-of-the-art context traceback method TracLLM. Compared to previous attention-based approaches, AttnTrace is more accurate, reliable, and memory-efficient. """, elem_classes="feature-highlights") # Feature highlights gr.Markdown("""

AttnTrace can be used in many real-world applications, such as tracing back to: - 📄 prompt injection instructions that manipulate LLM-generated paper reviews. - 💻 malicious comment & code hiding in the codebase that misleads the AI coding assistant. - 🤖 malicious instructions that mislead the action of the LLM agent. - 🖋 source texts in the context from an AI summary. - 🔍 evidence that supports the LLM-generated answer for a question. - ❌ misinformation (corrupted knowledge) that manipulates LLM output for a question. - And a lot more...

""", elem_classes="feature-highlights") # Example buttons with topic-relevant images - moved here for better positioning gr.Markdown("### 🚀 Try These Examples!", elem_classes="example-title") with gr.Row(elem_classes=["example-button-container"]): with gr.Column(scale=1): example_1_btn = gr.Button( "📄 Prompt Injection Attacks in AI Paper Review", elem_classes=["example-button", "example-paper"], elem_id="example_1_button", scale=None, size="sm" ) with gr.Column(scale=1): example_2_btn = gr.Button( "💻 Malicious Comments & Code in Codebase", elem_classes=["example-button", "example-movie"], elem_id="example_2_button" ) with gr.Column(scale=1): example_3_btn = gr.Button( "🤖 Malicious Instructions Misleading the LLM Agent", elem_classes=["example-button", "example-code"], elem_id="example_3_button" ) with gr.Row(elem_classes=["example-button-container"]): with gr.Column(scale=1): example_4_btn = gr.Button( "🖋 Source Texts for an AI Summary", elem_classes=["example-button", "example-paper-alt"], elem_id="example_4_button" ) with gr.Column(scale=1): example_5_btn = gr.Button( "🔍 Evidence that Support Question Answering", elem_classes=["example-button", "example-movie-alt"], elem_id="example_5_button" ) with gr.Column(scale=1): example_6_btn = gr.Button( "❌ Misinformation (Corrupted Knowledge) in Question Answering", elem_classes=["example-button", "example-code-alt"], elem_id="example_6_button" ) state = gr.State( value=clear_state() ) basic_tab = gr.Tab("Demo") with basic_tab: # gr.Markdown("## Demo") gr.Markdown( "Enter your context and instruction below to try out AttnTrace! You can also click on the example buttons above to load pre-configured examples." ) gr.Markdown( '**Color Legend for Context Traceback (by ranking):** Red = 1st (most important) | Orange = 2nd | Golden = 3rd | Yellow = 4th-5th | Light = 6th+' ) # Top section: Wide Context box with tabs with gr.Row(): with gr.Column(scale=1): with gr.Tabs() as basic_context_tabs: with gr.TabItem("Context", id=0): basic_context_box = gr.Textbox( placeholder="Enter context...", show_label=False, value="", lines=6, max_lines=6, elem_id="basic_context_box", autoscroll=False, ) with gr.TabItem("Context with highlighted traceback results", id=1, visible=True) as basic_sources_in_context_tab: basic_sources_in_context_box = HighlightedTextbox( value=[("Click on a sentence in the response below to see highlighted traceback results here.", None)], show_legend_label=False, show_label=False, show_legend=False, interactive=False, elem_id="basic_sources_in_context_box", ) # Error messages basic_generate_error_box = HighlightedTextbox( show_legend_label=False, show_label=False, show_legend=False, visible=False, interactive=False, container=False, ) # Bottom section: Left (instruction + button + response), Right (response selection) with gr.Row(equal_height=True): # Left: Instruction + Button + Response with gr.Column(scale=1): basic_query_box = gr.Textbox( label="Instruction", placeholder="Enter an instruction...", value="", lines=3, max_lines=3, ) unified_response_button = gr.Button( "Generate/Use Response", variant="primary", size="lg" ) response_input_box = gr.Textbox( label="Response (Editable)", placeholder="Response will appear here after generation, or type your own response for traceback...", lines=8, max_lines=8, info="Leave empty and click button to generate from LLM, or type your own response to use for traceback" ) # Right: Response for attribution selection with gr.Column(scale=1): basic_response_box = gr.HighlightedText( label="Click to select text for traceback!", value=[("Click the 'Generate/Use Response' button on the left to see response text here for traceback analysis.", None)], interactive=False, combine_adjacent=False, show_label=True, show_legend=False, elem_id="basic_response_box", visible=True, ) # Button for full response traceback full_response_traceback_button = gr.Button( "🔍 Traceback Entire Response", variant="secondary", size="sm" ) # Hidden error box and dummy elements basic_attribute_error_box = HighlightedTextbox( show_legend_label=False, show_label=False, show_legend=False, visible=False, interactive=False, container=False, ) dummy_basic_sources_box = gr.Textbox( visible=False, interactive=False, container=False ) # Only a single (AttnTrace) method and model in this simplified version def basic_clear_state(): state = clear_state() return ( "", # basic_context_box "", # basic_query_box "", # response_input_box gr.update(value=[("Click the 'Generate/Use Response' button above to see response text here for traceback analysis.", None)]), # basic_response_box - keep visible gr.update(selected=0), # basic_context_tabs - switch to first tab state, ) # Defining behavior of various interactions for the basic tab basic_tab.select( fn=basic_clear_state, inputs=[], outputs=[ basic_context_box, basic_query_box, response_input_box, basic_response_box, basic_context_tabs, state, ], ) for component in [basic_context_box, basic_query_box]: component.change( basic_update, [basic_context_box, basic_query_box, state], [ basic_response_box, basic_context_tabs, state, ], ) # Example button event handlers - now update both UI and state outputs_for_examples = [ basic_context_box, basic_query_box, state, response_input_box, basic_response_box, basic_context_tabs, ] example_1_btn.click( fn=partial(load_an_example, run_example_1), inputs=[state], outputs=outputs_for_examples ) example_2_btn.click( fn=partial(load_an_example, run_example_2), inputs=[state], outputs=outputs_for_examples ) example_3_btn.click( fn=partial(load_an_example, run_example_3), inputs=[state], outputs=outputs_for_examples ) example_4_btn.click( fn=partial(load_an_example, run_example_4), inputs=[state], outputs=outputs_for_examples ) example_5_btn.click( fn=partial(load_an_example, run_example_5), inputs=[state], outputs=outputs_for_examples ) example_6_btn.click( fn=partial(load_an_example, run_example_6), inputs=[state], outputs=outputs_for_examples ) unified_response_button.click( fn=lambda: None, inputs=[], outputs=[], js=get_scroll_js_code("basic_response_box"), ) basic_response_box.change( fn=lambda: None, inputs=[], outputs=[], js=get_scroll_js_code("basic_sources_in_context_box"), ) # Add immediate tab switch on response selection def immediate_tab_switch(): return ( gr.update(value=[("🔄 Processing traceback... Please wait...", None)]), # Show progress message gr.update(selected=1), # Switch to annotation tab immediately ) basic_response_box.select( fn=immediate_tab_switch, inputs=[], outputs=[basic_sources_in_context_box, basic_context_tabs], queue=False, # Execute immediately without queue ) basic_response_box.select( fn=basic_get_scores_and_sources, inputs=[basic_response_box, state], outputs=[ basic_sources_in_context_box, basic_context_tabs, basic_sources_in_context_tab, dummy_basic_sources_box, basic_attribute_error_box, state, ], show_progress="full", ) basic_response_box.select( fn=basic_update_highlighted_response, inputs=[state], outputs=[basic_response_box, state], ) # Full response traceback button full_response_traceback_button.click( fn=immediate_tab_switch, inputs=[], outputs=[basic_sources_in_context_box, basic_context_tabs], queue=False, # Execute immediately without queue ) full_response_traceback_button.click( fn=basic_get_scores_and_sources_full_response, inputs=[state], outputs=[ basic_sources_in_context_box, basic_context_tabs, basic_sources_in_context_tab, dummy_basic_sources_box, basic_attribute_error_box, state, ], show_progress="full", ) dummy_basic_sources_box.change( fn=lambda: None, inputs=[], outputs=[], js=get_scroll_js_code("basic_sources_in_context_box"), ) # Unified response handler unified_response_button.click( fn=unified_response_handler, inputs=[response_input_box, state], outputs=[state, response_input_box, basic_response_box, basic_generate_error_box] ) # gr.Markdown( # "Please do not interact with elements while generation/attribution is in progress. This may cause errors. You can refresh the page if you run into issues because of this." # ) demo.launch(show_api=False, share=True)