File size: 3,667 Bytes
2c3850c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
680c70a
2c3850c
 
 
c0569fe
2c3850c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
a094a33
 
2c3850c
 
b5230a5
2c3850c
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
from typing import Dict, Union
from gliner import GLiNER
import gradio as gr

model = GLiNER.from_pretrained("knowledgator/gliner-multitask-large-v0.5").to('cpu')

text1 = """
"I recently purchased the Sony WH-1000XM4 Wireless Noise-Canceling Headphones from Amazon and I must say, I'm thoroughly impressed. The package arrived in New York within 2 days, thanks to Amazon Prime's expedited shipping.

The headphones themselves are remarkable. The noise-canceling feature works like a charm in the bustling city environment, and the 30-hour battery life means I don't have to charge them every day. Connecting them to my Samsung Galaxy S21 was a breeze, and the sound quality is second to none.

I also appreciated the customer service from Amazon when I had a question about the warranty. They responded within an hour and provided all the information I needed.

However, the headphones did not come with a hard case, which was listed in the product description. I contacted Amazon, and they offered a 10% discount on my next purchase as an apology.

Overall, I'd give these headphones a 4.5/5 rating and highly recommend them to anyone looking for top-notch quality in both product and service."""



open_ie_examples = [
    [
        f"Extract all brands, please",
        text1,
        0.5,
        False
    ]]

def merge_entities(entities):
    if not entities:
        return []
    merged = []
    current = entities[0]
    for next_entity in entities[1:]:
        if next_entity['entity'] == current['entity'] and (next_entity['start'] == current['end'] + 1 or next_entity['start'] == current['end']):
            current['word'] += ' ' + next_entity['word']
            current['end'] = next_entity['end']
        else:
            merged.append(current)
            current = next_entity
    merged.append(current)
    return merged

def process(
    prompt:str, text, threshold: float, nested_ner: bool, labels: str = ["match"]
) -> Dict[str, Union[str, int, float]]:
    text = prompt + "\n" + text
    r = {
        "text": text,
        "entities": [
            {
                "entity": entity["label"],
                "word": entity["text"],
                "start": entity["start"],
                "end": entity["end"],
                "score": 0,
            }
            for entity in model.predict_entities(
                text, labels, flat_ner=not nested_ner, threshold=threshold
            )
        ],
    }
    r["entities"] =  merge_entities(r["entities"])
    return r

with gr.Blocks(title="Open Information Extracting") as open_ie_interface:
    prompt = gr.Textbox(label="Prompt", placeholder="Enter your prompt here")
    input_text = gr.Textbox(label="Text input", placeholder="Enter your text here")
    threshold = gr.Slider(0, 1, value=0.3, step=0.01, label="Threshold", info="Lower the threshold to increase how many entities get predicted.")
    nested_ner = gr.Checkbox(label="Nested NER", info="Allow for nested NER?")
    output = gr.HighlightedText(label="Predicted Entities")
    submit_btn = gr.Button("Submit")
    
    theme=gr.themes.Base()

    input_text.submit(fn=process, inputs=[prompt, input_text, threshold, nested_ner], outputs=output)
    prompt.submit(fn=process, inputs=[prompt, input_text, threshold, nested_ner], outputs=output)
    threshold.release(fn=process, inputs=[prompt, input_text, threshold, nested_ner], outputs=output)
    submit_btn.click(fn=process, inputs=[prompt, input_text, threshold, nested_ner], outputs=output)
    nested_ner.change(fn=process, inputs=[prompt, input_text, threshold, nested_ner], outputs=output)


if __name__ == "__main__":
    
    open_ie_interface.launch()