TransDis-CreativityAutoAssessment

Sleeping

App Files Community

Qifan Zhang committed on Apr 1, 2023

Commit

3f6f474

1 Parent(s): b8d9710

update optional models, add text input

Browse files

Files changed (2) hide show

app.py +34 -14
utils/models.py +3 -1

app.py CHANGED Viewed

@@ -1,3 +1,4 @@
 from typing import Optional
 import gradio as gr
@@ -7,8 +8,6 @@ from utils.similarity import batch_cos_sim
 def read_data(filepath: str) -> Optional[pd.DataFrame]:
-    if not filepath:
-        return None
     if filepath.endswith('.xlsx'):
         df = pd.read_csv(filepath)
     elif filepath.endswith('.csv'):
@@ -19,35 +18,56 @@ def read_data(filepath: str) -> Optional[pd.DataFrame]:
 def process(model_name: str,
-            prompt: str,
             file=None,
             ):
-    df = read_data(file.name)
     df = batch_cos_sim(df, model_name)
     path = 'output.csv'
     df.to_csv(path, index=False, encoding='utf-8-sig')
-    return df.to_markdown(), path
 model_name_input = gr.components.Textbox(
     value='paraphrase-multilingual-MiniLM-L12-v2',
     lines=1,
-    type="text"
 )
-prompt_input = gr.components.Textbox(
-    value='prompt,response',
     lines=10,
-    type="text"
 )
-file_output = gr.components.File(label="Output File",
-                                 file_count="single",
-                                 file_types=["", ".", ".csv", ".xls", ".xlsx"])
 app = gr.Interface(
     fn=process,
-    inputs=[model_name_input, prompt_input, "file" ],
-    outputs=["text", file_output]
 )
 app.launch()

+from io import StringIO
 from typing import Optional
 import gradio as gr
 def read_data(filepath: str) -> Optional[pd.DataFrame]:
     if filepath.endswith('.xlsx'):
         df = pd.read_csv(filepath)
     elif filepath.endswith('.csv'):
 def process(model_name: str,
+            text: str,
             file=None,
             ):
+    if file:
+        df = read_data(file.name)
+    elif text:
+        string_io = StringIO(text)
+        df = pd.read_csv(string_io)
+    else:
+        raise Exception('No input provided')
     df = batch_cos_sim(df, model_name)
     path = 'output.csv'
     df.to_csv(path, index=False, encoding='utf-8-sig')
+    return str(df), path
 model_name_input = gr.components.Textbox(
     value='paraphrase-multilingual-MiniLM-L12-v2',
     lines=1,
+    type='text'
+)
+model_name_option = gr.components.Dropdown(
+    label='Model Name',
+    value='paraphrase-multilingual-MiniLM-L12-v2',
+    choices=[
+        'paraphrase-multilingual-MiniLM-L12-v2',
+        'paraphrase-multilingual-mpnet-base-v2',
+        'cyclone/simcse-chinese-roberta-wwm-ext'
+    ]
 )
+text_input = gr.components.Textbox(
+    value='prompt,response\n',
     lines=10,
+    type='text'
+)
+text_output = gr.components.Textbox(
+    label='Output',
+    type='text'
 )
+file_output = gr.components.File(label='Output File',
+                                 file_count='single',
+                                 file_types=['', '.', '.csv', '.xls', '.xlsx'])
 app = gr.Interface(
     fn=process,
+    inputs=[model_name_option, text_input, 'file'],
+    outputs=[text_output, file_output]
 )
 app.launch()

utils/models.py CHANGED Viewed

@@ -1,13 +1,15 @@
 from functools import lru_cache
 import torch
 from sentence_transformers import SentenceTransformer
-import numpy as np
 DEVICE = 'cuda' if torch.cuda.is_available() else 'cpu'
 class SBert:
     def __init__(self, path):
         self.model = SentenceTransformer(path, device=DEVICE)
     @lru_cache(maxsize=10000)

 from functools import lru_cache
+import numpy as np
 import torch
 from sentence_transformers import SentenceTransformer
 DEVICE = 'cuda' if torch.cuda.is_available() else 'cpu'
 class SBert:
     def __init__(self, path):
+        print(f'Loading model from {path} ...')
         self.model = SentenceTransformer(path, device=DEVICE)
     @lru_cache(maxsize=10000)