Spaces:

Zihao-Li
/

MT-HumanEval

Sleeping

App Files Files Community

Zihao-Li committed on Apr 14

Commit

029f30f

verified ·

1 Parent(s): 3daca56

Upload app.py

Browse files

Files changed (1) hide show

app.py +70 -18

app.py CHANGED Viewed

@@ -3,26 +3,24 @@ import json
 import os
 import tempfile
-# ======== 设置路径 ========
-LANG_DIR = "./human_eval"  # 含有语言对子文件夹的目录
-SAVE_DIR = "./annotations"  # 保存标注记录的目录
 os.makedirs(SAVE_DIR, exist_ok=True)
-# ======== 初始化数据结构 ========
 data = []
 user_annotations = []
-# ======== 获取可用语言对列表 ========
 language_options = sorted([f for f in os.listdir(LANG_DIR)])
-# ======== 加载选择的语言对数据 ========
 def load_data_for_lang(lang_pair):
-    global data, user_annotations
     file_path = os.path.join(LANG_DIR, lang_pair, f"{lang_pair}.json")
     with open(file_path, "r", encoding="utf-8") as f:
         data = json.load(f)
     user_annotations = []
     return (
         0,
         data[0]["source"],
@@ -31,7 +29,45 @@ def load_data_for_lang(lang_pair):
     )
-# ======== 读取当前样本 ========
 def load_sample(i):
     if not data:
         return "", ""
@@ -39,13 +75,14 @@ def load_sample(i):
     return entry["source"], entry["hypothesis"]
-# ======== 提交打分并进入下一条 ========
 def annotate(index, score, comment, annotator):
     index = int(index)
     entry = data[index]
     record = {
         "index": index,
         "annotator": annotator,
         "source": entry["source"],
         "hypothesis": entry["hypothesis"],
         "score": score,
@@ -85,19 +122,20 @@ def annotate(index, score, comment, annotator):
     )
-# ======== 导出打分结果 ========
 def export_results():
     tmp = tempfile.NamedTemporaryFile(
         delete=False, suffix=".json", mode="w", encoding="utf-8"
     )
     json.dump(user_annotations, tmp, ensure_ascii=False, indent=2)
     tmp.close()
-    return tmp.name
-# ======== UI 构建 ========
 with gr.Blocks() as demo:
-    gr.Markdown("## Direct Assessment Annotation Tool")
     with gr.Row():
         lang_choice = gr.Dropdown(
@@ -107,6 +145,12 @@ with gr.Blocks() as demo:
         )
         load_button = gr.Button("🔄 Load Data")
     with gr.Row():
         annotator = gr.Textbox(
             label="Annotator ID",
@@ -122,16 +166,18 @@ with gr.Blocks() as demo:
     comment = gr.Textbox(lines=2, placeholder="Optional comment...", label="Comment")
     output = gr.Textbox(label="Status", interactive=False)
     next_button = gr.Button("Submit and Next")
-    export_button = gr.Button("📥 Export My Results")
     export_file = gr.File(label="Download your results", visible=False)
-    # 行为绑定
     load_button.click(
         fn=load_data_for_lang,
         inputs=[lang_choice],
         outputs=[idx, source, hyp, progress],
     )
     next_button.click(
         fn=annotate,
         inputs=[idx, score, comment, annotator],
@@ -146,9 +192,15 @@ with gr.Blocks() as demo:
             export_file,
         ],
     )
-    export_button.click(fn=export_results, outputs=export_file)
     idx.change(fn=load_sample, inputs=idx, outputs=[source, hyp])
     demo.load(fn=load_sample, inputs=[idx], outputs=[source, hyp])
-# ======== 启动应用 ========
 demo.launch(server_name="0.0.0.0", server_port=int(os.environ.get("PORT", 7860)))

 import os
 import tempfile
+LANG_DIR = "./human_eval"
+SAVE_DIR = "./annotations"
 os.makedirs(SAVE_DIR, exist_ok=True)
 data = []
 user_annotations = []
+current_lang = ""
 language_options = sorted([f for f in os.listdir(LANG_DIR)])
 def load_data_for_lang(lang_pair):
+    global data, user_annotations, current_lang
     file_path = os.path.join(LANG_DIR, lang_pair, f"{lang_pair}.json")
     with open(file_path, "r", encoding="utf-8") as f:
         data = json.load(f)
     user_annotations = []
+    current_lang = lang_pair
     return (
         0,
         data[0]["source"],
     )
+def restore_previous_annotations(file_obj):
+    global data, user_annotations, current_lang
+    with open(file_obj.name, "r", encoding="utf-8") as f:
+        user_annotations = json.load(f)
+    if not user_annotations:
+        return 0, "", "", "No annotations found."
+    restored_lang = user_annotations[0].get("lang_pair", None)
+    if not restored_lang or not os.path.exists(
+        os.path.join(LANG_DIR, restored_lang, f"{restored_lang}.json")
+    ):
+        return 0, "", "", "❌ Language pair info missing or file not found."
+    file_path = os.path.join(LANG_DIR, restored_lang, f"{restored_lang}.json")
+    with open(file_path, "r", encoding="utf-8") as f:
+        data = json.load(f)
+    current_lang = restored_lang
+    # Back to last index
+    last_index = user_annotations[-1]["index"] + 1
+    if last_index >= len(data):
+        return (
+            last_index,
+            "",
+            "",
+            f"✅ Already completed {len(data)} samples of {restored_lang}.",
+        )
+    return (
+        last_index,
+        data[last_index]["source"],
+        data[last_index]["hypothesis"],
+        f"Restored {restored_lang}: {last_index}/{len(data)}",
+        restored_lang,
+    )
 def load_sample(i):
     if not data:
         return "", ""
     return entry["source"], entry["hypothesis"]
 def annotate(index, score, comment, annotator):
+    global current_lang
     index = int(index)
     entry = data[index]
     record = {
         "index": index,
         "annotator": annotator,
+        "lang_pair": current_lang,
         "source": entry["source"],
         "hypothesis": entry["hypothesis"],
         "score": score,
     )
 def export_results():
+    if not user_annotations:
+        raise ValueError("No annotations to export.")
     tmp = tempfile.NamedTemporaryFile(
         delete=False, suffix=".json", mode="w", encoding="utf-8"
     )
     json.dump(user_annotations, tmp, ensure_ascii=False, indent=2)
     tmp.close()
+    return tmp.name, gr.update(visible=True, value=tmp.name)
+# ======== UI ========
 with gr.Blocks() as demo:
+    gr.Markdown("## 📝 Direct Assessment Annotation Tool")
     with gr.Row():
         lang_choice = gr.Dropdown(
         )
         load_button = gr.Button("🔄 Load Data")
+    with gr.Row():
+        upload_file = gr.File(
+            label="📤 Upload Previous Annotations", file_types=[".json"]
+        )
+        export_button = gr.Button("📥 Export My Results")
     with gr.Row():
         annotator = gr.Textbox(
             label="Annotator ID",
     comment = gr.Textbox(lines=2, placeholder="Optional comment...", label="Comment")
     output = gr.Textbox(label="Status", interactive=False)
     next_button = gr.Button("Submit and Next")
     export_file = gr.File(label="Download your results", visible=False)
     load_button.click(
         fn=load_data_for_lang,
         inputs=[lang_choice],
         outputs=[idx, source, hyp, progress],
     )
+    upload_file.change(
+        fn=restore_previous_annotations,
+        inputs=[upload_file],
+        outputs=[idx, source, hyp, progress, lang_choice],
+    )
     next_button.click(
         fn=annotate,
         inputs=[idx, score, comment, annotator],
             export_file,
         ],
     )
+    export_button.click(
+        fn=export_results,
+        inputs=[],
+        outputs=[
+            export_file,
+            export_file,
+        ],  # export_file is bound twice; the second binding updates its visibility and path
+    )
     idx.change(fn=load_sample, inputs=idx, outputs=[source, hyp])
     demo.load(fn=load_sample, inputs=[idx], outputs=[source, hyp])
 demo.launch(server_name="0.0.0.0", server_port=int(os.environ.get("PORT", 7860)))