Spaces:

JulioContrerasH
/

my-challenge

Runtime error

App Files Files Community

JulioContrerasH committed on Mar 27

Commit

4f65d0c

verified ·

1 Parent(s): 2d87186

Upload: Multiple files to assets directory

Browse files

Files changed (1) hide show

app.py +122 -33

app.py CHANGED Viewed

@@ -8,16 +8,96 @@ matplotlib.use('Agg')
 import matplotlib.pyplot as plt
 import io
 import base64
-# 1) URL del archivo de referencia
 REFERENCE_FILE_URL = "https://huggingface.co/datasets/juliocontrerash/my-challenge-submissions/resolve/main/reference.csv"
-LOCAL_REF_PATH = "reference.csv"
 def download_reference():
     """
-    Descarga el CSV de referencia desde Hugging Face Datasets
-    y lo guarda como un archivo local 'reference.csv'.
-    Se ejecuta solo si el archivo no existe todavía.
     """
     if not os.path.exists(LOCAL_REF_PATH):
         print("Descargando archivo de referencia...")
@@ -27,61 +107,68 @@ def download_reference():
             f.write(r.content)
         print("Descarga completa:", LOCAL_REF_PATH)
-download_reference()  # Se ejecutará una sola vez al iniciar el Space
 def evaluate_prediction(pred_path, ref_path):
     """
-    Lee el archivo CSV subido (pred_path) y el archivo CSV de referencia (ref_path).
-    Calcula alguna métrica, por ejemplo MRE y RMSE.
-    Formato de CSV esperado:
-    - reference.csv: col [wavelength, power]
-    - predictions.csv: col [wavelength, prediction]
     """
     # Leer la referencia
     df_ref = pd.read_csv(ref_path)
-    # Leer la predicción del participante
     df_pred = pd.read_csv(pred_path)
-    # Hacer merge en base a la columna 'wavelength'
     df_merged = pd.merge(df_ref, df_pred, on='wavelength', how='inner')
-    # Extraer valores
     real = df_merged['power'].values
     pred = df_merged['prediction'].values
-    # Calcular Mean Relative Error (MRE) por cada fila
     mre = np.abs((pred - real) / real)
     mre_mean = mre.mean()
     # Calcular RMSE
     rmse = np.sqrt(np.mean((pred - real)**2))
-    # Retornar resultados
     return {
-        "mre_mean": mre_mean,
-        "rmse": rmse,
-        "mre_spectrum": mre.tolist()  # vector
     }
 def evaluate_and_save(pred_file, participant_name):
     """
-    Función que se llama al presionar el botón "Evaluar" en la interfaz.
-    1. Lee el CSV de predicciones (subido por usuario).
-    2. Llama a evaluate_prediction().
-    3. Genera una gráfica y arma un mensaje final.
-    4. Retorna el mensaje y la gráfica embebida (base64).
     """
     if not pred_file:
         return "No file uploaded", None
-    # 1. El archivo subido es un objeto tipo gradio.tempfile. Obtenemos la ruta
     pred_path = pred_file.name
-    # 2. Evaluar la predicción
     results = evaluate_prediction(pred_path, LOCAL_REF_PATH)
-    # 3. Generar la gráfica
     mre_spectrum = results["mre_spectrum"]
     plt.figure(figsize=(6,4))
     plt.plot(np.arange(len(mre_spectrum)), mre_spectrum, marker='o', label='MRE Spectrum')
@@ -89,7 +176,6 @@ def evaluate_and_save(pred_file, participant_name):
     plt.ylabel('MRE')
     plt.title('Spectral Error')
     plt.legend()
     buf = io.BytesIO()
     plt.savefig(buf, format='png')
     plt.close()
@@ -97,7 +183,7 @@ def evaluate_and_save(pred_file, participant_name):
     img_str = base64.b64encode(buf.read()).decode('utf-8')
     img_str = f"data:image/png;base64,{img_str}"
-    # 4. Construir mensaje final
     message = (
         f"Participant: {participant_name}\n"
         f"MRE mean: {results['mre_mean']:.4f}\n"
@@ -106,11 +192,14 @@ def evaluate_and_save(pred_file, participant_name):
     return message, img_str
-# === Construcción de la interfaz con Gradio ===
 with gr.Blocks() as demo:
     gr.Markdown("# My Challenge\nSube tu archivo de predicciones en CSV para evaluar tu modelo.")
     participant_name = gr.Textbox(label="Nombre del participante")
-    pred_file = gr.File(label="Subir archivo CSV (ej. predictions.csv)")
     output_message = gr.Textbox(label="Resultados")
     output_image = gr.HTML(label="Gráfica")

 import matplotlib.pyplot as plt
 import io
 import base64
+import json
+import time
+from huggingface_hub import Repository
+# -----------------------------------------------------------------------------
+# SPACE REPO AND REFERENCE FILE CONFIGURATION
+# -----------------------------------------------------------------------------
+SPACE_REPO_URL = "https://huggingface.co/spaces/juliocontrerash/my-challenge"
+SPACE_LOCAL_DIR = "."  # Use the current folder (the Space's own repo checkout)
+# URL of the reference CSV file hosted in a dataset repo (e.g. "reference.csv")
 REFERENCE_FILE_URL = "https://huggingface.co/datasets/juliocontrerash/my-challenge-submissions/resolve/main/reference.csv"
+LOCAL_REF_PATH = "reference.csv"  # Local filename the reference is stored under
def setup_local_repo_for_push():
    """Create a ``Repository`` handle on the Space's own repo for later pushes.

    Reads a token from the ``HF_SPACE_TOKEN`` environment variable (expected
    to be a write-enabled token stored as a secret of the Space), builds a
    ``Repository`` for ``SPACE_LOCAL_DIR`` cloned from ``SPACE_REPO_URL`` and
    attempts one ``git pull`` to pick up changes made on the remote.

    Returns:
        The ``Repository`` handle, or ``None`` when ``HF_SPACE_TOKEN`` is
        missing or empty (pushing is then unavailable).

    Note:
        Errors raised while constructing the ``Repository`` are not handled
        here and propagate to the caller.
    """
    # The secret must be registered under exactly this name.
    token = os.environ.get("HF_SPACE_TOKEN")
    if not token:
        print("WARNING: HF_SPACE_TOKEN no está configurado. No se podrá hacer push.")
        return None

    repo = Repository(
        local_dir=SPACE_LOCAL_DIR,
        clone_from=SPACE_REPO_URL,
        use_auth_token=token,
    )

    # The initial pull is best-effort: a failure must not prevent start-up,
    # but it is reported instead of being silently discarded. Catching
    # Exception (not a bare except) lets KeyboardInterrupt/SystemExit through.
    try:
        repo.git_pull()
    except Exception as exc:
        print("WARNING: initial git pull failed:", exc)
    return repo
+# Initialize the Space repo handle used for pushing (None when no token is set)
+space_repo = setup_local_repo_for_push()
def add_submission_entry(entry):
    """Append ``entry`` to ``submissions.jsonl`` and push it to the Space repo.

    The file lives in the current working directory and holds one JSON
    document per line. The new entry is appended in place, so existing lines
    are never re-parsed or rewritten; a malformed historical line therefore
    cannot block new submissions.

    All git steps (pull, add, commit, push) are best-effort: a failure is
    printed and the function returns normally, so the caller's evaluation
    flow is not interrupted by a persistence problem.

    Args:
        entry: JSON-serializable object describing the submission.

    Returns:
        None. Does nothing (beyond printing a notice) when the module-level
        ``space_repo`` handle is ``None``.
    """
    if space_repo is None:
        print("No repo handle (space_repo is None). Skipping save.")
        return

    submissions_file = "submissions.jsonl"

    # 1) Bring in the latest remote state so the append lands on top of it.
    try:
        space_repo.git_pull()
    except Exception as exc:
        print("Error pulling latest Space repo state:", exc)

    # 2) Append the new entry. If the existing file does not end with a
    #    newline, add one first so the new record starts on its own line.
    needs_newline = False
    if os.path.exists(submissions_file) and os.path.getsize(submissions_file) > 0:
        with open(submissions_file, "rb") as existing:
            existing.seek(-1, os.SEEK_END)
            needs_newline = existing.read(1) != b"\n"
    with open(submissions_file, "a", encoding="utf-8") as out:
        if needs_newline:
            out.write("\n")
        out.write(json.dumps(entry) + "\n")

    # 3) Commit and push the updated file.
    try:
        space_repo.git_add(submissions_file)
        space_repo.git_commit("Add new submission entry")
        space_repo.git_push()
        print("Submission pushed successfully to the Space repo.")
    except Exception as e:
        print("Error pushing submission:", e)
+# -----------------------------------------------------------------------------
+# DESCARGA DEL ARCHIVO DE REFERENCIA
+# -----------------------------------------------------------------------------
 def download_reference():
     """
+    Descarga el CSV de referencia desde el dataset en Hugging Face,
+    guardándolo como 'reference.csv' si no existe aún.
     """
     if not os.path.exists(LOCAL_REF_PATH):
         print("Descargando archivo de referencia...")
             f.write(r.content)
         print("Descarga completa:", LOCAL_REF_PATH)
+download_reference()  # Se ejecuta al iniciar el Space
+# -----------------------------------------------------------------------------
+# LÓGICA DE EVALUACIÓN
+# -----------------------------------------------------------------------------
 def evaluate_prediction(pred_path, ref_path):
     """
+    Lee el CSV subido (pred_path) y el CSV de referencia (ref_path),
+    Calcula el MRE y RMSE, y retorna un dict con resultados.
+    Formato esperado:
+    - reference.csv: [wavelength, power]
+    - predictions.csv: [wavelength, prediction]
     """
     # Leer la referencia
     df_ref = pd.read_csv(ref_path)
+    # Leer la predicción
     df_pred = pd.read_csv(pred_path)
+    # Merge en base a 'wavelength'
     df_merged = pd.merge(df_ref, df_pred, on='wavelength', how='inner')
     real = df_merged['power'].values
     pred = df_merged['prediction'].values
+    # Calcular MRE
     mre = np.abs((pred - real) / real)
     mre_mean = mre.mean()
     # Calcular RMSE
     rmse = np.sqrt(np.mean((pred - real)**2))
+    # Retornar
     return {
+        "mre_mean": float(mre_mean),
+        "rmse": float(rmse),
+        "mre_spectrum": mre.tolist()
     }
 def evaluate_and_save(pred_file, participant_name):
     """
+    1. Toma el archivo subido (pred_file).
+    2. Evalúa comparándolo con la referencia (LOCAL_REF_PATH).
+    3. Agrega la entrada a submissions.jsonl.
+    4. Genera una gráfica y mensaje de resultados.
     """
     if not pred_file:
         return "No file uploaded", None
     pred_path = pred_file.name
     results = evaluate_prediction(pred_path, LOCAL_REF_PATH)
+    # Guardar submission en submissions.jsonl
+    submission_entry = {
+        "submission_id": int(time.time()),
+        "participant": participant_name,
+        "mre_mean": results["mre_mean"],
+        "rmse": results["rmse"],
+        "timestamp": time.strftime("%Y-%m-%d %H:%M:%S")
+    }
+    add_submission_entry(submission_entry)
+    # Graficar
     mre_spectrum = results["mre_spectrum"]
     plt.figure(figsize=(6,4))
     plt.plot(np.arange(len(mre_spectrum)), mre_spectrum, marker='o', label='MRE Spectrum')
     plt.ylabel('MRE')
     plt.title('Spectral Error')
     plt.legend()
     buf = io.BytesIO()
     plt.savefig(buf, format='png')
     plt.close()
     img_str = base64.b64encode(buf.read()).decode('utf-8')
     img_str = f"data:image/png;base64,{img_str}"
+    # Mensaje final
     message = (
         f"Participant: {participant_name}\n"
         f"MRE mean: {results['mre_mean']:.4f}\n"
     return message, img_str
+# -----------------------------------------------------------------------------
+# INTERFAZ GRADIO
+# -----------------------------------------------------------------------------
 with gr.Blocks() as demo:
     gr.Markdown("# My Challenge\nSube tu archivo de predicciones en CSV para evaluar tu modelo.")
     participant_name = gr.Textbox(label="Nombre del participante")
+    pred_file = gr.File(label="Subir archivo CSV (predictions.csv)")
     output_message = gr.Textbox(label="Resultados")
     output_image = gr.HTML(label="Gráfica")