Spaces:

rshakked
/

safe-talk

Running

rshakked committed on May 12

Commit

7a679b4

1 Parent(s): 58be06f

Update training code

Files changed (2) hide show

app.py CHANGED Viewed

@@ -4,7 +4,7 @@ import subprocess
 def run_training():
     try:
         # Run train.py using subprocess and capture output
-        result = subprocess.run(["python", "train.py"], capture_output=True, text=True)
         # Return stdout if success, otherwise stderr
         return result.stdout if result.returncode == 0 else f"Error:\n{result.stderr}"
     except Exception as e:

 def run_training():
     try:
         # Run train.py using subprocess and capture output
+        result = subprocess.run(["python", "train_abuse_model.py"], capture_output=True, text=True)
         # Return stdout if success, otherwise stderr
         return result.stdout if result.returncode == 0 else f"Error:\n{result.stderr}"
     except Exception as e:

train_abuse_model.py CHANGED Viewed

@@ -11,6 +11,9 @@ from sklearn.metrics import classification_report, precision_recall_fscore_suppo
 from torch.utils.data import Dataset
 # Hugging Face transformers
 from transformers import (
     AutoTokenizer,
@@ -22,6 +25,7 @@ from transformers import (
     TrainingArguments
 )
 # Check for GPU availability
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
@@ -125,8 +129,14 @@ def evaluate_model_with_thresholds(trainer, test_dataset):
         "pred_labels": final_pred_str
     }
-# Load dataset
-df = pd.read_excel("Abusive Relationship Stories - Technion & MSF.xlsx")
 # Define text and label columns
 text_column = "post_body"

 from torch.utils.data import Dataset
+# Hugging Face Hub
+from huggingface_hub import hf_hub_download
 # Hugging Face transformers
 from transformers import (
     AutoTokenizer,
     TrainingArguments
 )
 # Check for GPU availability
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         "pred_labels": final_pred_str
     }
+# Load dataset from Hugging Face Hub
+path = hf_hub_download(
+    repo_id="rshakked/abusive-relashionship-stories",
+    filename="Abusive Relationship Stories - Technion & MSF.xlsx",
+    repo_type="dataset"
+)
+df = pd.read_excel(path)
 # Define text and label columns
 text_column = "post_body"