kovacsvi committed
Commit fb1a253 · Parent: 0b09517

JIT tracing
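
This commit switches every interface's predict() from loading a full Hugging Face model to loading a pre-traced TorchScript module from /data/jit_models/. The tracing itself happens in utils.py's download_hf_models(); only its skip-guard appears in the diff below, so the following is a hedged sketch of what that producer step presumably looks like. The helper name trace_and_save and the example input are illustrative, not from the commit; strict=False is an assumption, inferred from the fact that the new predict() bodies index the result as a dict (output["logits"]).

# Hedged sketch of the tracing step the diffs below depend on. The real code
# lives in utils.py's download_hf_models(); only its skip-guard is shown in
# this commit, so trace_and_save and its arguments are hypothetical.
import os
import torch
from transformers import AutoModelForSequenceClassification, AutoTokenizer

JIT_DIR = "/data/jit_models"  # matches jit_model_path in the interfaces

def trace_and_save(model_id, hf_token=None):
    os.makedirs(JIT_DIR, exist_ok=True)
    traced_model_path = os.path.join(JIT_DIR, f"{model_id.replace('/', '_')}.pt")

    model = AutoModelForSequenceClassification.from_pretrained(model_id, token=hf_token)
    model.eval()
    tokenizer = AutoTokenizer.from_pretrained(model_id)
    example = tokenizer("example input", return_tensors="pt")

    # strict=False lets the traced module return a dict, which is why the
    # new predict() bodies can index output["logits"].
    traced = torch.jit.trace(
        model,
        (example["input_ids"], example["attention_mask"]),
        strict=False,
    )
    traced.save(traced_model_path)
    return traced_model_path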
interfaces/cap.py CHANGED
@@ -106,7 +106,7 @@ def predict(text, model_id, tokenizer_id):
 
     with torch.no_grad():
         output = model(inputs["input_ids"], inputs["attention_mask"])
-        print(output)
+        print(output) # debug
         logits = output["logits"]
 
     release_model(model, model_id)
interfaces/cap_media_demo.py CHANGED
@@ -35,18 +35,30 @@ def build_huggingface_path(language: str, domain: str):
 
 def predict(text, model_id, tokenizer_id):
     device = torch.device("cpu")
-    model = AutoModelForSequenceClassification.from_pretrained(model_id, device_map="auto", token=HF_TOKEN)
-    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
 
-    inputs = tokenizer(text,
-                       max_length=256,
-                       truncation=True,
-                       padding="do_not_pad",
-                       return_tensors="pt").to(device)
+    # Load JIT-traced model
+    jit_model_path = f"/data/jit_models/{model_id.replace('/', '_')}.pt"
+    model = torch.jit.load(jit_model_path).to(device)
     model.eval()
 
+    # Load tokenizer (still regular HF)
+    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
+
+    # Tokenize input
+    inputs = tokenizer(
+        text,
+        max_length=256,
+        truncation=True,
+        padding="do_not_pad",
+        return_tensors="pt"
+    )
+    inputs = {k: v.to(device) for k, v in inputs.items()}
+
     with torch.no_grad():
-        logits = model(**inputs).logits
+        output = model(inputs["input_ids"], inputs["attention_mask"])
+        print(output) # debug
+        logits = output["logits"]
+
     release_model(model, model_id)
 
     probs = torch.nn.functional.softmax(logits, dim=1).cpu().numpy().flatten()
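
The same load-and-call pattern repeats in every interface below, with two behavioral changes worth noting. A module produced by tracing exposes a fixed signature, so the call switches from model(**inputs) to explicit positional tensors (which also drops extras such as token_type_ids); and, assuming tracing used strict=False, the output is a plain dict rather than a SequenceClassifierOutput, so .logits becomes output["logits"]. A minimal runnable illustration with a toy module, not from the commit:

# Toy demonstration: tracing with strict=False preserves a dict return
# value, mirroring the dict indexing in the new predict() bodies.
import torch

class TinyClassifier(torch.nn.Module):
    def forward(self, input_ids, attention_mask):
        # stand-in for an HF sequence classifier returning {"logits": ...}
        logits = (input_ids * attention_mask).float().sum(dim=1, keepdim=True)
        return {"logits": logits}

ids = torch.tensor([[1, 2, 3]])
mask = torch.ones_like(ids)
traced = torch.jit.trace(TinyClassifier(), (ids, mask), strict=False)

output = traced(ids, mask)      # positional tensors, as in the new code
print(output["logits"])         # dict indexing replaces .logits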
interfaces/cap_minor.py CHANGED
@@ -67,18 +67,30 @@ def build_huggingface_path(language: str, domain: str):
 
 def predict(text, model_id, tokenizer_id):
     device = torch.device("cpu")
-    model = AutoModelForSequenceClassification.from_pretrained(model_id, device_map="auto", token=HF_TOKEN)
-    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
 
-    inputs = tokenizer(text,
-                       max_length=256,
-                       truncation=True,
-                       padding="do_not_pad",
-                       return_tensors="pt").to(device)
+    # Load JIT-traced model
+    jit_model_path = f"/data/jit_models/{model_id.replace('/', '_')}.pt"
+    model = torch.jit.load(jit_model_path).to(device)
     model.eval()
 
+    # Load tokenizer (still regular HF)
+    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
+
+    # Tokenize input
+    inputs = tokenizer(
+        text,
+        max_length=256,
+        truncation=True,
+        padding="do_not_pad",
+        return_tensors="pt"
+    )
+    inputs = {k: v.to(device) for k, v in inputs.items()}
+
     with torch.no_grad():
-        logits = model(**inputs).logits
+        output = model(inputs["input_ids"], inputs["attention_mask"])
+        print(output) # debug
+        logits = output["logits"]
+
     release_model(model, model_id)
 
     probs = torch.nn.functional.softmax(logits, dim=1).cpu().numpy().flatten()
interfaces/cap_minor_media.py CHANGED
@@ -150,18 +150,30 @@ def predict(text, major_model_id, minor_model_id, tokenizer_id, HF_TOKEN=None):
 
 def predict_flat(text, model_id, tokenizer_id, HF_TOKEN=None):
     device = torch.device("cpu")
-    model = AutoModelForSequenceClassification.from_pretrained(model_id, device_map="auto", token=HF_TOKEN).to(device)
-    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
 
-    inputs = tokenizer(text,
-                       max_length=256,
-                       truncation=True,
-                       padding="do_not_pad",
-                       return_tensors="pt").to(device)
+    # Load JIT-traced model
+    jit_model_path = f"/data/jit_models/{model_id.replace('/', '_')}.pt"
+    model = torch.jit.load(jit_model_path).to(device)
     model.eval()
 
+    # Load tokenizer (still regular HF)
+    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
+
+    # Tokenize input
+    inputs = tokenizer(
+        text,
+        max_length=256,
+        truncation=True,
+        padding="do_not_pad",
+        return_tensors="pt"
+    )
+    inputs = {k: v.to(device) for k, v in inputs.items()}
+
     with torch.no_grad():
-        logits = model(**inputs).logits
+        output = model(inputs["input_ids"], inputs["attention_mask"])
+        print(output) # debug
+        logits = output["logits"]
+
     release_model(model, model_id)
 
     probs = torch.nn.functional.softmax(logits, dim=1).cpu().numpy().flatten()
interfaces/emotion.py CHANGED
@@ -27,19 +27,30 @@ def build_huggingface_path(language: str):
 
 def predict(text, model_id, tokenizer_id):
     device = torch.device("cpu")
-    model = AutoModelForSequenceClassification.from_pretrained(model_id, device_map="auto", token=HF_TOKEN)
-    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
-    model.to(device)
 
-    inputs = tokenizer(text,
-                       max_length=512,
-                       truncation=True,
-                       padding="do_not_pad",
-                       return_tensors="pt").to(device)
+    # Load JIT-traced model
+    jit_model_path = f"/data/jit_models/{model_id.replace('/', '_')}.pt"
+    model = torch.jit.load(jit_model_path).to(device)
     model.eval()
 
+    # Load tokenizer (still regular HF)
+    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
+
+    # Tokenize input
+    inputs = tokenizer(
+        text,
+        max_length=256,
+        truncation=True,
+        padding="do_not_pad",
+        return_tensors="pt"
+    )
+    inputs = {k: v.to(device) for k, v in inputs.items()}
+
     with torch.no_grad():
-        logits = model(**inputs).logits
+        output = model(inputs["input_ids"], inputs["attention_mask"])
+        print(output) # debug
+        logits = output["logits"]
+
     release_model(model, model_id)
 
     probs = torch.nn.functional.softmax(logits, dim=1).cpu().numpy().flatten()
interfaces/emotion9.py CHANGED
@@ -26,18 +26,30 @@ def build_huggingface_path(language: str):
 
 def predict(text, model_id, tokenizer_id):
     device = torch.device("cpu")
-    model = AutoModelForSequenceClassification.from_pretrained(model_id, token=HF_TOKEN)
-    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
 
-    inputs = tokenizer(text,
-                       max_length=512,
-                       truncation=True,
-                       padding="do_not_pad",
-                       return_tensors="pt").to(device)
+    # Load JIT-traced model
+    jit_model_path = f"/data/jit_models/{model_id.replace('/', '_')}.pt"
+    model = torch.jit.load(jit_model_path).to(device)
     model.eval()
 
+    # Load tokenizer (still regular HF)
+    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
+
+    # Tokenize input
+    inputs = tokenizer(
+        text,
+        max_length=256,
+        truncation=True,
+        padding="do_not_pad",
+        return_tensors="pt"
+    )
+    inputs = {k: v.to(device) for k, v in inputs.items()}
+
     with torch.no_grad():
-        logits = model(**inputs).logits
+        output = model(inputs["input_ids"], inputs["attention_mask"])
+        print(output) # debug
+        logits = output["logits"]
+
     release_model(model, model_id)
 
     probs = torch.nn.functional.softmax(logits, dim=1).cpu().numpy().flatten()
interfaces/illframes.py CHANGED
@@ -58,28 +58,30 @@ def build_huggingface_path(domain: str):
 
 def predict(text, model_id, tokenizer_id, label_names):
     device = torch.device("cpu")
-    try:
-        model = AutoModelForSequenceClassification.from_pretrained(model_id, device_map="auto", token=HF_TOKEN)
-    except:
-        disk_space = get_disk_space('/data/')
-        print("Disk Space Error:")
-        for key, value in disk_space.items():
-            print(f"{key}: {value}")
 
-        shutil.rmtree("/data")
-        model = AutoModelForSequenceClassification.from_pretrained(model_id, device_map="auto", token=HF_TOKEN, force_download=True)
-
+    # Load JIT-traced model
+    jit_model_path = f"/data/jit_models/{model_id.replace('/', '_')}.pt"
+    model = torch.jit.load(jit_model_path).to(device)
+    model.eval()
+
+    # Load tokenizer (still regular HF)
     tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
 
-    inputs = tokenizer(text,
-                       max_length=256,
-                       truncation=True,
-                       padding="do_not_pad",
-                       return_tensors="pt").to(device)
-    model.eval()
+    # Tokenize input
+    inputs = tokenizer(
+        text,
+        max_length=256,
+        truncation=True,
+        padding="do_not_pad",
+        return_tensors="pt"
+    )
+    inputs = {k: v.to(device) for k, v in inputs.items()}
 
     with torch.no_grad():
-        logits = model(**inputs).logits
+        output = model(inputs["input_ids"], inputs["attention_mask"])
+        print(output) # debug
+        logits = output["logits"]
+
     release_model(model, model_id)
 
     probs = torch.nn.functional.softmax(logits, dim=1).cpu().numpy().flatten()
interfaces/manifesto.py CHANGED
@@ -26,18 +26,30 @@ def build_huggingface_path(language: str):
 
 def predict(text, model_id, tokenizer_id):
    device = torch.device("cpu")
-    model = AutoModelForSequenceClassification.from_pretrained(model_id, device_map="auto", token=HF_TOKEN)
-    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
 
-    inputs = tokenizer(text,
-                       max_length=256,
-                       truncation=True,
-                       padding="do_not_pad",
-                       return_tensors="pt").to(device)
+    # Load JIT-traced model
+    jit_model_path = f"/data/jit_models/{model_id.replace('/', '_')}.pt"
+    model = torch.jit.load(jit_model_path).to(device)
     model.eval()
 
+    # Load tokenizer (still regular HF)
+    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
+
+    # Tokenize input
+    inputs = tokenizer(
+        text,
+        max_length=256,
+        truncation=True,
+        padding="do_not_pad",
+        return_tensors="pt"
+    )
+    inputs = {k: v.to(device) for k, v in inputs.items()}
+
     with torch.no_grad():
-        logits = model(**inputs).logits
+        output = model(inputs["input_ids"], inputs["attention_mask"])
+        print(output) # debug
+        logits = output["logits"]
+
     release_model(model, model_id)
 
     probs = torch.nn.functional.softmax(logits, dim=1).cpu().numpy().flatten()
interfaces/ontolisst.py CHANGED
@@ -44,29 +44,30 @@ def build_huggingface_path(language: str):
 
 def predict(text, model_id, tokenizer_id):
     device = torch.device("cpu")
-    model = AutoModelForSequenceClassification.from_pretrained(model_id, device_map="auto", token=HF_TOKEN)
-    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
-
-    # --- DEBUG ---
-
-    disk_space = get_disk_space('/data/')
-    print("Disk Space Info:")
-    for key, value in disk_space.items():
-        print(f"{key}: {value}")
-
-    # ---
-
-    model.to(device)
 
-    inputs = tokenizer(text,
-                       max_length=256,
-                       truncation=True,
-                       padding="do_not_pad",
-                       return_tensors="pt").to(device)
+    # Load JIT-traced model
+    jit_model_path = f"/data/jit_models/{model_id.replace('/', '_')}.pt"
+    model = torch.jit.load(jit_model_path).to(device)
     model.eval()
 
+    # Load tokenizer (still regular HF)
+    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
+
+    # Tokenize input
+    inputs = tokenizer(
+        text,
+        max_length=256,
+        truncation=True,
+        padding="do_not_pad",
+        return_tensors="pt"
+    )
+    inputs = {k: v.to(device) for k, v in inputs.items()}
+
     with torch.no_grad():
-        logits = model(**inputs).logits
+        output = model(inputs["input_ids"], inputs["attention_mask"])
+        print(output) # debug
+        logits = output["logits"]
+
     release_model(model, model_id)
 
     probs = torch.nn.functional.softmax(logits, dim=1).cpu().numpy().flatten()
interfaces/sentiment.py CHANGED
@@ -30,19 +30,30 @@ def build_huggingface_path(language: str):
 
 def predict(text, model_id, tokenizer_id):
     device = torch.device("cpu")
-    model = AutoModelForSequenceClassification.from_pretrained(model_id, device_map="auto", token=HF_TOKEN)
-    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
-    model.to(device)
 
-    inputs = tokenizer(text,
-                       max_length=256,
-                       truncation=True,
-                       padding="do_not_pad",
-                       return_tensors="pt").to(device)
+    # Load JIT-traced model
+    jit_model_path = f"/data/jit_models/{model_id.replace('/', '_')}.pt"
+    model = torch.jit.load(jit_model_path).to(device)
     model.eval()
 
+    # Load tokenizer (still regular HF)
+    tokenizer = AutoTokenizer.from_pretrained(tokenizer_id)
+
+    # Tokenize input
+    inputs = tokenizer(
+        text,
+        max_length=256,
+        truncation=True,
+        padding="do_not_pad",
+        return_tensors="pt"
+    )
+    inputs = {k: v.to(device) for k, v in inputs.items()}
+
     with torch.no_grad():
-        logits = model(**inputs).logits
+        output = model(inputs["input_ids"], inputs["attention_mask"])
+        print(output) # debug
+        logits = output["logits"]
+
     release_model(model, model_id)
 
     probs = torch.nn.functional.softmax(logits, dim=1).cpu().numpy().flatten()
utils.py CHANGED
@@ -75,7 +75,7 @@ def download_hf_models():
         safe_model_name = model_id.replace("/", "_")
         traced_model_path = os.path.join(JIT_DIR, f"{safe_model_name}.pt")
 
-        if os.path.exists(traced_model_path) or "pooled-cap" not in model_id:
+        if os.path.exists(traced_model_path):
            print(f"⏩ Skipping JIT — already exists: {traced_model_path}")
        else:
            print(f"⚙️ Tracing and saving: {traced_model_path}")