Spaces:

Luigi
/

Streaming-Zipformer

Running

App Files Files Community

Luigi committed on Jun 8

Commit

b26d94c

1 Parent(s): ab9b679

Fix local model path error

Browse files

Files changed (1) hide show

app/asr_worker.py +15 -29

app/asr_worker.py CHANGED Viewed

@@ -1,21 +1,13 @@
 import numpy as np
 import sherpa_onnx
-from pathlib import Path
 import scipy.signal
 from opencc import OpenCC
 from huggingface_hub import hf_hub_download
 converter = OpenCC('s2t')
-def resample_audio(audio, orig_sr, target_sr):
-    return scipy.signal.resample_poly(audio, target_sr, orig_sr)
-# HuggingFace repository ID and local model directory
 REPO_ID = "pfluo/k2fsa-zipformer-chinese-english-mixed"
-MODEL_DIR = Path("models") / REPO_ID.replace("/", "_")
-# Map logical names to paths within the repo
 FILES = {
     "tokens": "data/lang_char_bpe/tokens.txt",
     "encoder": "exp/encoder-epoch-99-avg-1.int8.onnx",
@@ -23,31 +15,25 @@ FILES = {
     "joiner": "exp/joiner-epoch-99-avg-1.int8.onnx",
 }
-# Download model files from HuggingFace Hub if missing
-def download_model(repo_id: str, model_dir: Path):
-    for subpath in FILES.values():
-        local_path = model_dir / subpath
-        if not local_path.exists():
-            print(f"Downloading {subpath} from {repo_id}...")
-            # Ensure parent directories exist
-            local_path.parent.mkdir(parents=True, exist_ok=True)
-            hf_hub_download(
-                repo_id=repo_id,
-                filename=subpath,
-                local_dir=str(model_dir),
-                local_dir_use_symlinks=False,
-            )
-# Initialize and download model on import
-download_model(REPO_ID, MODEL_DIR)
 # Build the online recognizer with int8 weights
 def create_recognizer():
     return sherpa_onnx.OnlineRecognizer.from_transducer(
-        tokens=str(MODEL_DIR / FILES['tokens']),
-        encoder=str(MODEL_DIR / FILES['encoder']),
-        decoder=str(MODEL_DIR / FILES['decoder']),
-        joiner=str(MODEL_DIR / FILES['joiner']),
         provider="cpu",
         num_threads=1,
         sample_rate=16000,

 import numpy as np
 import sherpa_onnx
 import scipy.signal
 from opencc import OpenCC
 from huggingface_hub import hf_hub_download
 converter = OpenCC('s2t')
+# ASR model repository and file paths
 REPO_ID = "pfluo/k2fsa-zipformer-chinese-english-mixed"
 FILES = {
     "tokens": "data/lang_char_bpe/tokens.txt",
     "encoder": "exp/encoder-epoch-99-avg-1.int8.onnx",
     "joiner": "exp/joiner-epoch-99-avg-1.int8.onnx",
 }
+# Download and cache each file via HuggingFace Hub
+LOCAL_PATHS = {}
+for key, path in FILES.items():
+    LOCAL_PATHS[key] = hf_hub_download(
+        repo_id=REPO_ID,
+        filename=path,
+    )
+# Audio resampling utility
+def resample_audio(audio: np.ndarray, orig_sr: int, target_sr: int) -> np.ndarray:
+    return scipy.signal.resample_poly(audio, target_sr, orig_sr)
 # Build the online recognizer with int8 weights
 def create_recognizer():
     return sherpa_onnx.OnlineRecognizer.from_transducer(
+        tokens=LOCAL_PATHS['tokens'],
+        encoder=LOCAL_PATHS['encoder'],
+        decoder=LOCAL_PATHS['decoder'],
+        joiner=LOCAL_PATHS['joiner'],
         provider="cpu",
         num_threads=1,
         sample_rate=16000,