Spaces:

jhansss
/

SingingSDS

Running

App Files Community

jhansss committed on Jul 1

Commit

be053b4

1 Parent(s): 5749621

llm refactor

Browse files

Files changed (6) hide show

modules/llm/__init__.py +11 -0
modules/llm/base.py +15 -0
modules/{llm.py → llm/hf_pipeline.py} +7 -35
modules/llm/registry.py +19 -0
tests/__init__.py +0 -0
tests/test_llm_infer.py +26 -0

modules/llm/__init__.py ADDED Viewed

	@@ -0,0 +1,11 @@

+from .base import AbstractLLMModel
+from .registry import LLM_MODEL_REGISTRY, get_llm_model, register_llm_model
+from .hf_pipeline import HFTextGenerationLLM
+from .qwen import QwenLLM
+__all__ = [
+    "AbstractLLMModel",
+    "get_llm_model",
+    "register_llm_model",
+    "LLM_MODEL_REGISTRY",
+]

modules/llm/base.py ADDED Viewed

	@@ -0,0 +1,15 @@

+from abc import ABC, abstractmethod
+class AbstractLLMModel(ABC):
+    def __init__(
+        self, model_id: str, device: str = "cpu", cache_dir: str = "cache", **kwargs
+    ):
+        print(f"Loading LLM model {model_id}...")
+        self.model_id = model_id
+        self.device = device
+        self.cache_dir = cache_dir
+    @abstractmethod
+    def generate(self, prompt: str, **kwargs) -> str:
+        pass

modules/{llm.py → llm/hf_pipeline.py} RENAMED Viewed

@@ -1,45 +1,16 @@
 import os
-from abc import ABC, abstractmethod
 from transformers import pipeline
-LLM_MODEL_REGISTRY = {}
-hf_token = os.getenv("HF_TOKEN")
-class AbstractLLMModel(ABC):
-    def __init__(
-        self, model_id: str, device: str = "cpu", cache_dir: str = "cache", **kwargs
-    ):
-        print(f"Loading LLM model {model_id}...")
-        self.model_id = model_id
-        self.device = device
-        self.cache_dir = cache_dir
-    @abstractmethod
-    def generate(self, prompt: str, **kwargs) -> str:
-        pass
-def register_llm_model(prefix: str):
-    def wrapper(cls):
-        assert issubclass(cls, AbstractLLMModel), f"{cls} must inherit AbstractLLMModel"
-        LLM_MODEL_REGISTRY[prefix] = cls
-        return cls
-    return wrapper
-def get_llm_model(model_id: str, device="cpu", **kwargs) -> AbstractLLMModel:
-    for prefix, cls in LLM_MODEL_REGISTRY.items():
-        if model_id.startswith(prefix):
-            return cls(model_id, device=device, **kwargs)
-    raise ValueError(f"No LLM wrapper found for model: {model_id}")
-@register_llm_model("google/gemma")
-@register_llm_model("tii/")  # e.g., Falcon
-@register_llm_model("meta-llama")
 class HFTextGenerationLLM(AbstractLLMModel):
     def __init__(
         self, model_id: str, device: str = "cpu", cache_dir: str = "cache", **kwargs
@@ -53,6 +24,7 @@ class HFTextGenerationLLM(AbstractLLMModel):
             device=0 if device == "cuda" else -1,
             return_full_text=False,
             token=hf_token,
             **kwargs,
         )

 import os
 from transformers import pipeline
+from .base import AbstractLLMModel
+from .registry import register_llm_model
+hf_token = os.getenv("HF_TOKEN")
+@register_llm_model("openai-community/")
+@register_llm_model("google/gemma-")
+@register_llm_model("meta-llama/Llama-")
 class HFTextGenerationLLM(AbstractLLMModel):
     def __init__(
         self, model_id: str, device: str = "cpu", cache_dir: str = "cache", **kwargs
             device=0 if device == "cuda" else -1,
             return_full_text=False,
             token=hf_token,
+            trust_remote_code=True,
             **kwargs,
         )

modules/llm/registry.py ADDED Viewed

	@@ -0,0 +1,19 @@

+from .base import AbstractLLMModel
+LLM_MODEL_REGISTRY = {}
+def register_llm_model(prefix: str):
+    def wrapper(cls):
+        assert issubclass(cls, AbstractLLMModel), f"{cls} must inherit AbstractLLMModel"
+        LLM_MODEL_REGISTRY[prefix] = cls
+        return cls
+    return wrapper
+def get_llm_model(model_id: str, device="cpu", **kwargs) -> AbstractLLMModel:
+    for prefix, cls in LLM_MODEL_REGISTRY.items():
+        if model_id.startswith(prefix):
+            return cls(model_id, device=device, **kwargs)
+    raise ValueError(f"No LLM wrapper found for model: {model_id}")

tests/__init__.py ADDED Viewed

File without changes

tests/test_llm_infer.py ADDED Viewed

	@@ -0,0 +1,26 @@

+from modules.llm import get_llm_model
+if __name__ == "__main__":
+    supported_llms = [
+        # "MiniMaxAI/MiniMax-M1-80k", #-》load with custom code
+        # "Qwen/Qwen-1_8B",
+        # "meta-llama/Llama-3.1-8B-Instruct", # pending for approval
+        # "tiiuae/Falcon-H1-1B-Base",
+        # "tiiuae/Falcon-H1-3B-Instruct",
+        # "tencent/Hunyuan-A13B-Instruct", # -> load with custom code
+        # "deepseek-ai/DeepSeek-R1-0528",
+        # "openai-community/gpt2-xl",
+        # "google/gemma-2-2b",
+    ]
+    for model_id in supported_llms:
+        try:
+            print(f"Loading model: {model_id}")
+            llm = get_llm_model(model_id, cache_dir="./.cache")
+            prompt = "你好，今天你心情怎么样？"
+            result = llm.generate(prompt)
+            print(f"=================")
+            print(f"[{model_id}] LLM inference result:", result)
+        except Exception as e:
+            print(f"Failed to load model {model_id}: {e}")
+            breakpoint()
+            continue