Spaces:

MoraxCheng
/

Transeption_iGEM_BASISCHINA_2025

Running on Zero

App Files Community

MoraxCheng committed 20 days ago

Commit

d416dd8

1 Parent(s): b55bd43

Implement direct model loading with manual config handling and enhance cache management for model loading

Browse files

Files changed (2) hide show

.claude/settings.local.json +4 -1
app.py +117 -30

.claude/settings.local.json CHANGED Viewed

@@ -11,7 +11,10 @@
       "Bash(python test:*)",
       "Bash(rm:*)",
       "Bash(chmod:*)",
-      "Bash(cp:*)"
     ],
     "deny": []
   }

       "Bash(python test:*)",
       "Bash(rm:*)",
       "Bash(chmod:*)",
+      "Bash(cp:*)",
+      "Bash(ls:*)",
+      "Bash(python:*)",
+      "Bash(conda:*)"
     ],
     "deny": []
   }

app.py CHANGED Viewed

@@ -111,6 +111,67 @@ def get_model_path(model_name):
     # Always return the HF Hub path to leverage this caching
     return f"PascalNotin/{model_name}"
 def load_model_cached(model_type):
     """Load model with caching to avoid re-downloading"""
     global MODEL_CACHE
@@ -125,14 +186,33 @@ def load_model_cached(model_type):
     model_path = get_model_path(model_name)
     try:
-        # Create cache directory if it doesn't exist
         cache_dir = "/tmp/huggingface/transformers"
         os.makedirs(cache_dir, exist_ok=True)
-        # Try loading with minimal parameters first
         model = tranception.model_pytorch.TranceptionLMHeadModel.from_pretrained(
             model_path,
-            cache_dir=cache_dir
         )
         MODEL_CACHE[model_type] = model
         print(f"{model_type} model loaded and cached")
@@ -155,43 +235,50 @@ def load_model_cached(model_type):
         except Exception as e2:
             print(f"Alternative loading also failed: {e2}")
-            # Final attempt: manually download config first
             try:
                 import json
                 import requests
-                # Download config.json manually
-                config_url = f"https://huggingface.co/PascalNotin/Tranception_{model_type}/raw/main/config.json"
-                print(f"Manually downloading config from: {config_url}")
-                response = requests.get(config_url)
-                if response.status_code == 200:
-                    # Save config locally
-                    local_model_dir = f"/tmp/Tranception_{model_type}"
-                    os.makedirs(local_model_dir, exist_ok=True)
-                    with open(f"{local_model_dir}/config.json", "w") as f:
-                        json.dump(response.json(), f)
-                    # Now try loading from the HF model ID again
-                    model = tranception.model_pytorch.TranceptionLMHeadModel.from_pretrained(
-                        f"PascalNotin/Tranception_{model_type}",
-                        cache_dir=cache_dir,
-                        local_files_only=False
-                    )
-                    MODEL_CACHE[model_type] = model
-                    print(f"{model_type} model loaded successfully after manual config download")
-                    return model
-                else:
-                    print(f"Failed to download config: {response.status_code}")
             except Exception as e3:
-                print(f"Manual download also failed: {e3}")
             # Fallback to Medium if requested model fails
-            if model_type != "Medium":
                 print("Falling back to Medium model...")
                 return load_model_cached("Medium")
-            raise
 AA_vocab = "ACDEFGHIKLMNPQRSTVWY"
 tokenizer = PreTrainedTokenizerFast(tokenizer_file="./tranception/utils/tokenizers/Basic_tokenizer",

     # Always return the HF Hub path to leverage this caching
     return f"PascalNotin/{model_name}"
+def load_model_direct(model_type):
+    """Direct model loading with manual config handling"""
+    import json
+    import tempfile
+    from transformers import AutoConfig
+    print(f"Attempting direct load of {model_type} model...")
+    # Create a proper config manually based on model type
+    config_data = {
+        "architectures": ["TranceptionLMHeadModel"],
+        "model_type": "tranception",
+        "_name_or_path": f"Tranception_{model_type}",
+        "activation_function": "squared_relu",
+        "attention_mode": "tranception",
+        "attn_pdrop": 0.1,
+        "embd_pdrop": 0.1,
+        "initializer_range": 0.02,
+        "layer_norm_epsilon": 1e-5,
+        "n_embd": 768 if model_type == "Small" else (1024 if model_type == "Medium" else 1280),
+        "n_head": 12 if model_type == "Small" else (16 if model_type == "Medium" else 20),
+        "n_inner": None,
+        "n_layer": 12 if model_type == "Small" else (24 if model_type == "Medium" else 30),
+        "n_positions": 2048,
+        "resid_pdrop": 0.1,
+        "summary_activation": None,
+        "summary_first_dropout": 0.1,
+        "summary_proj_to_labels": True,
+        "summary_type": "cls_index",
+        "summary_use_proj": True,
+        "vocab_size": 50257,
+        "pad_token_id": 50256,
+        "bos_token_id": 50256,
+        "eos_token_id": 50256
+    }
+    # Save config to temp file
+    with tempfile.NamedTemporaryFile(mode='w', suffix='.json', delete=False) as f:
+        json.dump(config_data, f)
+        config_path = f.name
+    try:
+        # Load config from temp file
+        config = AutoConfig.from_pretrained(config_path, trust_remote_code=True)
+        # Load model with manual config
+        model = tranception.model_pytorch.TranceptionLMHeadModel.from_pretrained(
+            f"PascalNotin/Tranception_{model_type}",
+            config=config,
+            trust_remote_code=True,
+            ignore_mismatched_sizes=True
+        )
+        os.unlink(config_path)  # Clean up temp file
+        return model
+    except Exception as e:
+        print(f"Direct load failed: {e}")
+        if os.path.exists(config_path):
+            os.unlink(config_path)
+        raise
 def load_model_cached(model_type):
     """Load model with caching to avoid re-downloading"""
     global MODEL_CACHE
     model_path = get_model_path(model_name)
     try:
+        # Clear any corrupted cache files
+        import shutil
         cache_dir = "/tmp/huggingface/transformers"
+        if os.path.exists(cache_dir):
+            # Remove corrupted tranception cache files
+            for file in os.listdir(cache_dir):
+                if "tranception" in file.lower():
+                    try:
+                        filepath = os.path.join(cache_dir, file)
+                        if os.path.isfile(filepath) and os.path.getsize(filepath) < 1000:
+                            os.remove(filepath)
+                            print(f"Removed corrupted cache file: {file}")
+                    except:
+                        pass
         os.makedirs(cache_dir, exist_ok=True)
+        # Try loading with force_download to avoid corrupted cache
+        # Use HF_ENDPOINT environment variable to ensure proper URL
+        os.environ["HF_ENDPOINT"] = "https://huggingface.co"
         model = tranception.model_pytorch.TranceptionLMHeadModel.from_pretrained(
             model_path,
+            cache_dir=cache_dir,
+            force_download=True,
+            trust_remote_code=True,
+            resume_download=False
         )
         MODEL_CACHE[model_type] = model
         print(f"{model_type} model loaded and cached")
         except Exception as e2:
             print(f"Alternative loading also failed: {e2}")
+            # Final attempt: use AutoModel with manual config
             try:
                 import json
                 import requests
+                from transformers import AutoConfig, AutoModel
+                print(f"Attempting to load with AutoModel...")
+                # Clear cache and try with AutoModel which handles config better
+                cache_dir_auto = "/tmp/huggingface/auto"
+                os.makedirs(cache_dir_auto, exist_ok=True)
+                # Try direct loading with manual config
+                model = load_model_direct(model_type)
+                MODEL_CACHE[model_type] = model
+                print(f"{model_type} model loaded successfully with AutoConfig")
+                return model
             except Exception as e3:
+                print(f"AutoModel loading also failed: {e3}")
             # Fallback to Medium if requested model fails
+            if model_type == "Large":
                 print("Falling back to Medium model...")
                 return load_model_cached("Medium")
+            elif model_type == "Medium":
+                print("Medium model failed, trying Small model...")
+                # Try Small model as last resort
+                try:
+                    model = tranception.model_pytorch.TranceptionLMHeadModel.from_pretrained(
+                        "PascalNotin/Tranception_Small",
+                        trust_remote_code=True,
+                        force_download=True,
+                        cache_dir="/tmp/huggingface/small"
+                    )
+                    MODEL_CACHE["Small"] = model
+                    print("Small model loaded as fallback")
+                    return model
+                except Exception as e_small:
+                    print(f"Small model also failed: {e_small}")
+                    raise RuntimeError("Failed to load any Tranception model")
+            else:
+                raise RuntimeError(f"Failed to load {model_type} model")
 AA_vocab = "ACDEFGHIKLMNPQRSTVWY"
 tokenizer = PreTrainedTokenizerFast(tokenizer_file="./tranception/utils/tokenizers/Basic_tokenizer",