silveroxides committed on
Commit
b970c25
·
1 Parent(s): ee0fa2a

add app.py and conversion code

Browse files
Files changed (5) hide show
  1. app.py +34 -0
  2. convert.py +73 -0
  3. hf_utils.py +50 -0
  4. requirements.txt +8 -0
  5. utils.py +6 -0
app.py ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
import gradio as gr

from convert import convert

# User-facing walkthrough rendered above the form.
DESCRIPTION = """
The steps are the following:

- Create a new model repo for the converted model if you do not already have one.
- Paste a read-access token in the your_hf_token box from hf.co/settings/tokens. Read access is enough given that we will open a PR against your created repo.
- Input a model id (username/repo) which can be put in clipboard by clicking the copy icon ⧉ next to the title of the repo then paste in the model_id box.
- Input the filename from the root dir of the repo that you would like to convert which can be added to clipboard by clicking the filename and then the copy icon ⧉ next to file names title and input that to filename box.
- Paste the model id of your new repo in the your_model_id box.
- Click "Submit".
- That's it! You'll get feedback if it works or not, and if it worked, you'll get the URL of the opened PR 🔥.

⚠️ If you encounter weird error messages, please have a look into the Logs and feel free to open a PR to correct the error messages.
"""

# One single-line text box per argument of convert(), in call order.
_INPUT_LABELS = ("your_hf_token", "model_id", "filename", "your_model_id")

demo = gr.Interface(
    fn=convert,
    inputs=[gr.Text(max_lines=1, label=label) for label in _INPUT_LABELS],
    outputs=[gr.Markdown(label="output")],
    title="Convert any weights only .pt, .pth, .bin, .ckpt to .safetensors and open a PR",
    description=DESCRIPTION,
    article="placeholder",
    flagging_mode="never",
)

demo.launch(show_api=True)
convert.py ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ import requests
3
+ import os
4
+ import shutil
5
+ from pathlib import Path
6
+ from typing import Any
7
+ from tempfile import TemporaryDirectory
8
+ from typing import Optional
9
+
10
+ import torch
11
+ from io import BytesIO
12
+
13
+ from huggingface_hub import CommitInfo, Discussion, HfApi, hf_hub_download
14
+ from huggingface_hub.file_download import repo_folder_name
15
+ import spaces
16
+
17
+
18
# Commit description used for the PR opened on the target repo.
# NOTE(review): the string contains no "{}" placeholder, so the
# COMMIT_MESSAGE.format(...) call in convert() is a no-op — confirm intent.
COMMIT_MESSAGE = " This PR adds weights in safetensors format"
# Conversion is done on CPU; torch.load below maps all tensors here.
device = "cpu"
20
+
21
def convert_pt_to_safetensors(model_path, safe_path):
    """Load a torch checkpoint and re-serialize it in safetensors format.

    Args:
        model_path: path to a ``.pt``/``.pth``/``.bin``/``.ckpt`` file.
        safe_path: destination path for the ``.safetensors`` file.
    """
    # Bug fix: save_file was called below but never imported anywhere in
    # this module, so every conversion died with a NameError. Import it
    # here from safetensors (already in requirements.txt).
    from safetensors.torch import save_file

    # SECURITY: weights_only=False unpickles arbitrary objects from an
    # untrusted, user-uploaded checkpoint — this is arbitrary code
    # execution. Kept as-is because some checkpoints carry non-tensor
    # state, but prefer weights_only=True whenever the inputs allow it.
    model = torch.load(model_path, map_location="cpu", weights_only=False)
    metadata = {"format": "pt"}
    # NOTE(review): save_file expects a flat dict of tensors; wrapped
    # checkpoints (e.g. {"state_dict": {...}}) would fail here — confirm
    # the expected input layout against real uploads.
    save_file(model, safe_path, metadata)
25
+
26
def convert_single(model_id: str, filename: str, folder: str, progress: Any, token: str):
    """Fetch one checkpoint (locally or from the Hub) and convert it.

    Returns:
        Path of the written ``.safetensors`` file, placed next to the
        source checkpoint with the extension swapped.
    """
    progress(0, desc="Downloading model")

    # Prefer a file already present on disk; otherwise pull it from the Hub.
    candidate = os.path.join(model_id, filename)
    if os.path.isfile(candidate):
        source_path = candidate
    else:
        source_path = hf_hub_download(
            repo_id=model_id,
            filename=filename,
            token=token,
            local_dir=os.path.dirname(candidate),
        )

    stem, _ext = os.path.splitext(source_path)
    target_path = stem + ".safetensors"
    convert_pt_to_safetensors(source_path, target_path)
    return target_path
38
+
39
+
40
def previous_pr(api: "HfApi", model_id: str, pr_title: str) -> Optional["Discussion"]:
    """Find an already-open PR on *model_id* titled *pr_title* that targets main.

    Returns the matching Discussion, or None when the repo's discussions
    cannot be listed or no such PR exists.
    """
    try:
        all_discussions = api.get_repo_discussions(repo_id=model_id)
    except Exception:
        return None

    for disc in all_discussions:
        # Skip anything that is not an open PR with the exact title.
        if disc.status != "open" or not disc.is_pull_request or disc.title != pr_title:
            continue
        detail = api.get_discussion_details(repo_id=model_id, discussion_num=disc.num)
        if detail.target_branch == "refs/heads/main":
            return disc
    return None
50
+
51
# NOTE(review): decorated for ZeroGPU, yet the conversion itself maps
# everything to CPU (device = "cpu", map_location="cpu") — confirm the
# GPU reservation is actually needed.
@spaces.GPU()
def convert(token: str, model_id: str, filename: str, your_model_id: str, progress=gr.Progress()):
    """Convert one checkpoint from *model_id* and open a PR on *your_model_id*.

    Returns a markdown string with the URL of the created PR; any failure
    is surfaced to the UI as a gr.exceptions.Error.
    (The gr.Progress() default is the standard Gradio idiom for progress
    tracking, not an accidental mutable default.)
    """
    api = HfApi()

    pr_title = "Adding model converted to .safetensors"

    with TemporaryDirectory() as d:
        folder = os.path.join(d, repo_folder_name(repo_id=model_id, repo_type="models"))
        os.makedirs(folder)
        new_pr = None
        try:
            converted_model = convert_single(model_id, filename, folder, progress, token)
            progress(0.7, desc="Uploading to Hub")
            # NOTE(review): COMMIT_MESSAGE has no "{}", so .format(...) is a no-op.
            new_pr = api.upload_file(path_or_fileobj=converted_model, path_in_repo=filename, repo_id=your_model_id, repo_type="model", token=token, commit_message=pr_title, commit_description=COMMIT_MESSAGE.format(your_model_id), create_pr=True)
            # Assumes upload_file's return is string-like and embeds the PR
            # number after a "%2F" URL-escape — fragile; verify against the
            # huggingface_hub version in use (CommitInfo exposes .pr_url).
            pr_number = new_pr.split("%2F")[-1].split("/")[0]
            link = f"Pr created at: {'https://huggingface.co/' + os.path.join(your_model_id, 'discussions', pr_number)}"
            progress(1, desc="Done")
        except Exception as e:
            # Re-raise as a Gradio error so the message shows in the UI.
            raise gr.exceptions.Error(str(e))
        finally:
            # Redundant with TemporaryDirectory cleanup, but frees the large
            # checkpoint immediately rather than at context exit.
            shutil.rmtree(folder)

    return link
hf_utils.py ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from huggingface_hub import get_hf_file_metadata, hf_hub_url, hf_hub_download, scan_cache_dir, whoami, list_models
2
+
3
+
4
def get_my_model_names(token):
    """List the model ids owned by the user the token belongs to.

    Args:
        token: a Hugging Face access token.

    Returns:
        (model_ids, error): a list of ``"user/repo"`` strings and None on
        success, or an empty list and the caught exception on failure.
    """
    try:
        author = whoami(token=token)
        # `use_auth_token=` and `.modelId` are deprecated/removed in current
        # huggingface_hub releases (requirements.txt pins no version, so the
        # latest gets installed); use the supported `token=` / `.id` forms.
        model_infos = list_models(author=author["name"], token=token)
        return [model.id for model in model_infos], None

    except Exception as e:
        return [], e
13
+
14
def download_file(repo_id: str, filename: str, token: str):
    """Download *filename* from *repo_id*, pinned to the commit currently at HEAD.

    Returns:
        file_path (:obj:`str`): The path to the downloaded file.
        revision (:obj:`str`): The commit hash of the file.
    """
    # Resolve the current commit first so the download is reproducible.
    file_url = hf_hub_url(repo_id=repo_id, filename=filename)
    commit_hash = get_hf_file_metadata(file_url, token=token).commit_hash

    local_path = hf_hub_download(
        repo_id=repo_id,
        filename=filename,
        revision=commit_hash,
        token=token,
    )
    return local_path, commit_hash
28
+
29
def delete_file(revision: str):
    """Remove one revision's files from the local Hugging Face cache.

    Args:
        revision (:obj:`str`): The commit hash whose cached files to delete.
    Returns:
        None
    """
    cache_info = scan_cache_dir()
    deletion_plan = cache_info.delete_revisions(revision)
    deletion_plan.execute()
38
+
39
def get_pr_url(api, repo_id, title):
    """Return the URL of an open PR on *repo_id* whose title equals *title*.

    Returns None when discussions cannot be listed or no open PR matches.
    """
    try:
        discussions = api.get_repo_discussions(repo_id=repo_id)
    except Exception:
        return None

    for disc in discussions:
        matches = disc.status == "open" and disc.is_pull_request and disc.title == title
        if matches:
            return f"https://huggingface.co/{repo_id}/discussions/{disc.num}"
requirements.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ huggingface_hub[hf_transfer]
2
+ safetensors
3
+ transformers
4
+ accelerate
5
+ omegaconf
6
+ pytorch_lightning
7
+ pyngrok
8
+
utils.py ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
def is_google_colab():
    """Return True when running inside Google Colab, False otherwise.

    Detection is done by attempting to import the ``google.colab`` module,
    which only exists in the Colab runtime.
    """
    try:
        import google.colab  # noqa: F401  (import used only as a probe)
        return True
    # Bug fix: the bare `except:` also swallowed KeyboardInterrupt and
    # SystemExit; only a failed import means "not Colab".
    except ImportError:
        return False