build-space / app_logic.py
broadfield-dev's picture
Update app_logic.py
13591d5 verified
raw
history blame
15.3 kB
import os
import re
import tempfile
import shutil # For rmtree
import git # Used by Repository indirectly
from huggingface_hub import (
create_repo,
upload_folder,
list_repo_files,
Repository,
whoami,
)
import logging
from pathlib import Path
from PIL import Image
# Configure logging BEFORE anything can emit a record. A module-level
# logging.warning() call implicitly configures the root logger with default
# settings when it has no handlers, which would turn the basicConfig() call
# below into a no-op and silently drop the INFO level and custom format.
logging.basicConfig(
    level=logging.INFO,
    format="%(asctime)s - %(name)s - %(levelname)s - %(message)s"
)
logger = logging.getLogger(__name__)

# Attempt to import keylock_decode; the KeyLock Wallet feature is optional and
# is disabled (flag False, decoder None) when the library is not installed.
try:
    from keylock_decode import decode_from_image_pil
    KEYLOCK_DECODE_AVAILABLE = True
except ImportError:
    KEYLOCK_DECODE_AVAILABLE = False
    decode_from_image_pil = None
    logger.warning("keylock-decode library not found. KeyLock Wallet image feature will be disabled.")
# --- Helper: resolve the Hugging Face API token ---
def _get_api_token(ui_token_from_textbox=None):
    """Resolve the Hugging Face API token to use.

    The ``HF_TOKEN`` environment variable takes precedence; the value typed
    into the UI textbox is used only when the environment variable is unset
    or empty.

    Returns:
        A ``(token, error_message)`` tuple. Exactly one element is ``None``:
        ``(token, None)`` on success, ``(None, message)`` when no token is
        available from either source.
    """
    token_from_env = os.getenv('HF_TOKEN')
    if token_from_env:
        logger.info("Using HF_TOKEN from environment.")
        return token_from_env, None

    if not ui_token_from_textbox:
        logger.warning("HF API token not found in environment or UI textbox.")
        return None, "Error: Hugging Face API token not provided. Please enter it or load from a KeyLock Wallet image."

    logger.info("Using API token from UI textbox.")
    return ui_token_from_textbox, None
# --- KeyLock Wallet: decode an image and export its secrets to the environment ---
def load_token_from_image_and_set_env(image_pil_object: Image.Image, password: str):
    """Decode a KeyLock Wallet image and return a status report.

    Calls ``decode_from_image_pil`` with ``set_environment_variables=True``
    and builds a report from the library's status messages plus a summary of
    the decoded keys. Values whose key contains TOKEN, KEY, SECRET or PASS
    are masked in the summary.

    Args:
        image_pil_object: The wallet image to decode; ``None`` is rejected.
        password: Password for decoding; must be non-empty.

    Returns:
        A newline-joined status string. Validation failures and decoding
        errors are reported in the returned text rather than raised.
    """
    if not KEYLOCK_DECODE_AVAILABLE:
        return "Error: KeyLock-Decode library is not installed. This feature is disabled."
    if image_pil_object is None:
        return "Error: No KeyLock Wallet image provided for decoding."
    if not password:
        return "Error: Password cannot be empty for image decoding."

    sensitive_markers = ('TOKEN', 'KEY', 'SECRET', 'PASS')
    status_messages_display = []
    try:
        logger.info("Attempting to decode from KeyLock Wallet image...")
        decoded_data, status_msgs_from_lib = decode_from_image_pil(
            image_pil_object, password, set_environment_variables=True
        )
        # Coerce to str: the final join runs outside this try block, so a
        # non-string (or missing) message list must not be able to break it.
        status_messages_display.extend(str(msg) for msg in (status_msgs_from_lib or []))

        if decoded_data:
            status_messages_display.append("\n**Decoded Data Summary (sensitive values masked):**")
            for key, value in decoded_data.items():
                key_upper = str(key).upper()
                is_sensitive = any(marker in key_upper for marker in sensitive_markers)
                display_value = '********' if is_sensitive else value
                status_messages_display.append(f"- {key}: {display_value}")

            # Only claim success when the token actually came from the image;
            # an HF_TOKEN that was already in the environment is not evidence
            # that the image contained one.
            hf_token_decoded = 'HF_TOKEN' in decoded_data
            if hf_token_decoded and os.getenv('HF_TOKEN'):
                status_messages_display.append("\n**SUCCESS: HF_TOKEN was found and set in environment from KeyLock Wallet image.**")
            elif hf_token_decoded:
                status_messages_display.append("\nWarning: HF_TOKEN decoded but os.getenv('HF_TOKEN') not found (unexpected).")
            else:
                status_messages_display.append("\nNote: HF_TOKEN not specifically found in decoded KeyLock Wallet image data.")
    except ValueError as e:  # Specific errors from keylock-decode
        status_messages_display.append(f"**Decoding Error (e.g., bad password, corrupted data):** {e}")
    except Exception as e:
        logger.exception("Unexpected error during KeyLock Wallet image decoding:")
        status_messages_display.append(f"**An unexpected error occurred during decoding:** {str(e)}")
    return "\n".join(status_messages_display)
# --- Markdown parsing: extract the Space name and file definitions ---
def parse_markdown(markdown_input):
    """Parse a Space description written in markdown.

    Recognised structure:

    * ``# Space: owner/name`` (or ``# Space: name``) before the first file
      header sets ``owner_md`` / ``repo_name_md``.
    * ``### File: path`` starts a new file; every following line up to the
      next file header becomes that file's content.
    * Lines starting with a triple backtick inside a file section are fence
      markers and are dropped from the content.

    Args:
        markdown_input: The markdown text. ``None`` is treated as empty.

    Returns:
        A dict with keys ``repo_name_md``, ``owner_md`` and ``files``, where
        ``files`` is a list of ``{"path": ..., "content": ...}`` dicts.
        Sections whose header has an empty path are discarded.
    """
    file_marker = "### File:"
    space_marker = "# Space:"

    space_info = {"repo_name_md": "", "owner_md": "", "files": []}
    current_file_path = None
    current_file_content_lines = []
    in_file_definition = False

    for line_content_orig in (markdown_input or "").strip().split("\n"):
        line_content_stripped = line_content_orig.strip()

        if line_content_stripped.startswith(file_marker):
            # A new header closes the previous file section (if it had a path).
            if current_file_path:
                space_info["files"].append(
                    {"path": current_file_path, "content": "\n".join(current_file_content_lines)}
                )
            # Slice off the prefix only; str.replace would also strip any
            # later occurrence of the marker text inside the path.
            current_file_path = line_content_stripped[len(file_marker):].strip()
            current_file_content_lines = []
            in_file_definition = True
            continue

        if not in_file_definition:
            # Before the first file header only the Space name line matters.
            if line_content_stripped.startswith(space_marker):
                full_space_name_md = line_content_stripped[len(space_marker):].strip()
                if "/" in full_space_name_md:
                    owner_part, repo_part = full_space_name_md.split("/", 1)
                    space_info["owner_md"] = owner_part
                    space_info["repo_name_md"] = repo_part
                else:
                    space_info["repo_name_md"] = full_space_name_md
            continue

        if line_content_stripped.startswith("```"):
            continue  # fence markers are not part of the file content

        current_file_content_lines.append(line_content_orig)

    if current_file_path:
        space_info["files"].append(
            {"path": current_file_path, "content": "\n".join(current_file_content_lines)}
        )
    return space_info
# --- Helper: build the `owner/name` repo id ---
def _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui):
if not space_name_ui: return None, "Error: Space Name cannot be empty."
if "/" in space_name_ui: return None, "Error: Space Name should not contain '/'. Use Owner field."
final_owner = owner_ui; error_message = None
if not final_owner:
resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
if token_err: return None, token_err
if not resolved_api_token: return None, "Error: API token required for auto owner determination."
try:
user_info = whoami(token=resolved_api_token)
if user_info and 'name' in user_info: final_owner = user_info['name']
else: error_message = "Error: Could not retrieve username. Check token/permissions or specify Owner."
except Exception as e: error_message = f"Error retrieving username: {str(e)}. Specify Owner."
if error_message: return None, error_message
if not final_owner: return None, "Error: Owner could not be determined."
return f"{final_owner}/{space_name_ui}", None
# --- New/Modified Functions for File Browsing and Editing ---
# Directory under the system temp dir that holds the local Space clones used
# for file browsing; it is created at import time if it does not exist yet.
CLONE_BASE_DIR = Path(tempfile.gettempdir()).joinpath("space_builder_active_clones")
CLONE_BASE_DIR.mkdir(parents=True, exist_ok=True)
def _cleanup_old_clones(repo_id_slug_to_keep=None):
    """Delete clone directories under ``CLONE_BASE_DIR``.

    Every sub-directory is removed except the one whose name equals
    ``repo_id_slug_to_keep`` (when given). Non-directory entries are left
    alone. Any error is logged and swallowed, and it ends the cleanup pass.
    """
    try:
        for entry in CLONE_BASE_DIR.iterdir():
            if not entry.is_dir():
                continue
            is_protected = repo_id_slug_to_keep and entry.name == repo_id_slug_to_keep
            if is_protected:
                continue
            logger.info(f"Cleaning up old clone: {entry}")
            shutil.rmtree(entry)
    except Exception as cleanup_error:
        logger.error(f"Error during old clone cleanup: {cleanup_error}")
def get_space_local_clone_path(ui_api_token_from_textbox, space_name_ui, owner_ui, force_refresh=False):
    """Return the path of a local clone of the Space, cloning it if needed.

    Clones of other Spaces under ``CLONE_BASE_DIR`` are removed first. An
    existing clone of the requested Space is reused as-is unless
    ``force_refresh`` is true, in which case it is deleted and cloned again.

    Returns:
        A ``(local_path_str, error_message)`` tuple; ``local_path_str`` is
        ``None`` whenever an error message is returned.
    """
    if owner_ui:
        repo_id_for_error_logging = f"{owner_ui}/{space_name_ui}"
    else:
        repo_id_for_error_logging = space_name_ui

    try:
        api_token, token_problem = _get_api_token(ui_api_token_from_textbox)
        if token_problem:
            return None, token_problem

        repo_id, repo_problem = _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui)
        if repo_problem:
            return None, repo_problem
        repo_id_for_error_logging = repo_id

        # "owner/name" becomes "owner_name" so it can serve as a directory name.
        slug = repo_id.replace("/", "_")
        _cleanup_old_clones(repo_id_slug_to_keep=slug)
        clone_dir = CLONE_BASE_DIR / slug

        if force_refresh and clone_dir.exists():
            logger.info(f"Force refresh: Removing existing clone at {clone_dir}")
            shutil.rmtree(clone_dir)

        if clone_dir.exists():
            # No `git pull` here: a reused clone is only refreshed via
            # force_refresh=True, which re-clones from scratch.
            logger.info(f"Using existing clone for {repo_id} at {clone_dir}")
            return str(clone_dir), None

        clone_dir.mkdir(parents=True, exist_ok=True)
        logger.info(f"Cloning Space {repo_id} to {clone_dir}...")
        try:
            Repository(
                local_dir=str(clone_dir),
                clone_from=f"https://huggingface.co/spaces/{repo_id}",
                repo_type="space",
                use_auth_token=api_token,
            )
            logger.info(f"Successfully cloned {repo_id} to {clone_dir}")
        except Exception as clone_exc:
            logger.exception(f"Error cloning {repo_id}:")
            # Do not leave a partial clone behind; it would be reused next time.
            if clone_dir.exists():
                shutil.rmtree(clone_dir)
            return None, f"Error cloning Space '{repo_id}': {str(clone_exc)}"
        return str(clone_dir), None
    except Exception as unexpected_error:
        logger.exception(f"Error in get_space_local_clone_path for {repo_id_for_error_logging}:")
        return None, f"Error preparing local clone: {str(unexpected_error)}"
def read_file_from_local_path(absolute_local_file_path_str: str):
    """Read a local file as UTF-8 text.

    Returns:
        A ``(content, error_message)`` tuple. ``content`` is ``None`` when the
        path is not an existing regular file or when reading fails (the
        failure is also logged with its traceback).
    """
    try:
        target = Path(absolute_local_file_path_str)
        if target.is_file():
            return target.read_text(encoding="utf-8"), None
        return None, f"Error: Path is not a file or does not exist: {absolute_local_file_path_str}"
    except Exception as read_error:
        logger.exception(f"Error reading local file {absolute_local_file_path_str}:")
        return None, f"Error reading file content: {str(read_error)}"
# --- Core Functions: `create_space`, `update_space_file` (view_space_files can be deprecated) ---
def create_space(ui_api_token_from_textbox, space_name_ui, owner_ui, sdk_ui, markdown_input):
    """Create a Space (or reuse an existing one) and upload the markdown-defined files.

    The files described in ``markdown_input`` are written to a temporary
    staging directory, the Space repo is created if it does not already
    exist, and the staging directory is uploaded in a single commit.

    Args:
        ui_api_token_from_textbox: Token typed in the UI (fallback source).
        space_name_ui: Space name without owner.
        owner_ui: Owner namespace; resolved from the token when empty.
        sdk_ui: Value passed to ``create_repo`` as ``space_sdk``.
        markdown_input: Markdown text understood by ``parse_markdown``.

    Returns:
        A status string for display: a success message with a link to the
        Space, or a message starting with ``Error``. Exceptions are logged
        and reported in the returned text rather than raised.
    """
    repo_id_for_error_logging = f"{owner_ui}/{space_name_ui}" if owner_ui else space_name_ui
    try:
        resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
        if token_err:
            return token_err
        repo_id, err = _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui)
        if err:
            return err
        repo_id_for_error_logging = repo_id

        space_info = parse_markdown(markdown_input)
        if not space_info["files"]:
            return "Error: No files found in markdown. Use '### File: path/to/file.ext'."

        with tempfile.TemporaryDirectory() as temp_dir:  # Temp dir for staging files from markdown
            repo_staging_path = Path(temp_dir) / "repo_staging_content"
            repo_staging_path.mkdir(exist_ok=True)
            staging_root = repo_staging_path.resolve()

            for file_info in space_info["files"]:
                declared_path = file_info.get("path")
                if not declared_path:
                    continue
                # The path comes from user-supplied markdown. Joining an
                # absolute path or one containing ".." would escape the
                # staging directory and write to arbitrary host locations,
                # so leading slashes are dropped and the resolved target
                # must lie strictly inside the staging root.
                file_path_abs = (staging_root / declared_path.lstrip("/")).resolve()
                if staging_root not in file_path_abs.parents:
                    return f"Error: Invalid file path '{declared_path}' in markdown. Paths must be relative and stay inside the Space."
                file_path_abs.parent.mkdir(parents=True, exist_ok=True)
                with open(file_path_abs, "w", encoding="utf-8") as f:
                    f.write(file_info["content"])

            try:
                # exist_ok=True lets the Hub API tolerate an already-existing
                # repo, instead of guessing from the exception message text.
                create_repo(
                    repo_id=repo_id,
                    token=resolved_api_token,
                    repo_type="space",
                    space_sdk=sdk_ui,
                    private=False,
                    exist_ok=True,
                )
            except Exception as e:
                return f"Error creating Space '{repo_id}': {str(e)}"
            logger.info(f"Space {repo_id} already exists or creation confirmed, proceeding with upload.")

            upload_folder(
                repo_id=repo_id,
                folder_path=str(staging_root),
                path_in_repo=".",
                token=resolved_api_token,
                repo_type="space",
                commit_message=f"Initial Space setup of {repo_id} via Builder",
            )
            return f"Successfully created/updated Space: [{repo_id}](https://huggingface.co/spaces/{repo_id})"
    except Exception as e:
        logger.exception(f"Error in create_space for {repo_id_for_error_logging}:")
        return f"Error during Space creation/update: {str(e)}"
# view_space_files can be removed or kept as a simple alternative list view
# def view_space_files(...)
def update_space_file(ui_api_token_from_textbox, space_name_ui, owner_ui, file_path_in_repo, file_content, commit_message_ui):
    """Write one file into a Space and push the change.

    The Space is cloned into a fresh temporary directory, the file at
    ``file_path_in_repo`` (relative to the repo root) is created or
    overwritten with ``file_content``, and the clone is pushed with
    ``commit_message_ui`` (a default message is used when it is empty).

    Returns:
        A status string for display: a success message with a link to the
        Space, or a message starting with ``Error``. Exceptions are logged
        and reported in the returned text rather than raised.
    """
    repo_id_for_error_logging = f"{owner_ui}/{space_name_ui}" if owner_ui else space_name_ui
    try:
        resolved_api_token, token_err = _get_api_token(ui_api_token_from_textbox)
        if token_err:
            return token_err
        repo_id, err = _determine_repo_id(ui_api_token_from_textbox, space_name_ui, owner_ui)
        if err:
            return err
        repo_id_for_error_logging = repo_id

        if not file_path_in_repo:
            return "Error: File Path to update cannot be empty."
        # Normalise separators BEFORE stripping leading slashes; in the other
        # order a leading os.sep would survive as a leading '/'.
        file_path_in_repo = file_path_in_repo.replace(os.sep, '/').lstrip('/')
        if not file_path_in_repo:
            return "Error: File Path to update cannot be empty."

        # The path is user input: refuse parent-directory traversal and
        # writes into git's own metadata before spending time on a clone.
        path_parts = Path(file_path_in_repo).parts
        if ".." in path_parts or path_parts[0].lower() == ".git":
            return f"Error: Invalid file path `{file_path_in_repo}`. Paths must stay inside the Space repository."

        commit_message_ui = commit_message_ui or f"Update {file_path_in_repo} via Space Builder"

        with tempfile.TemporaryDirectory() as temp_dir_for_update:  # Fresh temp dir for this update operation
            repo_local_clone_path = Path(temp_dir_for_update) / "update_clone"
            cloned_repo = Repository(
                local_dir=str(repo_local_clone_path),
                clone_from=f"https://huggingface.co/spaces/{repo_id}",
                repo_type="space", use_auth_token=resolved_api_token,
                # NOTE(review): this email value looks like a scrape/obfuscation
                # placeholder - confirm the intended address.
                git_user="Space Builder Bot", git_email="[email protected]"  # Optional
            )
            logger.info(f"Cloned Space {repo_id} to {repo_local_clone_path} for update operation.")

            # Resolve inside the clone and re-check containment, so a symlink
            # in the repository cannot redirect the write outside of it.
            clone_root = Path(cloned_repo.local_dir).resolve()
            full_local_file_path = (clone_root / file_path_in_repo).resolve()
            if clone_root not in full_local_file_path.parents:
                return f"Error: Invalid file path `{file_path_in_repo}`. Paths must stay inside the Space repository."

            full_local_file_path.parent.mkdir(parents=True, exist_ok=True)  # Create parent dirs if needed
            with open(full_local_file_path, "w", encoding="utf-8") as f:
                f.write(file_content)
            logger.info(f"Wrote updated content to {full_local_file_path} for commit.")

            cloned_repo.push_to_hub(commit_message=commit_message_ui)
            logger.info(f"Pushed update for {file_path_in_repo} to {repo_id}")
            return f"Successfully updated `{file_path_in_repo}` in Space [{repo_id}](https://huggingface.co/spaces/{repo_id})"
    except Exception as e:
        logger.exception(f"Error in update_space_file for {repo_id_for_error_logging}, file {file_path_in_repo}:")
        return f"Error updating file for `{repo_id_for_error_logging}`: {str(e)}"