Zack3D committed
Commit 6e2642c · verified · 1 Parent(s): 5272a9c

Update app.py

Files changed (1)
  1. app.py +337 -288
app.py CHANGED
@@ -1,302 +1,351 @@
- import gradio as gr
- from anthropic import Anthropic
- from openai import OpenAI
- import openai
  import json
- import uuid
  import os
- import base64
  from PIL import Image
  from PIL.PngImagePlugin import PngInfo
- from io import BytesIO

- default_urls = ["https://api.anthropic.com", "https://api.openai.com/v1"]
-
- # List of available Claude models
- claude_models = ["claude-3-5-sonnet-20240620", "claude-3-opus-20240229", "claude-3-sonnet-20240229", "claude-3-haiku-20240307"]
-
- # List of available OpenAI models
- openai_models = ["gpt-4o", "gpt-4o-mini", "gpt-4", "gpt-4-32k", "gpt-3.5-turbo", "gpt-4-0125-preview", "gpt-4-turbo-preview", "gpt-4-1106-preview", "gpt-4-0613"]
-
- image_prompter = ["SDXL", "midjourney"]
-
- both_models = claude_models + openai_models
-
- def generate_response(endpoint, api_key, model, user_prompt):
-     print(endpoint)
-     if endpoint in default_urls:
-         #check api keys as normal
-         if api_key.startswith("sk-ant-"):
-             client = Anthropic(api_key=api_key, base_url=endpoint)
-             system_prompt_path = __file__.replace("app.py", "json.txt")
-         elif api_key.startswith("sk-"):
-             client = OpenAI(api_key=api_key, base_url=endpoint)
-             system_prompt_path = __file__.replace("app.py", "json.txt")
-         else:
-             print(f"Invalid API key: {api_key}")
-             return "Invalid API key", "Invalid API key", None
-     else:
-         if model in claude_models:
-             # Set the Anthropic API key
-             client = Anthropic(api_key=api_key, base_url=endpoint)
-             system_prompt_path = __file__.replace("app.py", "json.txt")
-         else:
-             # Set the OpenAI API key
-             client = OpenAI(api_key=api_key, base_url=endpoint)
-             system_prompt_path = __file__.replace("app.py", "json.txt")
-
-     # Read the system prompt from a text file
-     with open(system_prompt_path, "r") as file:
-         system_prompt = file.read()
-
-     if model in claude_models:
-         # Generate a response using the selected Anthropic model
-         try:
-             response = client.messages.create(
-                 system=system_prompt,
-                 messages=[{"role": "user", "content": user_prompt}],
-                 model=model,
-                 max_tokens=4096
-             )
-             response_text = response.content[0].text
-         except Exception as e:
-             print(e)
-             response_text = f"An error occurred while generating the response. Check that your API key is correct! More info: {e}"
-     else:
-         try:
-             # Generate a response using the selected OpenAI model
-             response = client.chat.completions.create(
-                 model=model,
-                 messages=[
-                     {"role": "system", "content": system_prompt},
-                     {"role": "user", "content": user_prompt}
-                 ],
-                 max_tokens=4096
-             )
-             response_text = response.choices[0].message.content
-         except Exception as e:
-             print(e)
-             response_text = f"An error occurred while generating the response. Check that your API key is correct! More info: {e}"
-
-     json_string, json_json = extract_json(response_text)
-     json_file = json_string if json_string else None
-     create_unique_id = str(uuid.uuid4())
-
-     json_folder = __file__.replace("app.py", f"outputs/")
-     if not os.path.exists(json_folder):
-         os.makedirs(json_folder)
-     path = None
-     if json_string:
-         with open(f"{json_folder}{json_json['name']}_{create_unique_id}.json", "w") as file:
-             file.write(json_file)
-         path = f"{json_folder}{json_json['name']}_{create_unique_id}.json"
-     else:
-         json_string = "No JSON data was found, or the JSON data was incomplete."
-     return response_text, json_string or "", path
-
- def extract_json(generated_output):
      try:
-         generated_output = generated_output.replace("```json", "").replace("```", "").strip()
-         # Find the JSON string in the generated output
-         json_start = generated_output.find("{")
-         json_end = generated_output.rfind("}") + 1
-         json_string = generated_output[json_start:json_end]
-         print(json_string)
-
-         # Parse the JSON string
-         json_data = json.loads(json_string)
-         json_data['name'] = json_data['char_name']
-         json_data['personality'] = json_data['char_persona']
-         json_data['scenario'] = json_data['world_scenario']
-         json_data['first_mes'] = json_data['char_greeting']
-         # Check if all the required keys are present
-         required_keys = ["char_name", "char_persona", "world_scenario", "char_greeting", "example_dialogue", "description"]
-         if all(key in json_data for key in required_keys):
-             return json.dumps(json_data), json_data
-         else:
-             return None, None
-     except Exception as e:
-         print(e)
          return None, None

- def generate_second_response(endpoint, api_key, model, generated_output, image_model):
-     if endpoint in default_urls:
-         #check api keys as normal
-         if api_key.startswith("sk-ant-"):
-             client = Anthropic(api_key=api_key, base_url=endpoint)
-             system_prompt_path = __file__.replace("app.py", f"{image_model}.txt")
-         elif api_key.startswith("sk-"):
-             client = OpenAI(api_key=api_key, base_url=endpoint)
-             system_prompt_path = __file__.replace("app.py", f"{image_model}.txt")
-         else:
-             print("Invalid API key")
-             return "Invalid API key", "Invalid API key", None
-     else:
-         if model in claude_models:
-             # Set the Anthropic API key
-             client = Anthropic(api_key=api_key, base_url=endpoint)
-             system_prompt_path = __file__.replace("app.py", f"{image_model}.txt")
-         else:
-             # Set the OpenAI API key
-             client = OpenAI(api_key=api_key, base_url=endpoint)
-             system_prompt_path = __file__.replace("app.py", f"{image_model}.txt")
-
-     # Read the system prompt from a text file
-     with open(system_prompt_path, "r") as file:
-         system_prompt = file.read()
-
-     if model in claude_models:
-         try:
-             # Generate a second response using the selected Anthropic model and the previously generated output
-             response = client.messages.create(
-                 system=system_prompt,
-                 messages=[{"role": "user", "content": generated_output}],
-                 model=model,
-                 max_tokens=4096
-             )
-             response_text = response.content[0].text
-         except Exception as e:
-             print(e)
-             response_text = f"An error occurred while generating the response. Check that your API key is correct! More info: {e}"
-     else:
-         try:
-             # Generate a response using the selected OpenAI model
-             response = client.chat.completions.create(
-                 model=model,
-                 messages=[
-                     {"role": "system", "content": system_prompt},
-                     {"role": "user", "content": generated_output}
-                 ],
-                 max_tokens=4096
-             )
-             response_text = response.choices[0].message.content
-         except Exception as e:
-             print(e)
-             response_text = f"An error occurred while generating the response. Check that your API key is correct! More info: {e}"
-
-     return response_text
-
- def inject_json_to_png(image, json_data):
-     if isinstance(json_data, str):
-         json_data = json.loads(json_data)
-
-     img = Image.open(image)
-
-     # Calculate the aspect ratio of the original image
-     width, height = img.size
-     aspect_ratio = width / height
-
-     # Calculate the cropping dimensions based on the aspect ratio
-     if aspect_ratio > 400 / 600:
-         # Image is wider than 400x600, crop the sides
-         new_width = int(height * 400 / 600)
-         left = (width - new_width) // 2
-         right = left + new_width
-         top = 0
-         bottom = height
-     else:
-         # Image is taller than 400x600, crop the top and bottom
-         new_height = int(width * 600 / 400)
-         left = 0
-         right = width
-         top = (height - new_height) // 2
-         bottom = top + new_height
-
-     # Perform cropping
-     img = img.crop((left, top, right, bottom))
-
-     # Resize the cropped image to 400x600 pixels
      img = img.resize((400, 600), Image.LANCZOS)
-
-     # Convert the JSON data to bytes
-     json_bytes = json.dumps(json_data).encode('utf-8')
-
-     # Create a new PNG image with the JSON data injected into the tEXT chunk
-     output = BytesIO()
-     img.save(output, format='PNG')
-     output.seek(0)
-
-     # Add the tEXT chunk with the tag 'chara'
-     metadata = PngInfo()
-     metadata.add_text("chara", base64.b64encode(json_bytes))
-
-     # Save the modified PNG image to a BytesIO object
-     output = BytesIO()
-     create_unique_id = str(uuid.uuid4())
-     if json_data['name']:
-         filename = f"{json_data['name']}_{create_unique_id}.png"
-         img_folder = __file__.replace("app.py", f"outputs/")
-         img.save(f"{img_folder}/{filename}", format='PNG', pnginfo=metadata)
-
-     return f"{img_folder}/{filename}"
-
- # Set up the Gradio interface
- with gr.Blocks() as demo:
-     gr.Markdown("# SillyTavern Character Generator")
-
-     #Text explaining that you can use the API key from the Anthropic API or the OpenAI API
-     gr.Markdown("You can use the API key from the Anthropic API or the OpenAI API. The API key should start with 'sk-ant-' for Anthropic or 'sk-' for OpenAI.")
-     gr.Markdown("Please Note: If you use a proxy it must support the OpenAI or Anthropic standard api calls! khanon does, Openrouter based ones usually do not.")
-     gr.Markdown("Generating images locally and want to use the prompts from here in your workflow? Well do that I guess... a link to the virus used to be here. Maybe check me out? https://goocat.gay")
-     with gr.Tab("JSON Generate"):
-         with gr.Row():
-             with gr.Column():
-                 endpoint = gr.Textbox(label="Endpoint", value="https://api.anthropic.com")
-                 api_key = gr.Textbox(label="API Key", type="password", placeholder="sk-ant-api03-... or sk-...")
-                 model_dropdown = gr.Dropdown(choices=[], label="Select a model")
-                 user_prompt = gr.Textbox(label="User Prompt", value="Make me a card for a panther made of translucent pastel colored goo. Its color never changes once it exists but each 'copy' has a different color. The creature comes out of a small jar, seemingly defying physics with its size. It is the size of a real panther, and as strong as one too. By default its female but is able to change gender. It can even split into multiple copies of itself if needed with no change in its own size or mass. Its outside is normally lightly squishy but solid, but on command it can become viscous like non-newtonian fluids. Be descriptive when describing this character, and make sure to describe all of its features in char_persona just like you do in description. Make sure to describe commonly used features in detail (visual, smell, taste, touch, etc).")
-                 generate_button = gr.Button("Generate JSON")
-
-             with gr.Column():
-                 generated_output = gr.Textbox(label="Generated Output")
-                 json_output = gr.Textbox(label="JSON Output")
-                 json_download = gr.File(label="Download JSON")
-
-         with gr.Row():
-             with gr.Column():
-                 image_model = gr.Dropdown(choices=image_prompter, label="Image Model to prompt for", value="SDXL")
-                 generate_button_2 = gr.Button("Generate SDXL Prompt")
-
-             with gr.Column():
-                 generated_output_2 = gr.Textbox(label="Generated SDXL Prompt")
-
-         def update_models(api_key):
              if api_key.startswith("sk-ant-"):
-                 return gr.Dropdown(choices=claude_models), gr.Textbox(label="Endpoint", value="https://api.anthropic.com")
-             elif api_key.startswith("sk-"):
-                 return gr.Dropdown(choices=openai_models), gr.Textbox(label="Endpoint", value="https://api.openai.com/v1")
-             else:
-                 return gr.Dropdown(choices=both_models), gr.Textbox(label="Endpoint", value="https://api.anthropic.com")
-
-         api_key.change(update_models, inputs=api_key, outputs=[model_dropdown, endpoint])
-
-         generate_button.click(generate_response, inputs=[endpoint, api_key, model_dropdown, user_prompt], outputs=[generated_output, json_output, json_download])
-         generate_button_2.click(generate_second_response, inputs=[endpoint, api_key, model_dropdown, generated_output, image_model], outputs=generated_output_2)
-     with gr.Tab("PNG Inject"):
-         gr.Markdown("# PNG Inject")
-         gr.Markdown("Upload a PNG image and inject JSON content into the PNG. PNG gets resized to 400x600 Center Crop.")
-
-         with gr.Row():
-             with gr.Column():
-                 image_input = gr.Image(type="filepath", label="Upload PNG Image")
-                 json_input = gr.Textbox(label="JSON Data")
-                 json_file_input = gr.File(label="Or Upload JSON File", file_types=[".json"])
-                 inject_button = gr.Button("Inject JSON and Download PNG")
-
-             with gr.Column():
-                 injected_image_output = gr.File(label="Download Injected PNG")
-
-         def inject_json(image, json_data, json_file):
-             if json_file:
-                 jsonc = open(json_file,)
-                 json_data = json.load(jsonc)
-             if image is None:
                  return None
-             if json_data is None:
                  return None
-             injected_image = inject_json_to_png(image, json_data)
-             return injected_image

-         inject_button.click(inject_json, inputs=[image_input, json_input, json_file_input], outputs=injected_image_output)

- demo.launch()
+ #!/usr/bin/env python3
+ """
+ SillyTavern Character-Card Generator — version 2.0 (April 2025)
+ ----------------------------------------------------------------
+ * Adds the newest "thinking / reasoning" model names (o-series, Claude 3.7, GPT-4.1, ...)
+ * Unifies Anthropic & OpenAI logic behind a tiny abstraction layer
+ * Adds an optional **Thinking mode** toggle (Gradio UI) — when enabled we
+   pass provider-specific knobs that push the model to reason more deeply
+   (Anthropic's extended `thinking` budget on Claude 3.7, `reasoning_effort`
+   on OpenAI's o-series; the knobs are only sent to models that support them)
+ * Factorises duplicated code, trims global namespace, and drops legacy bits
+   that are no longer needed.
+
+ The public interface of the script is still the same: run it, fill in your key,
+ choose a model, hit *Generate JSON*, then optionally *Generate SDXL Prompt* or
+ *Inject into PNG*.
+ """
+
+ from __future__ import annotations
+
+ import base64
  import json
  import os
+ import uuid
+ from dataclasses import dataclass
+ from functools import cached_property
+ from io import BytesIO
+ from pathlib import Path
+ from typing import Any, Dict, List, Tuple, Union
+
+ import gradio as gr
  from PIL import Image
  from PIL.PngImagePlugin import PngInfo

+ # Third-party SDKs — import lazily to avoid mandatory install when not used
+ try:
+     from anthropic import Anthropic, APITimeoutError as AnthropicTimeout
+ except ImportError:  # pragma: no cover
+     Anthropic = None  # type: ignore
+     AnthropicTimeout = TimeoutError  # type: ignore  # keeps the except clauses below valid
+
+ try:
+     from openai import OpenAI, APITimeoutError as OpenAITimeout
+ except ImportError:  # pragma: no cover
+     OpenAI = None  # type: ignore
+     OpenAITimeout = TimeoutError  # type: ignore  # keeps the except clauses below valid
+
+ ###############################################################################
+ # Model catalog
+ ###############################################################################
+
+ CLAUDE_MODELS: List[str] = [
+     # → classic 3-series
+     "claude-3-opus-20240229",
+     "claude-3-sonnet-20240229",
+     "claude-3-haiku-20240307",
+     # → 3.5 refreshes
+     "claude-3-5-sonnet-20240620",
+     "claude-3-5-sonnet-20241022",
+     "claude-3-5-haiku-20241022",
+     # → newest 3.7 extended-thinking (Feb 2025)
+     "claude-3-7-sonnet-20250219",
+ ]
+
+ OPENAI_MODELS: List[str] = [
+     # o-series — small/medium reasoning models (Apr 2025)
+     "o3", "o3-mini", "o4-mini",
+     # 4.1 family — 1M-token context (Apr 2025)
+     "gpt-4.1", "gpt-4.1-mini", "gpt-4.1-nano",
+     # 4-series mainline
+     "gpt-4o", "gpt-4o-mini", "gpt-4", "gpt-4-32k",
+     "gpt-4-0125-preview", "gpt-4-turbo-preview", "gpt-4-1106-preview",
+     # 3.5 for cheap/fast baseline
+     "gpt-3.5-turbo",
+ ]
+
+ ALL_MODELS = CLAUDE_MODELS + OPENAI_MODELS
+ DEFAULT_ANTHROPIC_ENDPOINT = "https://api.anthropic.com"
+ DEFAULT_OPENAI_ENDPOINT = "https://api.openai.com/v1"
+
+ ###############################################################################
+ # Helper classes
+ ###############################################################################
+
+ JsonDict = Dict[str, Any]
+
+
+ @dataclass
+ class APIConfig:
+     endpoint: str
+     api_key: str
+     model: str
+
+     # UI knobs — not required but exposed for flexibility
+     temperature: float = 0.7
+     top_p: float = 0.9
+     thinking: bool = False  # when True we request "enhanced reasoning"
+
+     # ---------------------------------------------------------------------
+     # Derived helpers
+     # ---------------------------------------------------------------------
+
+     @cached_property
+     def provider(self) -> str:
+         if self.model in CLAUDE_MODELS:
+             return "anthropic"
+         elif self.model in OPENAI_MODELS:
+             return "openai"
+         raise ValueError(f"Unknown model family for {self.model}")
+
+     @cached_property
+     def sdk(self):
+         if self.provider == "anthropic":
+             if Anthropic is None:
+                 raise RuntimeError("anthropic-python not installed — `pip install anthropic`")
+             return Anthropic(api_key=self.api_key, base_url=self.endpoint)
+         if self.provider == "openai":
+             if OpenAI is None:
+                 raise RuntimeError("openai-python not installed — `pip install openai`")
+             return OpenAI(api_key=self.api_key, base_url=self.endpoint)
+         raise AssertionError  # unreachable
+
+     # ------------------------------------------------------------------
+     # Public send convenience
+     # ------------------------------------------------------------------
+
+     def chat(self, user_prompt: str, system_prompt: str = "", max_tokens: int = 4096) -> str:
+         """Send the prompt; return *content* string."""
+         if self.provider == "anthropic":
+             opts = {
+                 "model": self.model,
+                 "system": system_prompt,
+                 "messages": [{"role": "user", "content": user_prompt}],
+                 "max_tokens": max_tokens,
+                 "temperature": self.temperature,
+                 "top_p": self.top_p,
+             }
+             if self.thinking and self.model.startswith("claude-3-7"):
+                 # Extended thinking is only accepted by Claude 3.7+; it requires
+                 # default sampling and a thinking budget below max_tokens.
+                 opts["thinking"] = {"type": "enabled", "budget_tokens": 2048}
+                 opts["temperature"] = 1
+                 opts.pop("top_p", None)
+             resp = self.sdk.messages.create(**opts)
+             # With thinking enabled the first block is a thinking block, so
+             # collect only the text blocks.
+             return "".join(block.text for block in resp.content if block.type == "text")
+
+         # OpenAI branch --------------------------------------------------
+         opts = {
+             "model": self.model,
+             "messages": [
+                 {"role": "system", "content": system_prompt},
+                 {"role": "user", "content": user_prompt},
+             ],
+             "max_tokens": max_tokens,
+             "temperature": self.temperature,
+             "top_p": self.top_p,
+         }
+         if self.model.startswith("o"):
+             # o-series reasoning models take max_completion_tokens and fixed
+             # sampling params; reasoning_effort is their "thinking" knob.
+             opts.pop("temperature", None)
+             opts.pop("top_p", None)
+             opts["max_completion_tokens"] = opts.pop("max_tokens")
+             if self.thinking:
+                 opts["reasoning_effort"] = "high"
+         resp = self.sdk.chat.completions.create(**opts)
+         return resp.choices[0].message.content
+
+ ###############################################################################
+ # Character-card helpers (unchanged logic, just cleaner)
+ ###############################################################################
+
+ CARD_REQUIRED_KEYS = {
+     "char_name",
+     "char_persona",
+     "world_scenario",
+     "char_greeting",
+     "example_dialogue",
+     "description",
+ }
+
+
+ def extract_card_json(generated_output: str) -> Tuple[str | None, JsonDict | None]:
+     """Return (raw_json_str_or_None, parsed_json_or_None)."""
      try:
+         snippet = generated_output.replace("```json", "").replace("```", "").strip()
+         raw = snippet[snippet.find("{") : snippet.rfind("}") + 1]
+         data: JsonDict = json.loads(raw)
+         # remap
+         data["name"] = data["char_name"]
+         data["personality"] = data["char_persona"]
+         data["scenario"] = data["world_scenario"]
+         data["first_mes"] = data["char_greeting"]
+         if CARD_REQUIRED_KEYS.issubset(data):
+             return json.dumps(data, ensure_ascii=False, indent=2), data
+         return None, None
+     except Exception:
          return None, None

+
+ ###############################################################################
+ # PNG utils
+ ###############################################################################
+
+ def inject_card_into_png(image_path: str | Path, card_json: Union[str, JsonDict]) -> Path:
+     card: JsonDict = json.loads(card_json) if isinstance(card_json, str) else card_json
+
+     img = Image.open(image_path)
+     # Centre-crop to 400×600 while preserving aspect ratio ----------------
+     w, h = img.size
+     target_ratio = 400 / 600
+     if w / h > target_ratio:  # wider → crop sides
+         new_w = int(h * target_ratio)
+         left = (w - new_w) // 2
+         img = img.crop((left, 0, left + new_w, h))
+     else:  # taller → crop top/bottom
+         new_h = int(w / target_ratio)
+         top = (h - new_h) // 2
+         img = img.crop((0, top, w, top + new_h))
      img = img.resize((400, 600), Image.LANCZOS)
+
+     # Embed the JSON as base64 inside a tEXt chunk ------------------------
+     meta = PngInfo()
+     meta.add_text("chara", base64.b64encode(json.dumps(card).encode("utf-8")).decode("ascii"))
+
+     out_dir = Path(__file__).with_name("outputs")
+     out_dir.mkdir(exist_ok=True)
+     filename = f"{card['name']}_{uuid.uuid4()}.png"
+     out_path = out_dir / filename
+     img.save(out_path, format="PNG", pnginfo=meta)
+     return out_path
+
+ ###############################################################################
+ # Gradio UI
+ ###############################################################################
+
+ def build_ui():
+     """Return a ready-to-launch Gradio Blocks app."""
+
+     with gr.Blocks(title="SillyTavern Character Generator 2.0") as demo:
+         gr.Markdown("# SillyTavern Character Generator 2.0")
+
+         # ----------------------------------------------------------------
+         # Tab: JSON generator
+         # ----------------------------------------------------------------
+         with gr.Tab("JSON Generate"):
+             with gr.Row():
+                 with gr.Column():
+                     endpoint_box = gr.Textbox(label="Endpoint", value=DEFAULT_ANTHROPIC_ENDPOINT)
+                     api_key_box = gr.Textbox(label="API Key", type="password", placeholder="sk-ant-... or sk-...")
+                     model_dropdown = gr.Dropdown(choices=ALL_MODELS, label="Model")
+                     thinking_toggle = gr.Checkbox(label="Thinking / deep-reasoning mode", value=False)
+                     temp_slider = gr.Slider(label="Temperature", minimum=0.0, maximum=1.0, value=0.7, step=0.05)
+                     topp_slider = gr.Slider(label="Top-P", minimum=0.0, maximum=1.0, value=0.9, step=0.05)
+
+                     user_prompt_box = gr.Textbox(
+                         label="Prompt",
+                         placeholder="Describe the character you want...",
+                         lines=6,
+                     )
+                     gen_btn = gr.Button("Generate JSON")
+
+                 with gr.Column():
+                     llm_raw_out = gr.Textbox(label="Model output (raw)")
+                     json_out = gr.Textbox(label="Extracted JSON (ready for PNG)")
+                     json_download = gr.File(label="Download .json")
+
+             # SDXL prompt row (unchanged logic) --------------------------
+             with gr.Row():
+                 image_model_dropdown = gr.Dropdown(["SDXL", "midjourney"], label="Image model", value="SDXL")
+                 gen_sdxl_btn = gr.Button("Generate image prompt")
+                 sdxl_out = gr.Textbox(label="Generated prompt")
+
+         # ----------------------------------------------------------------
+         # Tab: PNG injector
+         # ----------------------------------------------------------------
+         with gr.Tab("PNG Inject"):
+             gr.Markdown("Upload an image (any resolution) and embed the JSON card.")
+             with gr.Row():
+                 img_upload = gr.Image(type="filepath", label="PNG image")
+                 json_text = gr.Textbox(label="JSON")
+                 json_file = gr.File(label="...or choose a .json file", file_types=[".json"])
+                 inject_btn = gr.Button("Inject & download")
+                 injected_png = gr.File(label="Download new PNG")
+
+         # -- Callbacks ---------------------------------------------------
+
+         def _choose_default_endpoint(api_key: str):
              if api_key.startswith("sk-ant-"):
+                 return DEFAULT_ANTHROPIC_ENDPOINT
+             if api_key.startswith("sk-"):
+                 return DEFAULT_OPENAI_ENDPOINT
+             return DEFAULT_ANTHROPIC_ENDPOINT
+
+         api_key_box.change(_choose_default_endpoint, api_key_box, endpoint_box)
+
+         # Main JSON generation -------------------------------------------
+         def _generate_json(endpoint: str, api_key: str, model: str, thinking: bool,
+                            temp: float, top_p: float, prompt: str):
+             cfg = APIConfig(endpoint.strip(), api_key.strip(), model, temp, top_p, thinking)
+
+             # System prompt lives next to this script --------------------
+             sys_prompt_path = Path(__file__).with_name("json.txt")
+             system_prompt = sys_prompt_path.read_text(encoding="utf-8") if sys_prompt_path.exists() else ""
+
+             try:
+                 llm_output = cfg.chat(prompt, system_prompt)
+             except (AnthropicTimeout, OpenAITimeout) as exc:  # type: ignore
+                 return f"Request timed out: {exc}", "", None
+             except Exception as exc:
+                 return f"Error: {exc}", "", None
+
+             raw_json, parsed = extract_card_json(llm_output)
+             if raw_json and parsed:
+                 out_dir = Path(__file__).with_name("outputs")
+                 out_dir.mkdir(exist_ok=True)
+                 path = out_dir / f"{parsed['name']}_{uuid.uuid4()}.json"
+                 path.write_text(raw_json, encoding="utf-8")
+                 return llm_output, raw_json, str(path)
+             return llm_output, "(no valid JSON detected)", None
+
+         gen_btn.click(
+             _generate_json,
+             [endpoint_box, api_key_box, model_dropdown, thinking_toggle, temp_slider, topp_slider, user_prompt_box],
+             [llm_raw_out, json_out, json_download],
+         )
+
+         # SDXL prompt generation ------------------------------------------
+         def _generate_sdxl_prompt(endpoint: str, api_key: str, model: str, prompt: str, image_model: str):
+             cfg = APIConfig(endpoint.strip(), api_key.strip(), model)
+             system_path = Path(__file__).with_name(f"{image_model}.txt")
+             system_prompt = system_path.read_text(encoding="utf-8") if system_path.exists() else ""
+             try:
+                 return cfg.chat(prompt, system_prompt)
+             except Exception as exc:
+                 return f"Error: {exc}"
+
+         gen_sdxl_btn.click(
+             _generate_sdxl_prompt,
+             [endpoint_box, api_key_box, model_dropdown, llm_raw_out, image_model_dropdown],
+             sdxl_out,
+         )
+
+         # PNG injection ----------------------------------------------------
+         def _inject_png(img_path: str | None, json_str: str | None, json_file_path: str | None):
+             if not img_path:
                  return None
+             if json_file_path:
+                 json_str = Path(json_file_path).read_text(encoding="utf-8")
+             if not json_str:
                  return None
+             new_png = inject_card_into_png(img_path, json_str)
+             return str(new_png)
+
+         inject_btn.click(_inject_png, [img_upload, json_text, json_file], injected_png)
+
+     return demo

+ ###############################################################################
+ # Entrypoint
+ ###############################################################################

+ if __name__ == "__main__":
+     build_ui().launch()
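
A minimal usage sketch of the new helpers outside the Gradio UI (assuming app.py is importable, a json.txt system prompt sits next to it, and the key, prompt, and portrait.png values below are placeholders):

    from pathlib import Path
    from app import APIConfig, extract_card_json, inject_card_into_png

    cfg = APIConfig(
        endpoint="https://api.anthropic.com",
        api_key="sk-ant-...",                 # placeholder key
        model="claude-3-7-sonnet-20250219",
        thinking=True,                        # deep-reasoning knob, only sent where supported
    )
    system_prompt = Path("json.txt").read_text(encoding="utf-8")
    raw = cfg.chat("Make me a card for a clockwork owl librarian.", system_prompt)
    json_str, card = extract_card_json(raw)
    if card:
        png_path = inject_card_into_png("portrait.png", card)   # hypothetical input image
        print(card["name"], "->", png_path)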