Spaces:

Deadmon
/

veo3

Running

App Files Files Community

Deadmon committed 1 day ago

Commit

0fea6b2

verified ·

1 Parent(s): 6006b4e

Update app.py

Browse files

Files changed (1) hide show

app.py +93 -86

app.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# app.py
 import os
 import gradio as gr
@@ -10,13 +10,11 @@ import google.auth
 import google.auth.transport.requests
 from huggingface_hub import login
-# --- 1. Configuration and Authentication ---
 GCP_PROJECT_ID = os.environ.get("GCP_PROJECT_ID")
 GCP_LOCATION = os.environ.get("GCP_LOCATION")
-# --- Authentication and Sanity Checks Block ---
 hf_token = os.environ.get("HF_TOKEN")
 if hf_token:
     print("Hugging Face token found. Logging in.")
@@ -27,92 +25,101 @@ else:
 creds_json_str = os.environ.get("GOOGLE_APPLICATION_CREDENTIALS_JSON")
 if not all([GCP_PROJECT_ID, GCP_LOCATION, creds_json_str]):
-    missing_secrets = [s for s, v in {
-        "GCP_PROJECT_ID": GCP_PROJECT_ID,
-        "GCP_LOCATION": GCP_LOCATION,
-        "GOOGLE_APPLICATION_CREDENTIALS_JSON": creds_json_str
-    }.items() if not v]
     error_message = f"FATAL: Missing required secrets: {', '.join(missing_secrets)}."
     print(error_message)
-    def generate_video(prompt):
-        raise gr.Error(error_message)
-else:
-    print("All required secrets are loaded.")
-    MODEL_ID = "veo-3.0-generate-preview"
-    API_ENDPOINT = f"{GCP_LOCATION}-aiplatform.googleapis.com"
-    PREDICT_URL = f"https://{API_ENDPOINT}/v1/projects/{GCP_PROJECT_ID}/locations/{GCP_LOCATION}/publishers/google/models/{MODEL_ID}:predictLongRunning"
-    FETCH_URL = f"https://{API_ENDPOINT}/v1/projects/{GCP_PROJECT_ID}/locations/{GCP_LOCATION}/publishers/google/models/{MODEL_ID}:fetchPredictOperation"
-    with open("gcp_creds.json", "w") as f: f.write(creds_json_str)
-    SCOPES = ["https://www.googleapis.com/auth/cloud-platform"]
-    credentials, _ = google.auth.load_credentials_from_file("gcp_creds.json", scopes=SCOPES)
-    def get_access_token():
-        auth_req = google.auth.transport.requests.Request()
-        credentials.refresh(auth_req)
-        return credentials.token
-    # --- 2. Core Video Generation Logic ---
-    def generate_video(prompt: str):
-        if not prompt:
-            raise gr.Error("Prompt cannot be empty.")
-        yield "Status: Submitting job...", None
-        try:
-            headers = {"Authorization": f"Bearer {get_access_token()}", "Content-Type": "application/json"}
-            payload = {"instances": [{"prompt": prompt}], "parameters": {"aspectRatio": "16:9", "sampleCount": 1, "durationSeconds": 8, "personGeneration": "allow_all", "addWatermark": True, "includeRaiReason": True, "generateAudio": True}}
-            response = requests.post(PREDICT_URL, headers=headers, json=payload)
-            response.raise_for_status()
-            operation_name = response.json()["name"]
-            print(f"Successfully submitted job. Operation Name: {operation_name}")
-            MAX_POLL_ATTEMPTS = 60
-            for i in range(MAX_POLL_ATTEMPTS):
-                yield f"Status: Polling (Attempt {i+1}/{MAX_POLL_ATTEMPTS})...", None
-                headers["Authorization"] = f"Bearer {get_access_token()}"
-                fetch_payload = {"operationName": operation_name}
-                poll_response = requests.post(FETCH_URL, headers=headers, json=fetch_payload)
-                poll_response.raise_for_status()
-                poll_result = poll_response.json()
-                if poll_result.get("done"):
-                    print("Job finished.")
-                    # <<< CHANGE: The debugging line below is now commented out for cleaner logs. >>>
-                    # print(f"Full response payload: {json.dumps(poll_result, indent=2)}")
-                    response_data = poll_result.get("response", {})
-                    if "videos" in response_data and response_data["videos"]:
-                        video_base64 = response_data["videos"][0]["bytesBase64Encoded"]
-                        video_bytes = base64.b64decode(video_base64)
-                        with open("generated_video.mp4", "wb") as f: f.write(video_bytes)
-                        yield "Status: Done!", "generated_video.mp4"
-                        return
-                    else:
-                        error_message = "Video generation failed."
-                        if "error" in poll_result:
-                            error_details = poll_result["error"].get("message", "No details provided.")
-                            error_message += f"\nAPI Error: {error_details}"
-                        elif "raiResult" in response_data:
-                            rai_reason = response_data.get("raiMediaFilteredReason", "Unknown reason.")
-                            error_message += f"\nReason: Content was blocked by safety filters ({rai_reason})."
-                        else:
-                            error_message += "\nReason: The API did not return a video or a specific error."
-                        raise gr.Error(error_message)
-                time.sleep(10)
-            raise gr.Error("Operation timed out.")
-        except Exception as e:
-            print(f"An error occurred: {e}")
-            raise gr.Error(str(e))
-# --- 3. Gradio User Interface ---
-with gr.Blocks(theme=gr.themes.Soft()) as demo:
-    gr.Markdown("# 🎬 Vertex AI VEO Video Generator")
-    gr.Markdown("Generate short videos from a text prompt using Google's VEO model.")
-    with gr.Row():
-        with gr.Column(scale=1):
-            prompt_input = gr.Textbox(label="Prompt", placeholder="A majestic lion...", lines=3)
-            submit_button = gr.Button("Generate Video", variant="primary")
-        with gr.Column(scale=1):
-            status_output = gr.Markdown("Status: Ready")
-            video_output = gr.Video(label="Generated Video", interactive=False)
-    gr.Examples(["A high-speed drone shot flying through a futuristic city with flying vehicles."], inputs=prompt_input)
-    submit_button.click(fn=generate_video, inputs=prompt_input, outputs=[status_output, video_output])
 demo.launch()

+# app.py (API-Only Version)
 import os
 import gradio as gr
 import google.auth.transport.requests
 from huggingface_hub import login
+# --- 1. Configuration and Authentication (Unchanged) ---
 GCP_PROJECT_ID = os.environ.get("GCP_PROJECT_ID")
 GCP_LOCATION = os.environ.get("GCP_LOCATION")
+# --- Authentication and Sanity Checks Block (Unchanged) ---
 hf_token = os.environ.get("HF_TOKEN")
 if hf_token:
     print("Hugging Face token found. Logging in.")
 creds_json_str = os.environ.get("GOOGLE_APPLICATION_CREDENTIALS_JSON")
 if not all([GCP_PROJECT_ID, GCP_LOCATION, creds_json_str]):
+    missing_secrets = [s for s, v in {"GCP_PROJECT_ID": GCP_PROJECT_ID, "GCP_LOCATION": GCP_LOCATION, "GOOGLE_APPLICATION_CREDENTIALS_JSON": creds_json_str}.items() if not v]
     error_message = f"FATAL: Missing required secrets: {', '.join(missing_secrets)}."
     print(error_message)
+    # This initial error will still be raised if the app can't start
+    raise RuntimeError(error_message)
+print("All required secrets are loaded. Initializing API service.")
+# Vertex AI publisher-model URLs for the Veo model, built from the project and
+# location secrets: PREDICT_URL is POSTed to when submitting a job, FETCH_URL
+# is POSTed to when polling the resulting operation.
+MODEL_ID = "veo-3.0-generate-preview"
+API_ENDPOINT = f"{GCP_LOCATION}-aiplatform.googleapis.com"
+PREDICT_URL = f"https://{API_ENDPOINT}/v1/projects/{GCP_PROJECT_ID}/locations/{GCP_LOCATION}/publishers/google/models/{MODEL_ID}:predictLongRunning"
+FETCH_URL = f"https://{API_ENDPOINT}/v1/projects/{GCP_PROJECT_ID}/locations/{GCP_LOCATION}/publishers/google/models/{MODEL_ID}:fetchPredictOperation"
+# The service-account JSON from the environment is written to a file in the
+# current working directory so it can be loaded by path below.
+# NOTE(review): this leaves the key on disk next to the app; confirm the file
+# cannot be served by the web server or committed to the repo, or load the
+# credentials from the parsed JSON in memory instead.
+with open("gcp_creds.json", "w") as f: f.write(creds_json_str)
+SCOPES = ["https://www.googleapis.com/auth/cloud-platform"]
+credentials, _ = google.auth.load_credentials_from_file("gcp_creds.json", scopes=SCOPES)
+def get_access_token():
+    """Return a bearer token for the Vertex AI REST calls.
+
+    The module-level ``credentials`` object is refreshed only when it has no
+    token yet or its token has expired, so the repeated calls made while
+    polling do not each trigger a token request.
+    """
+    if not credentials.valid:
+        auth_req = google.auth.transport.requests.Request()
+        credentials.refresh(auth_req)
+    return credentials.token
+# --- 2. Core Video Generation Logic (Refactored for API) ---
+# The function now returns a final JSON object instead of yielding updates.
+def generate_video_api(prompt: str):
+    """Generate one video from a text prompt and return the outcome as a dict.
+
+    Submits a long-running prediction job to PREDICT_URL, then polls FETCH_URL
+    until the operation reports ``done`` or the attempt limit is reached.
+    Failures are reported in the returned dict rather than raised.
+
+    Args:
+        prompt: Text description of the video to generate.
+
+    Returns:
+        ``{"status": "success", "video_base64": ...}`` when the API returns a
+        video, otherwise ``{"status": "error", "message": ...}``.
+    """
+    # Treat whitespace-only input like an empty prompt instead of spending an API call on it.
+    if not prompt or not prompt.strip():
+        return {"status": "error", "message": "Prompt cannot be empty."}
+    # Bound every HTTP call so a stalled connection cannot block the request forever;
+    # a timeout is reported through the generic error handler below.
+    REQUEST_TIMEOUT_SECONDS = 60
+    MAX_POLL_ATTEMPTS = 60
+    POLL_INTERVAL_SECONDS = 10
+    try:
+        headers = {"Authorization": f"Bearer {get_access_token()}", "Content-Type": "application/json"}
+        payload = {
+            "instances": [{"prompt": prompt}],
+            "parameters": {
+                "aspectRatio": "16:9",
+                "sampleCount": 1,
+                "durationSeconds": 8,
+                "personGeneration": "allow_all",
+                "addWatermark": True,
+                "includeRaiReason": True,
+                "generateAudio": True,
+            },
+        }
+        # Submit job
+        response = requests.post(PREDICT_URL, headers=headers, json=payload, timeout=REQUEST_TIMEOUT_SECONDS)
+        response.raise_for_status()
+        operation_name = response.json()["name"]
+        print(f"Successfully submitted job. Operation Name: {operation_name}")
+        # Poll for result
+        for i in range(MAX_POLL_ATTEMPTS):
+            print(f"Polling (Attempt {i+1}/{MAX_POLL_ATTEMPTS})...")
+            time.sleep(POLL_INTERVAL_SECONDS) # Wait before polling
+            # Re-read the token on every attempt: the job can outlive the token used to submit it.
+            headers["Authorization"] = f"Bearer {get_access_token()}"
+            fetch_payload = {"operationName": operation_name}
+            poll_response = requests.post(FETCH_URL, headers=headers, json=fetch_payload, timeout=REQUEST_TIMEOUT_SECONDS)
+            poll_response.raise_for_status()
+            poll_result = poll_response.json()
+            if not poll_result.get("done"):
+                continue
+            print("Job finished.")
+            response_data = poll_result.get("response", {})
+            # Case 1: Success, video is present
+            if "videos" in response_data and response_data["videos"]:
+                video_base64 = response_data["videos"][0]["bytesBase64Encoded"]
+                return {"status": "success", "video_base64": video_base64}
+            # Case 2: Failure, build the most specific message the response allows
+            error_message = "Video generation failed."
+            if "error" in poll_result:
+                error_details = poll_result["error"].get("message", "No details provided.")
+                error_message += f" API Error: {error_details}"
+            elif "raiResult" in response_data:
+                rai_reason = response_data.get("raiMediaFilteredReason", "Unknown reason.")
+                error_message += f" Content was blocked by safety filters ({rai_reason})."
+            else:
+                error_message += " The API did not return a video or a specific error."
+            return {"status": "error", "message": error_message}
+        return {"status": "error", "message": "Operation timed out."}
+    except requests.exceptions.HTTPError as e:
+        print(f"HTTP Error: {e.response.text}")
+        return {"status": "error", "message": f"API Error: {e.response.status_code}. Details: {e.response.text}"}
+    except Exception as e:
+        print(f"An unexpected error occurred: {e}")
+        return {"status": "error", "message": f"An unexpected error occurred: {str(e)}"}
+# --- 3. Gradio API Definition (No UI) ---
+# We define the components that make up the API contract, but they are not made visible.
+with gr.Blocks() as demo:
+    # Define the inputs and outputs for the API
+    prompt_input = gr.Textbox(label="prompt", visible=False)
+    output_json = gr.JSON(label="result", visible=False)
+    # Create the API endpoint named "predict"
+    # This will be available at /run/predict
+    gr.Interface(
+        fn=generate_video_api,
+        inputs=prompt_input,
+        outputs=output_json,
+        api_name="predict"
+    )
+# The launch() call is still needed to start the web server that listens for API calls.
 demo.launch()