AIMaster7 committed on

Commit 06dc2f1 · verified · 1 Parent(s): c18e9c8

Update main.py

Files changed (1)
main.py +284 -85
main.py CHANGED
@@ -5,7 +5,7 @@ import secrets
  import string
  import time
  import tempfile
- import ast # <-- NEW IMPORT for safe literal evaluation
  from typing import List, Optional, Union, Any

  import httpx
@@ -14,11 +14,13 @@ from fastapi import FastAPI, HTTPException
  from fastapi.responses import JSONResponse, StreamingResponse
  from pydantic import BaseModel, Field, model_validator

- # New import for OCR
  from gradio_client import Client, handle_file

  # --- Configuration ---
  load_dotenv()
  IMAGE_API_URL = os.environ.get("IMAGE_API_URL", "https://image.api.example.com")
  SNAPZION_UPLOAD_URL = "https://upload.snapzion.com/api/public-upload"
  SNAPZION_API_KEY = os.environ.get("SNAP", "")
@@ -41,36 +43,43 @@ MODEL_ALIASES = {}
  app = FastAPI(
      title="OpenAI Compatible API",
      description="An adapter for various services to be compatible with the OpenAI API specification.",
-     version="1.1.2" # Incremented version for the new fix
  )
  try:
      ocr_client = Client("multimodalart/Florence-2-l4")
  except Exception as e:
      print(f"Warning: Could not initialize Gradio client for OCR: {e}")
      ocr_client = None

  # --- Pydantic Models ---
- # (Pydantic models are unchanged and remain the same as before)
  class Message(BaseModel):
      role: str
      content: str
  class ChatRequest(BaseModel):
      messages: List[Message]
      model: str
      stream: Optional[bool] = False
      tools: Optional[Any] = None
  class ImageGenerationRequest(BaseModel):
      prompt: str
      aspect_ratio: Optional[str] = "1:1"
      n: Optional[int] = 1
      user: Optional[str] = None
      model: Optional[str] = "default"
  class ModerationRequest(BaseModel):
      input: Union[str, List[str]]
      model: Optional[str] = "text-moderation-stable"
  class OcrRequest(BaseModel):
      image_url: Optional[str] = Field(None, description="URL of the image to process.")
      image_b64: Optional[str] = Field(None, description="Base64 encoded string of the image to process.")
      @model_validator(mode='before')
      @classmethod
      def check_sources(cls, data: Any) -> Any:
@@ -80,116 +89,258 @@ class OcrRequest(BaseModel):
          if data.get('image_url') and data.get('image_b64'):
              raise ValueError('Provide either image_url or image_b64, not both.')
          return data
  class OcrResponse(BaseModel):
      ocr_text: str
      raw_response: dict

  # --- Helper Function ---
  def generate_random_id(prefix: str, length: int = 29) -> str:
      population = string.ascii_letters + string.digits
      random_part = "".join(secrets.choice(population) for _ in range(length))
      return f"{prefix}{random_part}"

  # === API Endpoints ===

  @app.get("/v1/models", tags=["Models"])
  async def list_models():
      return {"object": "list", "data": AVAILABLE_MODELS}

- # (Chat, Image Generation, and Moderation endpoints are unchanged and remain correct)
  @app.post("/v1/chat/completions", tags=["Chat"])
  async def chat_completion(request: ChatRequest):
-     model_id=MODEL_ALIASES.get(request.model,request.model);chat_id=generate_random_id("chatcmpl-");headers={'accept':'text/event-stream','content-type':'application/json','origin':'https://www.chatwithmono.xyz','referer':'https://www.chatwithmono.xyz/','user-agent':'Mozilla/5.0'}
      if request.tools:
-         tool_prompt=f"""You have access to the following tools. To call a tool, please respond with JSON for a tool call within <tool_call></tool_call> XML tags. Respond in the format {{"name": tool name, "parameters": dictionary of argument name and its value}}. Do not use variables.
  Tools: {";".join(f"<tool>{tool}</tool>" for tool in request.tools)}
  Response Format for tool call:
  <tool_call>
  {{"name": <function-name>, "arguments": <args-json-object>}}
  </tool_call>"""
-         if request.messages[0].role=="system":request.messages[0].content+="\n\n"+tool_prompt
-         else:request.messages.insert(0,Message(role="system",content=tool_prompt))
-     payload={"messages":[msg.model_dump()for msg in request.messages],"model":model_id}
      if request.stream:
          async def event_stream():
-             created=int(time.time());usage_info=None;is_first_chunk=True;tool_call_buffer="";in_tool_call=False
              try:
-                 async with httpx.AsyncClient(timeout=120)as client:
-                     async with client.stream("POST",CHAT_API_URL,headers=headers,json=payload)as response:
                          response.raise_for_status()
                          async for line in response.aiter_lines():
-                             if not line:continue
                              if line.startswith("0:"):
-                                 try:content_piece=json.loads(line[2:])
-                                 except json.JSONDecodeError:continue
-                                 current_buffer=content_piece
-                                 if in_tool_call:current_buffer=tool_call_buffer+content_piece
-                                 if"</tool_call>"in current_buffer:
-                                     tool_str=current_buffer.split("<tool_call>")[1].split("</tool_call>")[0];tool_json=json.loads(tool_str.strip());delta={"content":None,"tool_calls":[{"index":0,"id":generate_random_id("call_"),"type":"function","function":{"name":tool_json["name"],"arguments":json.dumps(tool_json["parameters"])}}]}
-                                     chunk={"id":chat_id,"object":"chat.completion.chunk","created":created,"model":model_id,"choices":[{"index":0,"delta":delta,"finish_reason":None}],"usage":None};yield f"data: {json.dumps(chunk)}\n\n"
-                                     in_tool_call=False;tool_call_buffer="";remaining_text=current_buffer.split("</tool_call>",1)[1]
-                                     if remaining_text:content_piece=remaining_text
-                                     else:continue
-                                 if"<tool_call>"in content_piece:
-                                     in_tool_call=True;tool_call_buffer+=content_piece.split("<tool_call>",1)[1];text_before=content_piece.split("<tool_call>",1)[0]
                                      if text_before:
-                                         delta={"content":text_before,"tool_calls":None};chunk={"id":chat_id,"object":"chat.completion.chunk","created":created,"model":model_id,"choices":[{"index":0,"delta":delta,"finish_reason":None}],"usage":None};yield f"data: {json.dumps(chunk)}\n\n"
-                                     if"</tool_call>"not in tool_call_buffer:continue
                                  if not in_tool_call:
-                                     delta={"content":content_piece}
-                                     if is_first_chunk:delta["role"]="assistant";is_first_chunk=False
-                                     chunk={"id":chat_id,"object":"chat.completion.chunk","created":created,"model":model_id,"choices":[{"index":0,"delta":delta,"finish_reason":None}],"usage":None};yield f"data: {json.dumps(chunk)}\n\n"
-                             elif line.startswith(("e:","d:")):
-                                 try:usage_info=json.loads(line[2:]).get("usage")
-                                 except(json.JSONDecodeError,AttributeError):pass
                                  break
-                 final_usage=None
-                 if usage_info:final_usage={"prompt_tokens":usage_info.get("promptTokens",0),"completion_tokens":usage_info.get("completionTokens",0),"total_tokens":usage_info.get("promptTokens",0)+usage_info.get("completionTokens",0)}
-                 done_chunk={"id":chat_id,"object":"chat.completion.chunk","created":created,"model":model_id,"choices":[{"index":0,"delta":{},"finish_reason":"stop"if not in_tool_call else"tool_calls"}],"usage":final_usage};yield f"data: {json.dumps(done_chunk)}\n\n"
-             except httpx.HTTPStatusError as e:error_content={"error":{"message":f"Upstream API error: {e.response.status_code}. Details: {e.response.text}","type":"upstream_error","code":str(e.response.status_code)}};yield f"data: {json.dumps(error_content)}\n\n"
-             finally:yield"data: [DONE]\n\n"
-         return StreamingResponse(event_stream(),media_type="text/event-stream")
-     else:
-         full_response,usage_info="",{}
          try:
-             async with httpx.AsyncClient(timeout=120)as client:
-                 async with client.stream("POST",CHAT_API_URL,headers=headers,json=payload)as response:
                      response.raise_for_status()
                      async for chunk in response.aiter_lines():
                          if chunk.startswith("0:"):
-                             try:full_response+=json.loads(chunk[2:])
-                             except:continue
-                         elif chunk.startswith(("e:","d:")):
-                             try:usage_info=json.loads(chunk[2:]).get("usage",{})
-                             except:continue
-             tool_calls=None;content_response=full_response
-             if"<tool_call>"in full_response and"</tool_call>"in full_response:
-                 tool_call_str=full_response.split("<tool_call>")[1].split("</tool_call>")[0];tool_call=json.loads(tool_call_str.strip());tool_calls=[{"id":generate_random_id("call_"),"type":"function","function":{"name":tool_call["name"],"arguments":json.dumps(tool_call["parameters"])}}];content_response=None
-             return JSONResponse(content={"id":chat_id,"object":"chat.completion","created":int(time.time()),"model":model_id,"choices":[{"index":0,"message":{"role":"assistant","content":content_response,"tool_calls":tool_calls},"finish_reason":"stop"if not tool_calls else"tool_calls"}],"usage":{"prompt_tokens":usage_info.get("promptTokens",0),"completion_tokens":usage_info.get("completionTokens",0),"total_tokens":usage_info.get("promptTokens",0)+usage_info.get("completionTokens",0)}})
-         except httpx.HTTPStatusError as e:return JSONResponse(status_code=e.response.status_code,content={"error":{"message":f"Upstream API error. Details: {e.response.text}","type":"upstream_error"}})

  @app.post("/v1/images/generations", tags=["Images"])
  async def generate_images(request: ImageGenerationRequest):
-     results=[]
      try:
-         async with httpx.AsyncClient(timeout=120)as client:
              for _ in range(request.n):
-                 model=request.model or"default"
-                 if model in["gpt-image-1","dall-e-3","dall-e-2","nextlm-image-1"]:
-                     headers={'Content-Type':'application/json','User-Agent':'Mozilla/5.0','Referer':'https://www.chatwithmono.xyz/'};payload={"prompt":request.prompt,"model":model};resp=await client.post(IMAGE_GEN_API_URL,headers=headers,json=payload);resp.raise_for_status();data=resp.json();b64_image=data.get("image")
-                     if not b64_image:return JSONResponse(status_code=502,content={"error":"Missing base64 image in response"})
-                     image_url=f"data:image/png;base64,{b64_image}"
                      if SNAPZION_API_KEY:
-                         upload_headers={"Authorization":SNAPZION_API_KEY};upload_files={'file':('image.png',base64.b64decode(b64_image),'image/png')};upload_resp=await client.post(SNAPZION_UPLOAD_URL,headers=upload_headers,files=upload_files)
-                         if upload_resp.status_code==200:image_url=upload_resp.json().get("url",image_url)
-                     results.append({"url":image_url,"b64_json":b64_image,"revised_prompt":data.get("revised_prompt")})
-                 else:params={"prompt":request.prompt,"aspect_ratio":request.aspect_ratio,"link":"typegpt.net"};resp=await client.get(IMAGE_API_URL,params=params);resp.raise_for_status();data=resp.json();results.append({"url":data.get("image_link"),"b64_json":data.get("base64_output")})
-     except httpx.HTTPStatusError as e:return JSONResponse(status_code=502,content={"error":f"Image generation failed. Upstream error: {e.response.status_code}","details":e.response.text})
-     except Exception as e:return JSONResponse(status_code=500,content={"error":"An internal error occurred.","details":str(e)})
-     return{"created":int(time.time()),"data":results}


- # === REVISED AND FIXED OCR Endpoint ===
  @app.post("/v1/ocr", response_model=OcrResponse, tags=["OCR"])
  async def perform_ocr(request: OcrRequest):
      """
@@ -218,7 +369,7 @@ async def perform_ocr(request: OcrRequest):
          raw_output = prediction[0]
          raw_result_dict = {}

-         # --- START: ROBUST PARSING LOGIC ---
          if isinstance(raw_output, str):
              try:
                  # First, try to parse as standard JSON
@@ -234,17 +385,18 @@ async def perform_ocr(request: OcrRequest):
                      raw_result_dict = {"result": str(parsed_output)}
              except (ValueError, SyntaxError):
                  # If all parsing fails, assume the string is the direct OCR text.
-                 raw_result_dict = {"ocr_text": raw_output}
          elif isinstance(raw_output, dict):
              # It's already a dictionary, use it directly
              raw_result_dict = raw_output
          else:
              # Handle other unexpected data types
              raise HTTPException(status_code=502, detail=f"Unexpected data type from OCR service: {type(raw_output)}")
-         # --- END: ROBUST PARSING LOGIC ---

-         # Extract text from the dictionary, with fallbacks
-         ocr_text = raw_result_dict.get("OCR", raw_result_dict.get("ocr_text", str(raw_result_dict)))

          return OcrResponse(ocr_text=ocr_text, raw_response=raw_result_dict)
@@ -256,22 +408,69 @@ async def perform_ocr(request: OcrRequest):
          if temp_file_path and os.path.exists(temp_file_path):
              os.unlink(temp_file_path)

  @app.post("/v1/moderations", tags=["Moderation"])
  async def create_moderation(request: ModerationRequest):
-     input_texts=[request.input]if isinstance(request.input,str)else request.input
-     if not input_texts:return JSONResponse(status_code=400,content={"error":{"message":"Request must have at least one input string."}})
-     headers={'Content-Type':'application/json','User-Agent':'Mozilla/5.0','Referer':'https://www.chatwithmono.xyz/'};results=[]
      try:
-         async with httpx.AsyncClient(timeout=30)as client:
              for text_input in input_texts:
-                 resp=await client.post(MODERATION_API_URL,headers=headers,json={"text":text_input});resp.raise_for_status();upstream_data=resp.json();upstream_categories=upstream_data.get("categories",{})
-                 openai_categories={"hate":upstream_categories.get("hate",False),"hate/threatening":False,"harassment":False,"harassment/threatening":False,"self-harm":upstream_categories.get("self-harm",False),"self-harm/intent":False,"self-harm/instructions":False,"sexual":upstream_categories.get("sexual",False),"sexual/minors":False,"violence":upstream_categories.get("violence",False),"violence/graphic":False}
-                 result_item={"flagged":upstream_data.get("overall_sentiment")=="flagged","categories":openai_categories,"category_scores":{k:1.0 if v else 0.0 for k,v in openai_categories.items()}}
-                 if reason:=upstream_data.get("reason"):result_item["reason"]=reason
                  results.append(result_item)
-     except httpx.HTTPStatusError as e:return JSONResponse(status_code=502,content={"error":{"message":f"Moderation failed. Upstream error: {e.response.status_code}","details":e.response.text}})
-     except Exception as e:return JSONResponse(status_code=500,content={"error":{"message":"An internal error occurred during moderation.","details":str(e)}})
-     return JSONResponse(content={"id":generate_random_id("modr-"),"model":request.model,"results":results})


  # --- Main Execution ---
 
@@ -5,7 +5,7 @@ import secrets
  import string
  import time
  import tempfile
+ import ast
  from typing import List, Optional, Union, Any

  import httpx

@@ -14,11 +14,13 @@ from fastapi import FastAPI, HTTPException
  from fastapi.responses import JSONResponse, StreamingResponse
  from pydantic import BaseModel, Field, model_validator

+ # Import for OCR functionality
  from gradio_client import Client, handle_file

  # --- Configuration ---
  load_dotenv()
+
+ # Environment variables for external services
  IMAGE_API_URL = os.environ.get("IMAGE_API_URL", "https://image.api.example.com")
  SNAPZION_UPLOAD_URL = "https://upload.snapzion.com/api/public-upload"
  SNAPZION_API_KEY = os.environ.get("SNAP", "")
 
@@ -41,36 +43,43 @@ MODEL_ALIASES = {}
  app = FastAPI(
      title="OpenAI Compatible API",
      description="An adapter for various services to be compatible with the OpenAI API specification.",
+     version="1.1.3" # Version reflects final formatting and fixes
  )
+
+ # Initialize Gradio client globally to avoid re-initialization on each request
  try:
      ocr_client = Client("multimodalart/Florence-2-l4")
  except Exception as e:
      print(f"Warning: Could not initialize Gradio client for OCR: {e}")
      ocr_client = None

+
  # --- Pydantic Models ---
  class Message(BaseModel):
      role: str
      content: str
+
  class ChatRequest(BaseModel):
      messages: List[Message]
      model: str
      stream: Optional[bool] = False
      tools: Optional[Any] = None
+
  class ImageGenerationRequest(BaseModel):
      prompt: str
      aspect_ratio: Optional[str] = "1:1"
      n: Optional[int] = 1
      user: Optional[str] = None
      model: Optional[str] = "default"
+
  class ModerationRequest(BaseModel):
      input: Union[str, List[str]]
      model: Optional[str] = "text-moderation-stable"
+
  class OcrRequest(BaseModel):
      image_url: Optional[str] = Field(None, description="URL of the image to process.")
      image_b64: Optional[str] = Field(None, description="Base64 encoded string of the image to process.")
+
      @model_validator(mode='before')
      @classmethod
      def check_sources(cls, data: Any) -> Any:

@@ -80,116 +89,258 @@ class OcrRequest(BaseModel):
          if data.get('image_url') and data.get('image_b64'):
              raise ValueError('Provide either image_url or image_b64, not both.')
          return data
+
  class OcrResponse(BaseModel):
      ocr_text: str
      raw_response: dict
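For reference, the check_sources validator above rejects ambiguous input at request-parsing time; pydantic surfaces the raised ValueError as a ValidationError. A minimal sketch with hypothetical values:

    from pydantic import ValidationError

    OcrRequest(image_url="https://example.com/receipt.png")  # OK: exactly one source
    try:
        OcrRequest(image_url="https://example.com/receipt.png", image_b64="iVBORw0KGgo...")
    except ValidationError as e:
        print(e)  # "Provide either image_url or image_b64, not both."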

+
  # --- Helper Function ---
  def generate_random_id(prefix: str, length: int = 29) -> str:
+     """Generates a cryptographically secure, random alphanumeric ID."""
      population = string.ascii_letters + string.digits
      random_part = "".join(secrets.choice(population) for _ in range(length))
      return f"{prefix}{random_part}"

+
  # === API Endpoints ===

  @app.get("/v1/models", tags=["Models"])
  async def list_models():
+     """Lists the available models."""
      return {"object": "list", "data": AVAILABLE_MODELS}

+
  @app.post("/v1/chat/completions", tags=["Chat"])
  async def chat_completion(request: ChatRequest):
+     """Handles chat completion requests, supporting streaming and non-streaming."""
+     model_id = MODEL_ALIASES.get(request.model, request.model)
+     chat_id = generate_random_id("chatcmpl-")
+     headers = {
+         'accept': 'text/event-stream',
+         'content-type': 'application/json',
+         'origin': 'https://www.chatwithmono.xyz',
+         'referer': 'https://www.chatwithmono.xyz/',
+         'user-agent': 'Mozilla/5.0',
+     }
+
      if request.tools:
+         tool_prompt = f"""You have access to the following tools. To call a tool, please respond with JSON for a tool call within <tool_call></tool_call> XML tags. Respond in the format {{"name": tool name, "parameters": dictionary of argument name and its value}}. Do not use variables.
  Tools: {";".join(f"<tool>{tool}</tool>" for tool in request.tools)}
  Response Format for tool call:
  <tool_call>
  {{"name": <function-name>, "arguments": <args-json-object>}}
  </tool_call>"""
+         if request.messages[0].role == "system":
+             request.messages[0].content += "\n\n" + tool_prompt
+         else:
+             request.messages.insert(0, Message(role="system", content=tool_prompt))
+
+     payload = {"messages": [msg.model_dump() for msg in request.messages], "model": model_id}
+
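The injected system prompt asks the model to wrap tool calls in <tool_call> tags, and both branches below recover them with plain string splits. A hypothetical model reply and the same extraction in isolation:

    import json

    # Hypothetical assistant output containing a tool call:
    reply = 'Let me check.<tool_call>{"name": "get_weather", "parameters": {"city": "Paris"}}</tool_call>'

    tool_str = reply.split("<tool_call>")[1].split("</tool_call>")[0]
    tool_json = json.loads(tool_str.strip())
    print(tool_json["name"], tool_json["parameters"])  # get_weather {'city': 'Paris'}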
      if request.stream:
          async def event_stream():
+             created = int(time.time())
+             usage_info = None
+             is_first_chunk = True
+             tool_call_buffer = ""
+             in_tool_call = False
+
              try:
+                 async with httpx.AsyncClient(timeout=120) as client:
+                     async with client.stream("POST", CHAT_API_URL, headers=headers, json=payload) as response:
                          response.raise_for_status()
                          async for line in response.aiter_lines():
+                             if not line:
+                                 continue
+
                              if line.startswith("0:"):
+                                 try:
+                                     content_piece = json.loads(line[2:])
+                                 except json.JSONDecodeError:
+                                     continue
+
+                                 current_buffer = content_piece
+                                 if in_tool_call:
+                                     current_buffer = tool_call_buffer + content_piece
+
+                                 if "</tool_call>" in current_buffer:
+                                     tool_str = current_buffer.split("<tool_call>")[1].split("</tool_call>")[0]
+                                     tool_json = json.loads(tool_str.strip())
+                                     delta = {
+                                         "content": None,
+                                         "tool_calls": [{"index": 0, "id": generate_random_id("call_"), "type": "function",
+                                                         "function": {"name": tool_json["name"], "arguments": json.dumps(tool_json["parameters"])}}]
+                                     }
+                                     chunk = {"id": chat_id, "object": "chat.completion.chunk", "created": created, "model": model_id,
+                                              "choices": [{"index": 0, "delta": delta, "finish_reason": None}], "usage": None}
+                                     yield f"data: {json.dumps(chunk)}\n\n"
+
+                                     in_tool_call = False
+                                     tool_call_buffer = ""
+                                     remaining_text = current_buffer.split("</tool_call>", 1)[1]
+                                     if remaining_text:
+                                         content_piece = remaining_text
+                                     else:
+                                         continue
+
+                                 if "<tool_call>" in content_piece:
+                                     in_tool_call = True
+                                     tool_call_buffer += content_piece.split("<tool_call>", 1)[1]
+                                     text_before = content_piece.split("<tool_call>", 1)[0]
                                      if text_before:
+                                         delta = {"content": text_before, "tool_calls": None}
+                                         chunk = {"id": chat_id, "object": "chat.completion.chunk", "created": created, "model": model_id,
+                                                  "choices": [{"index": 0, "delta": delta, "finish_reason": None}], "usage": None}
+                                         yield f"data: {json.dumps(chunk)}\n\n"
+                                     if "</tool_call>" not in tool_call_buffer:
+                                         continue
+
                                  if not in_tool_call:
+                                     delta = {"content": content_piece}
+                                     if is_first_chunk:
+                                         delta["role"] = "assistant"
+                                         is_first_chunk = False
+                                     chunk = {"id": chat_id, "object": "chat.completion.chunk", "created": created, "model": model_id,
+                                              "choices": [{"index": 0, "delta": delta, "finish_reason": None}], "usage": None}
+                                     yield f"data: {json.dumps(chunk)}\n\n"
+
+                             elif line.startswith(("e:", "d:")):
+                                 try:
+                                     usage_info = json.loads(line[2:]).get("usage")
+                                 except (json.JSONDecodeError, AttributeError):
+                                     pass
                                  break
+
+                 final_usage = None
+                 if usage_info:
+                     prompt_tokens = usage_info.get("promptTokens", 0)
+                     completion_tokens = usage_info.get("completionTokens", 0)
+                     final_usage = {
+                         "prompt_tokens": prompt_tokens,
+                         "completion_tokens": completion_tokens,
+                         "total_tokens": prompt_tokens + completion_tokens
+                     }
+
+                 finish_reason = "tool_calls" if in_tool_call else "stop"
+                 done_chunk = {"id": chat_id, "object": "chat.completion.chunk", "created": created, "model": model_id,
+                               "choices": [{"index": 0, "delta": {}, "finish_reason": finish_reason}], "usage": final_usage}
+                 yield f"data: {json.dumps(done_chunk)}\n\n"
+
+             except httpx.HTTPStatusError as e:
+                 error_content = {"error": {"message": f"Upstream API error: {e.response.status_code}. Details: {e.response.text}", "type": "upstream_error", "code": str(e.response.status_code)}}
+                 yield f"data: {json.dumps(error_content)}\n\n"
+             finally:
+                 yield "data: [DONE]\n\n"
+
+         return StreamingResponse(event_stream(), media_type="text/event-stream")
+
+     else:  # Non-streaming response
+         full_response, usage_info = "", {}
          try:
+             async with httpx.AsyncClient(timeout=120) as client:
+                 async with client.stream("POST", CHAT_API_URL, headers=headers, json=payload) as response:
                      response.raise_for_status()
                      async for chunk in response.aiter_lines():
                          if chunk.startswith("0:"):
+                             try:
+                                 full_response += json.loads(chunk[2:])
+                             except:
+                                 continue
+                         elif chunk.startswith(("e:", "d:")):
+                             try:
+                                 usage_info = json.loads(chunk[2:]).get("usage", {})
+                             except:
+                                 continue
+
+             tool_calls = None
+             content_response = full_response
+             finish_reason = "stop"
+             if "<tool_call>" in full_response and "</tool_call>" in full_response:
+                 tool_call_str = full_response.split("<tool_call>")[1].split("</tool_call>")[0]
+                 tool_call = json.loads(tool_call_str.strip())
+                 tool_calls = [{
+                     "id": generate_random_id("call_"),
+                     "type": "function",
+                     "function": {
+                         "name": tool_call["name"],
+                         "arguments": json.dumps(tool_call["parameters"])
+                     }
+                 }]
+                 content_response = None
+                 finish_reason = "tool_calls"
+
+             prompt_tokens = usage_info.get("promptTokens", 0)
+             completion_tokens = usage_info.get("completionTokens", 0)
+
+             return JSONResponse(content={
+                 "id": chat_id,
+                 "object": "chat.completion",
+                 "created": int(time.time()),
+                 "model": model_id,
+                 "choices": [{
+                     "index": 0,
+                     "message": {
+                         "role": "assistant",
+                         "content": content_response,
+                         "tool_calls": tool_calls
+                     },
+                     "finish_reason": finish_reason
+                 }],
+                 "usage": {
+                     "prompt_tokens": prompt_tokens,
+                     "completion_tokens": completion_tokens,
+                     "total_tokens": prompt_tokens + completion_tokens
+                 }
+             })
+         except httpx.HTTPStatusError as e:
+             return JSONResponse(
+                 status_code=e.response.status_code,
+                 content={"error": {"message": f"Upstream API error. Details: {e.response.text}", "type": "upstream_error"}}
+             )
+

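The streaming branch re-emits the upstream "0:"/"e:" line protocol as OpenAI-style SSE: "data: {chunk-JSON}" lines terminated by "data: [DONE]". A minimal consumer sketch (the localhost URL and model name are assumptions for illustration):

    import json
    import httpx

    body = {"model": "gpt-4", "stream": True,
            "messages": [{"role": "user", "content": "Hello"}]}
    with httpx.stream("POST", "http://localhost:8000/v1/chat/completions", json=body, timeout=120) as response:
        for line in response.iter_lines():
            if not line.startswith("data: "):
                continue
            data = line[len("data: "):]
            if data == "[DONE]":
                break
            delta = json.loads(data)["choices"][0]["delta"]
            print(delta.get("content") or "", end="")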
  @app.post("/v1/images/generations", tags=["Images"])
304
  async def generate_images(request: ImageGenerationRequest):
305
+ """Handles image generation requests."""
306
+ results = []
307
  try:
308
+ async with httpx.AsyncClient(timeout=120) as client:
309
  for _ in range(request.n):
310
+ model = request.model or "default"
311
+ if model in ["gpt-image-1", "dall-e-3", "dall-e-2", "nextlm-image-1"]:
312
+ headers = {'Content-Type': 'application/json', 'User-Agent': 'Mozilla/5.0', 'Referer': 'https://www.chatwithmono.xyz/'}
313
+ payload = {"prompt": request.prompt, "model": model}
314
+ resp = await client.post(IMAGE_GEN_API_URL, headers=headers, json=payload)
315
+ resp.raise_for_status()
316
+ data = resp.json()
317
+ b64_image = data.get("image")
318
+ if not b64_image:
319
+ return JSONResponse(status_code=502, content={"error": "Missing base64 image in response"})
320
+
321
+ image_url = f"data:image/png;base64,{b64_image}"
322
  if SNAPZION_API_KEY:
323
+ upload_headers = {"Authorization": SNAPZION_API_KEY}
324
+ upload_files = {'file': ('image.png', base64.b64decode(b64_image), 'image/png')}
325
+ upload_resp = await client.post(SNAPZION_UPLOAD_URL, headers=upload_headers, files=upload_files)
326
+ if upload_resp.status_code == 200:
327
+ image_url = upload_resp.json().get("url", image_url)
328
+
329
+ results.append({"url": image_url, "b64_json": b64_image, "revised_prompt": data.get("revised_prompt")})
330
+ else:
331
+ params = {"prompt": request.prompt, "aspect_ratio": request.aspect_ratio, "link": "typegpt.net"}
332
+ resp = await client.get(IMAGE_API_URL, params=params)
333
+ resp.raise_for_status()
334
+ data = resp.json()
335
+ results.append({"url": data.get("image_link"), "b64_json": data.get("base64_output")})
336
+ except httpx.HTTPStatusError as e:
337
+ return JSONResponse(status_code=502, content={"error": f"Image generation failed. Upstream error: {e.response.status_code}", "details": e.response.text})
338
+ except Exception as e:
339
+ return JSONResponse(status_code=500, content={"error": "An internal error occurred.", "details": str(e)})
340
+
341
+ return {"created": int(time.time()), "data": results}
342
 
343
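The endpoint mirrors OpenAI's images API shape: n controls the generation loop, and each result carries both url and b64_json. A usage sketch (local URL and prompt are hypothetical):

    import httpx

    resp = httpx.post("http://localhost:8000/v1/images/generations",
                      json={"prompt": "a lighthouse at dusk", "n": 1, "model": "default"},
                      timeout=180)
    resp.raise_for_status()
    for item in resp.json()["data"]:
        # A Snapzion URL when SNAP is configured, otherwise a data: URL or upstream link.
        print(item["url"])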
 
 
  @app.post("/v1/ocr", response_model=OcrResponse, tags=["OCR"])
  async def perform_ocr(request: OcrRequest):
      """
 
@@ -218,7 +369,7 @@ async def perform_ocr(request: OcrRequest):
          raw_output = prediction[0]
          raw_result_dict = {}

+         # --- Robust Parsing Logic ---
          if isinstance(raw_output, str):
              try:
                  # First, try to parse as standard JSON
 
@@ -234,17 +385,18 @@ async def perform_ocr(request: OcrRequest):
                      raw_result_dict = {"result": str(parsed_output)}
              except (ValueError, SyntaxError):
                  # If all parsing fails, assume the string is the direct OCR text.
+                 raw_result_dict = {"ocr_text_from_string": raw_output}
          elif isinstance(raw_output, dict):
              # It's already a dictionary, use it directly
              raw_result_dict = raw_output
          else:
              # Handle other unexpected data types
              raise HTTPException(status_code=502, detail=f"Unexpected data type from OCR service: {type(raw_output)}")

+         # Extract text from the dictionary, with multiple fallbacks
+         ocr_text = raw_result_dict.get("OCR",
+                                        raw_result_dict.get("ocr_text_from_string",
+                                                            str(raw_result_dict)))

          return OcrResponse(ocr_text=ocr_text, raw_response=raw_result_dict)
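The fallback chain matters because gradio_client can hand back a Python-repr string (single quotes) rather than JSON, which is what the new ast import is for. The same logic, distilled into a standalone function for illustration:

    import ast
    import json

    def parse_ocr_output(raw: str) -> dict:
        try:
            return json.loads(raw)                    # strict JSON first
        except json.JSONDecodeError:
            try:
                parsed = ast.literal_eval(raw)        # then Python literal syntax
                return parsed if isinstance(parsed, dict) else {"result": str(parsed)}
            except (ValueError, SyntaxError):
                return {"ocr_text_from_string": raw}  # finally, treat as plain text

    parse_ocr_output("{'OCR': 'Hello world'}")  # -> {'OCR': 'Hello world'}
    parse_ocr_output("plain text")              # -> {'ocr_text_from_string': 'plain text'}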
 
 
@@ -256,22 +408,69 @@ async def perform_ocr(request: OcrRequest):
          if temp_file_path and os.path.exists(temp_file_path):
              os.unlink(temp_file_path)

+
  @app.post("/v1/moderations", tags=["Moderation"])
  async def create_moderation(request: ModerationRequest):
+     """Handles moderation requests, conforming to the OpenAI API specification."""
+     input_texts = [request.input] if isinstance(request.input, str) else request.input
+     if not input_texts:
+         return JSONResponse(status_code=400, content={"error": {"message": "Request must have at least one input string."}})
+
+     headers = {'Content-Type': 'application/json', 'User-Agent': 'Mozilla/5.0', 'Referer': 'https://www.chatwithmono.xyz/'}
+     results = []
+
      try:
+         async with httpx.AsyncClient(timeout=30) as client:
              for text_input in input_texts:
+                 payload = {"text": text_input}
+                 resp = await client.post(MODERATION_API_URL, headers=headers, json=payload)
+                 resp.raise_for_status()
+
+                 upstream_data = resp.json()
+                 upstream_categories = upstream_data.get("categories", {})
+
+                 openai_categories = {
+                     "hate": upstream_categories.get("hate", False),
+                     "hate/threatening": False,
+                     "harassment": False,
+                     "harassment/threatening": False,
+                     "self-harm": upstream_categories.get("self-harm", False),
+                     "self-harm/intent": False,
+                     "self-harm/instructions": False,
+                     "sexual": upstream_categories.get("sexual", False),
+                     "sexual/minors": False,
+                     "violence": upstream_categories.get("violence", False),
+                     "violence/graphic": False,
+                 }
+
+                 result_item = {
+                     "flagged": upstream_data.get("overall_sentiment") == "flagged",
+                     "categories": openai_categories,
+                     "category_scores": {k: 1.0 if v else 0.0 for k, v in openai_categories.items()},
+                 }
+
+                 if reason := upstream_data.get("reason"):
+                     result_item["reason"] = reason
+
                  results.append(result_item)
+
+     except httpx.HTTPStatusError as e:
+         return JSONResponse(
+             status_code=502,
+             content={"error": {"message": f"Moderation failed. Upstream error: {e.response.status_code}", "details": e.response.text}}
+         )
+     except Exception as e:
+         return JSONResponse(
+             status_code=500,
+             content={"error": {"message": "An internal error occurred during moderation.", "details": str(e)}}
+         )
+
+     final_response = {
+         "id": generate_random_id("modr-"),
+         "model": request.model,
+         "results": results,
+     }
+     return JSONResponse(content=final_response)
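Category scores are synthesized as binary 1.0/0.0 because the upstream service only reports booleans. A request sketch (hypothetical local URL):

    import httpx

    resp = httpx.post("http://localhost:8000/v1/moderations",
                      json={"input": "some text to screen"})
    resp.raise_for_status()
    result = resp.json()["results"][0]
    print(result["flagged"], result["category_scores"]["violence"])  # e.g. False 0.0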
 

  # --- Main Execution ---