"""
title: OpenRouter
version: 0.2.0
license: MIT
description: Adds support for OpenRouter, including citations, reasoning tokens, and API call reporting
author: Zhuang Yumin
author_url: https://zhuangyumin.dev
"""

import re
import aiohttp
import json
import time
from typing import List, Union, Generator, Iterator, Optional, Callable, Any, Awaitable, AsyncGenerator
from pydantic import BaseModel, Field
import asyncio


def _insert_citations(text: str, citations: list[str]) -> str:
    """
    Replace citation markers [n] in text with markdown links to the corresponding citation URLs.

    Args:
        text: The text containing citation markers like [1], [2], etc.
        citations: A list of citation URLs, where index 0 corresponds to [1] in the text

    Returns:
        Text with citation markers replaced with markdown links
    """
    # Define regex pattern for citation markers [n]
    pattern = r"\[(\d+)\]"

    def replace_citation(match_obj):
        # Extract the number from the match
        num = int(match_obj.group(1))

        # Check if there's a corresponding citation URL
        # Citations are 0-indexed in the list, but 1-indexed in the text
        if 1 <= num <= len(citations):
            url = citations[num - 1]
            # Return Markdown link: [url]([n])
            return f"[{match_obj.group(0)}]({url})"
        else:
            # If no corresponding citation, return the original marker
            return match_obj.group(0)

    # Replace all citation markers in the text
    result = re.sub(pattern, replace_citation, text)

    return result


class Pipe:
    class Valves(BaseModel):
        OPENROUTER_API_KEY: str = Field(
            default="", description="Your OpenRouter API key"
        )
        INCLUDE_REASONING: bool = Field(
            default=True,
            description="Request reasoning tokens from models that support it",
        )
        MODEL_PREFIX: str = Field(
            default="", description="Optional prefix for model names in Open WebUI"
        )
        REPORT_API_URL: str = Field(
            default="",
            description="URL to report API",
        )
        REPORT_API_KEY: str = Field(
            default="",
            description="API key to report API",
        )

    def __init__(self):
        self.type = "manifold"  # Multiple models
        self.valves = self.Valves()

    async def pipes(self) -> List[dict]:
        """Fetch available models from OpenRouter API asynchronously"""
        if not self.valves.OPENROUTER_API_KEY:
            return [{"id": "error", "name": "API Key not provided"}]

        try:
            headers = {"Authorization": f"Bearer {self.valves.OPENROUTER_API_KEY}"}
            
            async with aiohttp.ClientSession() as session:
                async with session.get(
                    "https://openrouter.ai/api/v1/models", 
                    headers=headers,
                    timeout=aiohttp.ClientTimeout(total=30)
                ) as response:
                    if response.status != 200:
                        return [
                            {
                                "id": "error",
                                "name": f"Error fetching models: {response.status}",
                            }
                        ]

                    models_data = await response.json()

            # Extract model information
            models = []
            for model in models_data.get("data", []):
                model_id = model.get("id")
                if model_id:
                    # Use model name or ID, with optional prefix
                    model_name = model.get("name", model_id)
                    prefix = self.valves.MODEL_PREFIX
                    models.append(
                        {
                            "id": model_id,
                            "name": f"{prefix}{model_name}" if prefix else model_name,
                        }
                    )

            return models or [{"id": "error", "name": "No models found"}]

        except Exception as e:
            print(f"Error fetching models: {e}")
            return [{"id": "error", "name": f"Error: {str(e)}"}]

    async def _report_api_call_direct(self, usage_info: dict, user_email: str, model_id: str, __event_emitter__: Callable[[Any], Awaitable[None]]):
        """Report API call to upstream reporting service using direct usage information asynchronously"""
        if not self.valves.REPORT_API_URL or not self.valves.REPORT_API_KEY:
            return
        
        try:
            # Extract required fields for reporting from usage info
            timestamp = int(time.time())
            input_tokens = usage_info.get("prompt_tokens", 0)
            output_tokens = usage_info.get("completion_tokens", 0)
            cost_usd = usage_info.get("cost", 0.0)
            
            # Prepare API call record
            api_call_record = {
                "timestamp": timestamp,
                "model_id": model_id,
                "user_email": user_email,
                "input_tokens": input_tokens,
                "output_tokens": output_tokens,
                "cost_usd": cost_usd
            }
            
            # Send to reporting API asynchronously
            headers = {
                "Authorization": f"Bearer {self.valves.REPORT_API_KEY}",
                "Content-Type": "application/json"
            }
            
            report_url = f"{self.valves.REPORT_API_URL.rstrip('/')}/api/record_api_call"
            
            async with aiohttp.ClientSession() as session:
                async with session.post(
                    report_url,
                    headers=headers,
                    json=api_call_record,
                    timeout=aiohttp.ClientTimeout(total=30)
                ) as response:
                    if response.status == 200:
                        print(f"Successfully reported API call for user {user_email}")
                    else:
                        print(f"Failed to report API call: {response.status}")
            
            info = f"input: {input_tokens} | output: {output_tokens} | cost: {cost_usd:.6f}"
            await __event_emitter__(
                {
                    "type": "status",
                    "data": {
                        "description": info,
                        "done": True,
                    },
                }
            )
        except Exception as e:
            print(f"Error reporting API call: {e}")

    async def pipe(self, body: dict, __user__: dict, __metadata__: dict, __event_emitter__: Callable[[Any], Awaitable[None]]) -> Union[str, AsyncGenerator]:
        """Process the request and handle reasoning tokens if supported"""
        # Clone the body for OpenRouter
        payload = body.copy()

        # Print incoming body for debugging
        print(f"Original request body: {json.dumps(body)[:500]}...")

        # Extract user email and model ID for reporting
        user_email = __user__.get("email", "") if __user__ else ""
        model_id = __metadata__.get("model").get("id", "") if __metadata__ else ""

        # Make sure the model ID is properly extracted from the pipe format
        if "model" in payload and payload["model"] and "." in payload["model"]:
            # Extract the model ID from the format like "openrouter.model-id"
            payload["model"] = payload["model"].split(".", 1)[1]
            print(f"Extracted model ID: {payload['model']}")

        # Add include_reasoning parameter if enabled
        if self.valves.INCLUDE_REASONING:
            payload["include_reasoning"] = True
        
        # Add usage tracking to get token and cost information directly
        payload["usage"] = {"include": True}

        # Set up headers
        headers = {
            "Authorization": f"Bearer {self.valves.OPENROUTER_API_KEY}",
            "Content-Type": "application/json",
        }

        # Add HTTP-Referer and X-Title if provided
        # These help identify your app on OpenRouter
        if body.get("http_referer"):
            headers["HTTP-Referer"] = body["http_referer"]
        if body.get("x_title"):
            headers["X-Title"] = body["x_title"]

        # Default headers for identifying the app to OpenRouter
        if "HTTP-Referer" not in headers:
            headers["HTTP-Referer"] = "https://openwebui.com/"
        if "X-Title" not in headers:
            headers["X-Title"] = "Open WebUI via Pipe"

        url = "https://openrouter.ai/api/v1/chat/completions"

        try:
            if body.get("stream", False):
                return self.stream_response(url, headers, payload, user_email, model_id, __event_emitter__)
            else:
                return await self.non_stream_response(url, headers, payload, user_email, model_id, __event_emitter__)
        except aiohttp.ClientError as e:
            print(f"Request failed: {e}")
            return f"Error: Request failed: {e}"
        except Exception as e:
            print(f"Error in pipe method: {e}")
            return f"Error: {e}"

    async def non_stream_response(self, url, headers, payload, user_email, model_id, __event_emitter__: Callable[[Any], Awaitable[None]]):
        """Handle non-streaming responses and wrap reasoning in <think> tags if present"""
        try:
            print(
                f"Sending non-streaming request to OpenRouter: {json.dumps(payload)[:200]}..."
            )
            
            async with aiohttp.ClientSession() as session:
                async with session.post(
                    url, 
                    headers=headers, 
                    json=payload, 
                    timeout=aiohttp.ClientTimeout(total=90)
                ) as response:
                    if response.status != 200:
                        error_message = f"HTTP Error {response.status}"
                        try:
                            error_data = await response.json()
                            print(f"Error response: {json.dumps(error_data)}")
                            if "error" in error_data:
                                if (
                                    isinstance(error_data["error"], dict)
                                    and "message" in error_data["error"]
                                ):
                                    error_message += f": {error_data['error']['message']}"
                                else:
                                    error_message += f": {error_data['error']}"
                        except Exception as e:
                            print(f"Failed to parse error response: {e}")
                            error_text = await response.text()
                            error_message += f": {error_text[:500]}"

                        # Log request payload for debugging
                        print(f"Request that caused error: {json.dumps(payload)}")
                        raise Exception(error_message)

                    res = await response.json()
                    print(f"OpenRouter response keys: {list(res.keys())}")

            # Extract usage information directly from response for reporting
            if user_email and model_id:
                usage_info = res.get("usage", {})
                if usage_info:
                    try:
                        await self._report_api_call_direct(usage_info, user_email, model_id, __event_emitter__)
                    except Exception as e:
                        print(f"Error reporting API call: {e}")
                        return f"Error: {e}"
                else:
                    print(f"No usage information found in response")
                    return f"Error: No usage information found in response" 

            # Check if we have choices in the response
            if not res.get("choices") or len(res["choices"]) == 0:
                return ""

            # Extract content and reasoning if present
            choice = res["choices"][0]
            message = choice.get("message", {})

            # Debug output
            print(f"Message keys: {list(message.keys())}")

            content = message.get("content", "")
            reasoning = message.get("reasoning", "")

            print(f"Found reasoning: {bool(reasoning)} ({len(reasoning) if reasoning is not None else 0} chars)")
            print(f"Found content: {bool(content)} ({len(content) if content is not None else 0} chars)")

            # If we have both reasoning and content
            if reasoning and content:
                return f"<think>\n{reasoning}\n</think>\n\n{content}"
            elif reasoning:  # Only reasoning, no content (unusual)
                return f"<think>\n{reasoning}\n</think>\n\n"
            elif content:  # Only content, no reasoning
                return content
            return ""
        except Exception as e:
            print(f"Error in non_stream_response: {e}")
            return f"Error: {e}"

    async def stream_response(self, url, headers, payload, user_email, model_id, __event_emitter__: Callable[[Any], Awaitable[None]]):
        """Stream reasoning tokens in real-time with proper tag management"""
        try:
            async with aiohttp.ClientSession() as session:
                async with session.post(
                    url, 
                    headers=headers, 
                    json=payload,
                    timeout=aiohttp.ClientTimeout(total=90)
                ) as response:
                    if response.status != 200:
                        error_message = f"HTTP Error {response.status}"
                        try:
                            error_data = await response.json()
                            error_message += (
                                f": {error_data.get('error', {}).get('message', '')}"
                            )
                        except:
                            pass
                        raise Exception(error_message)

                    # State tracking
                    in_reasoning_state = False  # True if we've output the opening <think> tag
                    latest_citations = []  # The latest citations list
                    done_received = False  # Track if we've received [DONE]
                    usage_info = None  # Store usage information for reporting

                    # Process the response stream asynchronously
                    async for line_bytes in response.content:
                        if not line_bytes:
                            continue

                        line_text = line_bytes.decode("utf-8").strip()
                        
                        # Handle multiple lines in a single chunk
                        for line in line_text.split('\n'):
                            if not line.strip():
                                continue
                                
                            if not line.startswith("data: "):
                                continue
                            elif line == "data: [DONE]":
                                done_received = True
                                # Handle citations at the end
                                if latest_citations:
                                    citation_list = [f"1. {l}" for l in latest_citations]
                                    citation_list_str = "\n".join(citation_list)
                                    yield f"\n\n---\nCitations:\n{citation_list_str}"
                                continue

                            try:
                                chunk = json.loads(line[6:])

                                # Check for usage information (appears after [DONE])
                                if "usage" in chunk:
                                    usage_info = chunk["usage"]
                                    print(f"Extracted usage info: {usage_info}")
                                    
                                    # Handle reporting with usage information
                                    if user_email and model_id and usage_info:
                                        try:
                                            await self._report_api_call_direct(usage_info, user_email, model_id, __event_emitter__)
                                        except Exception as e:
                                            print(f"Error reporting API call: {e}")
                                            yield f"Error: {e}"
                                        yield ""  # trick to ensure proper completion
                                    continue

                                if "choices" in chunk and chunk["choices"]:
                                    choice = chunk["choices"][0]
                                    citations = chunk.get("citations") or []

                                    # Update the citation list
                                    if citations:
                                        latest_citations = citations

                                    # Check for reasoning tokens
                                    reasoning_text = None
                                    if "delta" in choice and "reasoning" in choice["delta"]:
                                        reasoning_text = choice["delta"]["reasoning"]
                                    elif "message" in choice and "reasoning" in choice["message"]:
                                        reasoning_text = choice["message"]["reasoning"]

                                    # Check for content tokens
                                    content_text = None
                                    if "delta" in choice and "content" in choice["delta"]:
                                        content_text = choice["delta"]["content"]
                                    elif "message" in choice and "content" in choice["message"]:
                                        content_text = choice["message"]["content"]

                                    # Handle reasoning tokens
                                    if reasoning_text:
                                        # If first reasoning token, output opening tag
                                        if not in_reasoning_state:
                                            yield "<think>\n"
                                            in_reasoning_state = True

                                        # Output the reasoning token
                                        yield _insert_citations(reasoning_text, citations)

                                    # Handle content tokens
                                    if content_text:
                                        # If transitioning from reasoning to content, close the thinking tag
                                        if in_reasoning_state:
                                            yield "\n</think>\n\n"
                                            in_reasoning_state = False

                                        # Output the content
                                        if content_text:
                                            yield _insert_citations(content_text, citations)

                            except Exception as e:
                                print(f"Error processing chunk: {e}")

                    # If we're still in reasoning state at the end, close the tag
                    if in_reasoning_state:
                        yield "\n</think>\n\n"

        except Exception as e:
            print(f"Error in stream_response: {e}")
            yield f"Error: {e}"