Function
pipe
v0.4.0
OpenRouter Integration for OpenWebUI
Function ID
openrouter_integration_for_openwebui
Creator
@preswest
Downloads
88+
Access the full suite of OpenRouter models directly within OpenWebUI, with support for citations, reasoning tokens, and optional prompt caching.
Function Code
""" title: OpenRouter Integration for OpenWebUI version: 0.4.0 description: Access the full suite of OpenRouter models directly within OpenWebUI with support for citations, reasoning tokens, and optional prompt caching. author: kevarch author_url: https://github.com/kevarch credits: rburmorrison (https://github.com/rburmorrison), Google Gemini Pro 2.5 license: MIT """ import re import requests import json import traceback # Import traceback for detailed error logging from typing import List, Union, Generator, Iterator from pydantic import BaseModel, Field # --- Helper function for citation text insertion --- def _insert_citations(text: str, citations: list[str]) -> str: """ Replace citation markers [n] in text with markdown links to the corresponding citation URLs. Args: text: The text containing citation markers like [1], [2], etc. citations: A list of citation URLs, where index 0 corresponds to [1] in the text Returns: Text with citation markers replaced with markdown links """ if not citations or not text: # No citations or text, return text as is return text pattern = r"\[(\d+)\]" def replace_citation(match_obj): try: num = int(match_obj.group(1)) # Citations are 0-indexed in the list, but 1-indexed in the text if 1 <= num <= len(citations): url = citations[num - 1] # Return Markdown link: [[n]](url) - common format return f"[[{num}]]({url})" else: # If no corresponding citation, return the original marker return match_obj.group(0) except (ValueError, IndexError): # Handle cases where the number is invalid or index out of bounds return match_obj.group(0) try: result = re.sub(pattern, replace_citation, text) return result except Exception as e: print(f"Error during citation insertion: {e}") return text # Return original text if regex fails # --- Helper function for formatting the final citation list --- def _format_citation_list(citations: list[str]) -> str: """ Formats a list of citation URLs into a markdown string. Args: citations: A list of citation URLs. Returns: A formatted markdown string (e.g., "\n\n---\nCitations:\n1. url1\n2. url2") or an empty string if no citations are provided. """ if not citations: return "" try: citation_list = [f"{i+1}. {url}" for i, url in enumerate(citations)] return "\n\n---\nCitations:\n" + "\n".join(citation_list) except Exception as e: print(f"Error formatting citation list: {e}") return "" # Return empty string on error # --- Main Pipe class --- class Pipe: class Valves(BaseModel): # User-configurable settings OPENROUTER_API_KEY: str = Field( default="", description="Your OpenRouter API key (required)." ) INCLUDE_REASONING: bool = Field( default=True, description="Request reasoning tokens from models that support it.", ) MODEL_PREFIX: str = Field( default="", description="Optional prefix for model names in Open WebUI (e.g., 'OR: ').", ) # NEW: Configurable request timeout REQUEST_TIMEOUT: int = Field( default=90, description="Timeout for API requests in seconds.", gt=0 # Ensure timeout is positive ) MODEL_PROVIDERS: str = Field( default="", description="Comma-separated list of model providers to include or exclude. Leave empty to include all providers." ) INVERT_PROVIDER_LIST: bool = Field( default=False, description="If true, the above 'Model Providers' list becomes an *exclude* list instead of an *include* list." ) ENABLE_CACHE_CONTROL: bool = Field( default=False, description="Enable OpenRouter prompt caching by adding 'cache_control' to potentially large message parts. 
May reduce costs for supported models (e.g., Anthropic, Gemini) on subsequent calls with the same cached prefix. See OpenRouter docs for details.", ) def __init__(self): self.type = "manifold" # Specifies this pipe provides multiple models self.valves = self.Valves() # Simple check on init, though user might change valves later if not self.valves.OPENROUTER_API_KEY: print("Warning: OPENROUTER_API_KEY is not set in Valves.") def pipes(self) -> List[dict]: """ Fetches available models from the OpenRouter API. This method is called by OpenWebUI to discover the models this pipe provides. """ if not self.valves.OPENROUTER_API_KEY: # Return an error entry if API key is missing return [{"id": "error", "name": "Pipe Error: OpenRouter API Key not provided"}] try: headers = {"Authorization": f"Bearer {self.valves.OPENROUTER_API_KEY}"} # Use configured timeout for this request too response = requests.get( "https://openrouter.ai/api/v1/models", headers=headers, timeout=self.valves.REQUEST_TIMEOUT ) response.raise_for_status() # Raise HTTPError for bad responses (4xx or 5xx) models_data = response.json() models = [] raw_models_data = models_data.get("data", []) # --- Provider Filtering Logic --- provider_list_str = self.valves.MODEL_PROVIDERS.lower() invert_list = self.valves.INVERT_PROVIDER_LIST target_providers = { p.strip() for p in provider_list_str.split(",") if p.strip() } # --- End Filtering Logic --- for model in raw_models_data: model_id = model.get("id") if not model_id: continue # Skip models without an ID # --- Apply Provider Filtering --- if target_providers: # Only filter if the list is not empty provider = model_id.split("/", 1)[0].lower() if "/" in model_id else model_id.lower() provider_in_list = provider in target_providers # Determine if we should keep the model based on include/exclude logic keep = (provider_in_list and not invert_list) or \ (not provider_in_list and invert_list) if not keep: continue # Skip this model if it doesn't match the filter # --- End Filtering --- # If we reach here, the model is kept (either no filter or passed filter) model_name = model.get("name", model_id) # Use name, fallback to id prefix = self.valves.MODEL_PREFIX models.append( { "id": model_id, # The actual ID OpenRouter expects # Display name in OpenWebUI, potentially prefixed "name": f"{prefix}{model_name}" if prefix else model_name, } ) if not models: # Adjust error message if filtering might be the cause if target_providers: return [{"id": "error", "name": "Pipe Error: No models found matching the provider filter"}] else: return [{"id": "error", "name": "Pipe Error: No models found on OpenRouter"}] return models # --- Improved Error Handling --- except requests.exceptions.Timeout: print("Error fetching models: Request timed out.") return [{"id": "error", "name": "Pipe Error: Timeout fetching models"}] except requests.exceptions.HTTPError as e: # Handle HTTP errors (like 401 Unauthorized, 404 Not Found, etc.) 
error_msg = f"Pipe Error: HTTP {e.response.status_code} fetching models" try: # Try to get more specific error from response body error_detail = e.response.json().get("error", {}).get("message", "") if error_detail: error_msg += f": {error_detail}" except json.JSONDecodeError: pass # Ignore if response body isn't valid JSON print(f"Error fetching models: {error_msg} (URL: {e.request.url})") return [{"id": "error", "name": error_msg}] except requests.exceptions.RequestException as e: # Handle other network/request errors print(f"Error fetching models: Request failed: {e}") return [{"id": "error", "name": f"Pipe Error: Network error fetching models: {e}"}] except Exception as e: # Catch any other unexpected errors during model fetching print(f"Unexpected error fetching models: {e}") traceback.print_exc() return [{"id": "error", "name": f"Pipe Error: Unexpected error: {e}"}] def pipe(self, body: dict) -> Union[str, Generator, Iterator]: """ Processes incoming chat requests. This is the main function called by OpenWebUI when a user interacts with a model provided by this pipe. Args: body: The request body, conforming to OpenAI chat completions format. Returns: Either a string (for non-streaming responses) or a generator/iterator (for streaming responses). """ if not self.valves.OPENROUTER_API_KEY: # Handle missing API key at the start of processing return "Pipe Error: OpenRouter API Key is not configured." try: payload = body.copy() # print(f"Original request body: {json.dumps(body)[:500]}...") # Optional: for debugging # Extract the actual model ID if it's prefixed (e.g., "pipe_id.model_id") # OpenWebUI might send the model field like this. if "model" in payload and payload["model"] and "." in payload["model"]: # Assuming format "some_prefix.actual-model-id" payload["model"] = payload["model"].split(".", 1)[1] # print(f"Extracted model ID: {payload['model']}") # Optional: for debugging # --- Apply Cache Control Logic --- if self.valves.ENABLE_CACHE_CONTROL and "messages" in payload: try: cache_applied = False messages = payload["messages"] # 1. Try applying to System Message system_message_index = -1 for i, msg in enumerate(messages): if msg.get("role") == "system": system_message_index = i break if system_message_index != -1: system_msg = messages[system_message_index] if isinstance(system_msg.get("content"), list): longest_text_part_index = -1 max_len = -1 for j, part in enumerate(system_msg["content"]): if part.get("type") == "text": text_len = len(part.get("text", "")) if text_len > max_len: max_len = text_len longest_text_part_index = j if longest_text_part_index != -1: # Add cache control to the longest text part system_msg["content"][longest_text_part_index]["cache_control"] = {"type": "ephemeral"} cache_applied = True # print(f"DEBUG: Applied cache_control to system message part {longest_text_part_index}") # Optional Debug # 2. 
If not applied, try applying to the Last User Message if not cache_applied: last_user_message_index = -1 for i in range(len(messages) - 1, -1, -1): if messages[i].get("role") == "user": last_user_message_index = i break if last_user_message_index != -1: user_msg = messages[last_user_message_index] if isinstance(user_msg.get("content"), list): longest_text_part_index = -1 max_len = -1 for j, part in enumerate(user_msg["content"]): if part.get("type") == "text": text_len = len(part.get("text", "")) if text_len > max_len: max_len = text_len longest_text_part_index = j if longest_text_part_index != -1: # Add cache control to the longest text part user_msg["content"][longest_text_part_index]["cache_control"] = {"type": "ephemeral"} # print(f"DEBUG: Applied cache_control to last user message part {longest_text_part_index}") # Optional Debug except Exception as cache_err: # Log error but don't stop the request print(f"Warning: Error applying cache_control logic: {cache_err}") traceback.print_exc() # Print detailed traceback for debugging # --- End Cache Control Logic --- # Add include_reasoning parameter if the valve is enabled if self.valves.INCLUDE_REASONING: payload["include_reasoning"] = True # Prepare headers for the OpenRouter API request headers = { "Authorization": f"Bearer {self.valves.OPENROUTER_API_KEY}", "Content-Type": "application/json", # Recommended headers for OpenRouter analytics "HTTP-Referer": body.get("http_referer", "https://openwebui.com/"), # Default if not provided "X-Title": body.get("x_title", "Open WebUI via Pipe"), # Default if not provided } # API endpoint for chat completions url = "https://openrouter.ai/api/v1/chat/completions" # Determine if streaming is requested is_streaming = body.get("stream", False) # Call the appropriate handler based on streaming mode if is_streaming: # Pass helper functions and timeout value return self.stream_response( url, headers, payload, _insert_citations, _format_citation_list, self.valves.REQUEST_TIMEOUT ) else: # Pass helper functions and timeout value return self.non_stream_response( url, headers, payload, _insert_citations, _format_citation_list, self.valves.REQUEST_TIMEOUT ) except Exception as e: # Catch unexpected errors during request preparation print(f"Error preparing request in pipe method: {e}") traceback.print_exc() # Return error string (will be displayed to user in UI) return f"Pipe Error: Failed to prepare request: {e}" def non_stream_response(self, url, headers, payload, citation_inserter, citation_formatter, timeout): """Handles non-streaming API requests.""" try: # print(f"Sending non-streaming request to OpenRouter: {json.dumps(payload)[:200]}...") # Optional response = requests.post(url, headers=headers, json=payload, timeout=timeout) response.raise_for_status() # Check for HTTP errors res = response.json() # print(f"OpenRouter response keys: {list(res.keys())}") # Optional if not res.get("choices") or len(res["choices"]) == 0: return "" # Return empty if no choices received choice = res["choices"][0] message = choice.get("message", {}) citations = res.get("citations") or [] # Get citations if present # print(f"Message keys: {list(message.keys())}") # Optional content = message.get("content") # Get content, might be None reasoning = message.get("reasoning") # Get reasoning, might be None # Ensure content and reasoning are strings content = content if content is not None else "" reasoning = reasoning if reasoning is not None else "" # print(f"Found reasoning: {bool(reasoning)} ({len(reasoning)} chars)") # Optional 
# print(f"Found content: {bool(content)} ({len(content)} chars)") # Optional # Insert citation links into the text content_with_citations = citation_inserter(content, citations) reasoning_with_citations = citation_inserter(reasoning, citations) # Format the final citation list using the helper citation_list_str = citation_formatter(citations) # Combine reasoning (if any), content, and citation list final_response = "" if reasoning_with_citations: final_response += f"<think>\n{reasoning_with_citations}\n</think>\n\n" if content_with_citations: final_response += content_with_citations # Append the formatted citation list if there's any content or reasoning if final_response: final_response += citation_list_str return final_response # --- Improved Error Handling --- except requests.exceptions.Timeout: print(f"Error in non_stream_response: Request timed out after {timeout}s.") return f"Pipe Error: Request timed out ({timeout}s)" except requests.exceptions.HTTPError as e: error_msg = f"Pipe Error: API returned HTTP {e.response.status_code}" try: error_detail = e.response.json().get("error", {}).get("message", "") if error_detail: error_msg += f": {error_detail}" except json.JSONDecodeError: error_msg += f" (Body: {e.response.text[:200]})" # Show start of body if not JSON except Exception: pass # Ignore other parsing errors print(f"Error in non_stream_response: {error_msg} (URL: {e.request.url})") print(f"Request payload that caused error: {json.dumps(payload)}") # Log payload on error return error_msg except requests.exceptions.RequestException as e: print(f"Error in non_stream_response: Request failed: {e}") return f"Pipe Error: Network error during request: {e}" except json.JSONDecodeError as e: print(f"Error in non_stream_response: Failed to decode API response JSON: {e}") # Attempt to return raw response if decoding fails try: raw_response = response.text return f"Pipe Error: Failed to decode API response. 
Raw response: {raw_response[:500]}" except NameError: # response might not be defined if request failed earlier return f"Pipe Error: Failed to decode API response: {e}" except Exception as e: print(f"Unexpected error in non_stream_response: {e}") traceback.print_exc() return f"Pipe Error: Unexpected error processing response: {e}" def stream_response(self, url, headers, payload, citation_inserter, citation_formatter, timeout): """Handles streaming API requests using a generator.""" response = None # Initialize response to None try: # print(f"Sending streaming request to OpenRouter: {json.dumps(payload)[:200]}...") # Optional response = requests.post( url, headers=headers, json=payload, stream=True, timeout=timeout ) response.raise_for_status() # Check for initial HTTP errors before streaming in_reasoning_state = False latest_citations = [] buffer = "" # Buffer for accumulating text chunks # Iterate through Server-Sent Events (SSE) for line in response.iter_lines(): if not line: continue # Skip keep-alive newlines line_text = line.decode("utf-8") if not line_text.startswith("data: "): continue # Ignore non-data lines if line_text == "data: [DONE]": # Stream finished, process any remaining buffer if buffer: yield citation_inserter(buffer, latest_citations) buffer = "" # Append final citation list yield citation_formatter(latest_citations) break # Exit loop cleanly try: chunk_data = line_text[6:].strip() # Get data part and remove whitespace if not chunk_data: continue # Skip empty data chunks chunk = json.loads(chunk_data) if "choices" in chunk and chunk["choices"]: choice = chunk["choices"][0] # Update citations if present in the chunk chunk_citations = chunk.get("citations") if chunk_citations is not None: latest_citations = chunk_citations delta = choice.get("delta", {}) message = choice.get("message", {}) # Handle non-delta messages too reasoning_text = delta.get("reasoning") if delta else message.get("reasoning") content_text = delta.get("content") if delta else message.get("content") # Ensure None is treated as empty string reasoning_text = reasoning_text if reasoning_text is not None else "" content_text = content_text if content_text is not None else "" # Handle reasoning tokens if reasoning_text: if not in_reasoning_state: # Process buffer (content) before starting <think> tag if buffer: yield citation_inserter(buffer, latest_citations) buffer = "" yield "<think>\n" in_reasoning_state = True buffer += reasoning_text # Append reasoning to buffer # Handle content tokens if content_text: if in_reasoning_state: # Process buffer (reasoning) before closing </think> tag if buffer: yield citation_inserter(buffer, latest_citations) buffer = "" yield "\n</think>\n\n" in_reasoning_state = False buffer += content_text # Append content to buffer except json.JSONDecodeError: print(f"Skipping invalid JSON line in stream: {line_text}") continue # Skip this line and continue streaming except Exception as e: # Log error during chunk processing but try to continue streaming print(f"Error processing stream chunk: {e} - Line: {line_text}") traceback.print_exc() # Optionally yield an inline error message (might disrupt flow) # yield f"\n[Pipe Warning: Error processing part of the stream: {e}]\n" continue # Final check: If stream ended while in reasoning state, close tag and process buffer if in_reasoning_state: if buffer: yield citation_inserter(buffer, latest_citations) # Process remaining reasoning yield "\n</think>\n\n" # Close the tag elif buffer: # Process any remaining content buffer if not in 
reasoning state yield citation_inserter(buffer, latest_citations) # --- Improved Error Handling --- except requests.exceptions.Timeout: print(f"Error in stream_response: Request timed out after {timeout}s.") yield f"Pipe Error: Request timed out ({timeout}s)" except requests.exceptions.HTTPError as e: error_msg = f"Pipe Error: API returned HTTP {e.response.status_code}" try: # Try reading the response body *after* the exception error_body = e.response.text print(f"HTTPError Body: {error_body[:500]}") # Log error body error_detail = json.loads(error_body).get("error", {}).get("message", "") if error_detail: error_msg += f": {error_detail}" else: error_msg += f" (Body: {error_body[:200]})" except json.JSONDecodeError: error_msg += f" (Body: {e.response.text[:200]})" # Show start of body if not JSON except Exception as parse_err: print(f"Could not parse HTTPError body: {parse_err}") error_msg += f" (Could not parse error body)" print(f"Error in stream_response: {error_msg} (URL: {e.request.url})") print(f"Request payload that caused error: {json.dumps(payload)}") # Log payload on error yield error_msg # Yield the formatted error to the UI except requests.exceptions.RequestException as e: print(f"Error in stream_response: Request failed: {e}") yield f"Pipe Error: Network error during streaming request: {e}" except Exception as e: # Catch unexpected errors during streaming setup or iteration print(f"Unexpected error in stream_response: {e}") traceback.print_exc() yield f"Pipe Error: Unexpected error during streaming: {e}" finally: # Ensure the response connection is closed if it was opened if response: response.close()
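For reference, here is a minimal standalone sketch (not part of the function code above) of what the two citation helpers produce, and of the message shape the cache-control step writes when ENABLE_CACHE_CONTROL is on. The sample text and URLs are invented for illustration only.

# Standalone illustration only -- sample text and URLs are made up.
from typing import Any

text = "Solar output varies by season [1] and by latitude [2]."
citations = ["https://example.com/solar", "https://example.com/latitude"]

# _insert_citations() turns "[1]" into a markdown link "[[1]](https://example.com/solar)":
linked = _insert_citations(text, citations)
# -> "Solar output varies by season [[1]](https://example.com/solar) and by latitude [[2]](https://example.com/latitude)."

# _format_citation_list() builds the trailing reference block appended to responses:
footer = _format_citation_list(citations)
# -> "\n\n---\nCitations:\n1. https://example.com/solar\n2. https://example.com/latitude"

# With ENABLE_CACHE_CONTROL enabled, the pipe marks the longest text part of the
# system (or last user) message so OpenRouter can cache that prefix on supported models:
cached_system_message: dict[str, Any] = {
    "role": "system",
    "content": [
        {
            "type": "text",
            "text": "...a long, reusable system prompt...",
            "cache_control": {"type": "ephemeral"},
        }
    ],
}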