From a39c4275fe829b0bd813675d9674916ca5129768 Mon Sep 17 00:00:00 2001
From: "zhenjun.chen" <zhenkun.wang@dotcunited.com>
Date: Sat, 30 May 2026 15:40:52 +0800
Subject: [PATCH 1/2] Add orcarouter_chat example

---
 orcarouter_chat/.env.example                  |   1 +
 orcarouter_chat/.gitignore                    |   8 +
 orcarouter_chat/README.md                     |  50 ++
 orcarouter_chat/orcarouter_chat/__init__.py   |   0
 .../orcarouter_chat/orcarouter_chat.py        | 444 ++++++++++++++++++
 orcarouter_chat/requirements.txt              |   4 +
 orcarouter_chat/rxconfig.py                   |   6 +
 7 files changed, 513 insertions(+)
 create mode 100644 orcarouter_chat/.env.example
 create mode 100644 orcarouter_chat/.gitignore
 create mode 100644 orcarouter_chat/README.md
 create mode 100644 orcarouter_chat/orcarouter_chat/__init__.py
 create mode 100644 orcarouter_chat/orcarouter_chat/orcarouter_chat.py
 create mode 100644 orcarouter_chat/requirements.txt
 create mode 100644 orcarouter_chat/rxconfig.py

diff --git a/orcarouter_chat/.env.example b/orcarouter_chat/.env.example
new file mode 100644
index 00000000..1c5890be
--- /dev/null
+++ b/orcarouter_chat/.env.example
@@ -0,0 +1 @@
+ORCAROUTER_API_KEY=sk-orca-replace-me
diff --git a/orcarouter_chat/.gitignore b/orcarouter_chat/.gitignore
new file mode 100644
index 00000000..3c43506f
--- /dev/null
+++ b/orcarouter_chat/.gitignore
@@ -0,0 +1,8 @@
+assets/external/
+.states
+.web
+*.db
+__pycache__/
+*.py[cod]
+.env
+.venv/
diff --git a/orcarouter_chat/README.md b/orcarouter_chat/README.md
new file mode 100644
index 00000000..0089c2ca
--- /dev/null
+++ b/orcarouter_chat/README.md
@@ -0,0 +1,50 @@
+# OrcaRouter chat
+
+A minimal Reflex chat app that calls [OrcaRouter](https://www.orcarouter.ai),
+an OpenAI-compatible LLM gateway, and lets you switch between adaptive routing
+(`orcarouter/auto`) and specific upstream models from a dropdown -- same API
+key, same endpoint.
+
+The model dropdown is populated at startup from OrcaRouter's public pricing
+catalog (`https://www.orcarouter.ai/api/pricing`, no auth required), so new
+models added on the server side show up the next time you click **Refresh**.
+If the catalog endpoint is unreachable the app falls back to a curated list of
+flagship models.
+
+## Setup
+
+1. Get an API key at <https://www.orcarouter.ai/console> (the key starts with
+   `sk-orca-`).
+2. Copy the example env file and paste your key:
+   ```bash
+   cp .env.example .env
+   # then edit .env and set ORCAROUTER_API_KEY=sk-orca-...
+   ```
+3. Install dependencies and run:
+   ```bash
+   pip install -r requirements.txt
+   reflex run
+   ```
+
+Open <http://localhost:3000>, pick a model from the dropdown, and start
+chatting.
+
+## What this example demonstrates
+
+- Using OrcaRouter as a drop-in OpenAI-compatible provider
+  (`AsyncOpenAI(base_url="https://api.orcarouter.ai/v1", api_key=...)`).
+- Switching between `orcarouter/auto` (adaptive routing) and specific upstream
+  models (`openai/...`, `anthropic/...`, ...) without changing client code.
+- Passing OrcaRouter-specific routing preferences via the `extra_body` field
+  (`{"models": [...], "route": "fallback"}`).
+- Attaching attribution headers (`HTTP-Referer`, `X-Title`) so OrcaRouter can
+  report which client originated the request.
+- Skipping `temperature` for reasoning models (Claude Opus, GPT-5 family,
+  DeepSeek reasoner) which reject the parameter.
+
+## References
+
+- OrcaRouter docs: <https://docs.orcarouter.ai>
+- Routing strategies and `orcarouter/auto`:
+  <https://www.orcarouter.ai/console/routing>
+- Full model catalog: <https://www.orcarouter.ai/models>
diff --git a/orcarouter_chat/orcarouter_chat/__init__.py b/orcarouter_chat/orcarouter_chat/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/orcarouter_chat/orcarouter_chat/orcarouter_chat.py b/orcarouter_chat/orcarouter_chat/orcarouter_chat.py
new file mode 100644
index 00000000..93137bf1
--- /dev/null
+++ b/orcarouter_chat/orcarouter_chat/orcarouter_chat.py
@@ -0,0 +1,444 @@
+"""OrcaRouter chat example for Reflex.
+
+Demonstrates calling OrcaRouter (https://www.orcarouter.ai) -- an OpenAI-compatible
+LLM gateway -- from a Reflex app, with a runtime-loaded model dropdown that lets you
+switch between adaptive routing (orcarouter/auto) and specific upstream models in
+one click.
+
+Run:
+    cp .env.example .env  # fill in ORCAROUTER_API_KEY (get one at https://www.orcarouter.ai/console)
+    pip install -r requirements.txt
+    reflex run
+"""
+
+from __future__ import annotations
+
+import os
+import re
+from pathlib import Path
+from typing import Any
+
+import httpx
+import reflex as rx
+from openai import AsyncOpenAI
+
+try:
+    from dotenv import load_dotenv
+
+    _here = Path(__file__).resolve().parent
+    for candidate in (_here / ".env", _here.parent / ".env"):
+        if candidate.exists():
+            load_dotenv(candidate, override=False)
+            break
+except ImportError:
+    pass
+
+ORCAROUTER_BASE_URL = "https://api.orcarouter.ai/v1"
+ORCAROUTER_PRICING_URL = "https://www.orcarouter.ai/api/pricing"
+
+ATTRIBUTION_HEADERS = {
+    "HTTP-Referer": "https://www.orcarouter.ai/",
+    "X-Title": "reflex-orcarouter-chat",
+}
+
+FALLBACK_MODELS: list[str] = [
+    "orcarouter/auto",
+    "openai/gpt-5.5",
+    "google/gemini-3-flash-preview",
+    "anthropic/claude-opus-4.7",
+    "grok/grok-4.3",
+    "deepseek/deepseek-v4-pro",
+    "minimax/minimax-m2.7",
+    "qwen/qwen3.6-flash",
+]
+
+
+def is_chat_model(name: str, entry: dict[str, Any]) -> bool:
+    """Filter /api/pricing entries down to chat-LLM models.
+
+    Mirrors the rules documented in OrcaRouter's pricing schema: skip image /
+    video / embedding / TTS / STT / rerank entries plus models that only live
+    on the responses or completions endpoint.
+    """
+    eps = set(entry.get("supported_endpoint_types") or [])
+    n = name.lower()
+    if "image-generation" in eps or "openai-video" in eps:
+        return False
+    if "image" in set(entry.get("output_modalities") or []):
+        return False
+    if any(k in n for k in ("imagen", "dall-e", "gpt-image", "grok-imagine")):
+        return False
+    if "embedding" in n or "tts" in n or n.endswith("-speech"):
+        return False
+    if "whisper" in n or "transcrib" in n or "rerank" in n:
+        return False
+    if "openai-response" in eps and "openai" not in eps:
+        return False
+    if "codex" in n:
+        return False
+    if re.match(r"openai/gpt-5(\.\d+)?-pro", n):
+        return False
+    return True
+
+
+def is_reasoning_model(model: str) -> bool:
+    """Models that reject `temperature` (and need longer timeouts).
+
+    Detected by the OrcaRouter-documented patterns: Claude Opus reasoning,
+    OpenAI gpt-5 / o-series, DeepSeek reasoner / r1, plus the conservative
+    catch-all `*-reasoner` / `*-thinking` suffix used by several upstreams.
+    The submit handler also retries once without temperature if the upstream
+    still rejects it, so this list is a fast path, not a hard contract.
+    """
+    m = model.lower()
+    if m.startswith("anthropic/claude-opus"):
+        return True
+    if re.match(r"openai/gpt-5(\.\d+)?($|[-/])", m):
+        return True
+    if re.match(r"openai/o\d+($|[-/])", m):
+        return True
+    if "deepseek-reasoner" in m or "deepseek-r1" in m:
+        return True
+    if m.endswith("-reasoner") or m.endswith("-thinking"):
+        return True
+    return False
+
+
+def force_stream_model(model: str) -> bool:
+    """z-ai/glm-4.5 family rejects non-streaming requests."""
+    m = model.lower()
+    return m.startswith("z-ai/glm-4.5")
+
+
+class State(rx.State):
+    """Chat state."""
+
+    models: list[str] = list(FALLBACK_MODELS)
+    model: str = FALLBACK_MODELS[0]
+    custom_model: str = ""
+    use_fallback_route: bool = False
+    fallback_models_csv: str = "openai/gpt-5.5, anthropic/claude-opus-4.7"
+
+    prompt: str = ""
+    messages: list[dict[str, str]] = []
+    streaming: bool = False
+    error: str = ""
+
+    last_model: str = ""
+    last_input_tokens: int = 0
+    last_output_tokens: int = 0
+    models_source: str = "fallback"
+
+    @rx.event
+    async def load_models(self):
+        """Pull the live model catalog from OrcaRouter; fall back to the curated
+        flagship list if the network is unavailable so the demo always boots."""
+        try:
+            async with httpx.AsyncClient(timeout=10.0) as client:
+                resp = await client.get(ORCAROUTER_PRICING_URL)
+                resp.raise_for_status()
+                payload = resp.json()
+            entries = payload.get("data") or []
+            live = [
+                e["model_name"]
+                for e in entries
+                if "model_name" in e and is_chat_model(e["model_name"], e)
+            ]
+            if live:
+                merged = ["orcarouter/auto", *sorted(m for m in live if m != "orcarouter/auto")]
+                self.models = merged
+                self.models_source = (
+                    f"live ({len(merged)} models from https://www.orcarouter.ai/models)"
+                )
+                if self.model not in merged:
+                    self.model = merged[0]
+                return
+        except Exception as exc:  # noqa: BLE001 - demo path, surface the reason in UI
+            self.error = f"Could not load live model catalog: {exc}. Using fallback list."
+        self.models = list(FALLBACK_MODELS)
+        self.models_source = (
+            f"fallback ({len(FALLBACK_MODELS)} flagship models; "
+            "see https://www.orcarouter.ai/models for the full catalog)"
+        )
+
+    @rx.event
+    def set_prompt(self, value: str):
+        self.prompt = value
+
+    @rx.event
+    def set_model(self, value: str):
+        self.model = value
+
+    @rx.event
+    def set_custom_model(self, value: str):
+        self.custom_model = value
+
+    @rx.event
+    def apply_custom_model(self):
+        if self.custom_model.strip():
+            self.model = self.custom_model.strip()
+            if self.model not in self.models:
+                self.models = [self.model, *self.models]
+            self.custom_model = ""
+
+    @rx.event
+    def toggle_fallback_route(self, checked: bool):
+        self.use_fallback_route = checked
+
+    @rx.event
+    def set_fallback_models_csv(self, value: str):
+        self.fallback_models_csv = value
+
+    @rx.event
+    def clear_chat(self):
+        self.messages = []
+        self.error = ""
+        self.last_model = ""
+        self.last_input_tokens = 0
+        self.last_output_tokens = 0
+
+    @rx.event(background=True)
+    async def submit(self):
+        async with self:
+            prompt = self.prompt.strip()
+            if not prompt or self.streaming:
+                return
+            api_key = os.environ.get("ORCAROUTER_API_KEY", "").strip()
+            if not api_key:
+                cwd = os.getcwd()
+                env_here = (Path(cwd) / ".env").exists()
+                self.error = (
+                    "ORCAROUTER_API_KEY is not set. Create a .env next to rxconfig.py "
+                    "(or export the env var before running) and restart `reflex run`. "
+                    f"Looked at cwd={cwd}, .env exists there: {env_here}."
+                )
+                return
+            model = self.model
+            self.error = ""
+            self.streaming = True
+            self.messages = [
+                *self.messages,
+                {"role": "user", "content": prompt},
+                {"role": "assistant", "content": ""},
+            ]
+            self.prompt = ""
+            history = list(self.messages[:-1])
+            use_fallback = self.use_fallback_route
+            fallback_csv = self.fallback_models_csv
+
+        client = AsyncOpenAI(
+            api_key=api_key,
+            base_url=ORCAROUTER_BASE_URL,
+            default_headers=ATTRIBUTION_HEADERS,
+        )
+
+        kwargs: dict[str, Any] = {
+            "model": model,
+            "messages": history,
+            "stream": True,
+            "stream_options": {"include_usage": True},
+            "timeout": 300.0,
+        }
+        if not is_reasoning_model(model):
+            kwargs["temperature"] = 0.7
+        if use_fallback:
+            fallback_list = [m.strip() for m in fallback_csv.split(",") if m.strip()]
+            if fallback_list:
+                kwargs["extra_body"] = {"models": fallback_list, "route": "fallback"}
+
+        async def consume(call_kwargs: dict[str, Any]):
+            stream = await client.chat.completions.create(**call_kwargs)
+            async for chunk in stream:
+                if chunk.usage is not None:
+                    async with self:
+                        self.last_input_tokens = chunk.usage.prompt_tokens or 0
+                        self.last_output_tokens = chunk.usage.completion_tokens or 0
+                if not chunk.choices:
+                    continue
+                delta = chunk.choices[0].delta.content or ""
+                if not delta:
+                    continue
+                async with self:
+                    msgs = list(self.messages)
+                    msgs[-1] = {
+                        "role": "assistant",
+                        "content": msgs[-1]["content"] + delta,
+                    }
+                    self.messages = msgs
+
+        try:
+            try:
+                await consume(kwargs)
+            except Exception as exc:  # noqa: BLE001
+                msg = str(exc).lower()
+                if "temperature" in msg and "temperature" in kwargs:
+                    retry_kwargs = {k: v for k, v in kwargs.items() if k != "temperature"}
+                    async with self:
+                        msgs = list(self.messages)
+                        msgs[-1] = {"role": "assistant", "content": ""}
+                        self.messages = msgs
+                    await consume(retry_kwargs)
+                else:
+                    raise
+        except Exception as exc:  # noqa: BLE001 - demo path, surface the reason in UI
+            async with self:
+                self.error = f"{type(exc).__name__}: {exc}"
+                if self.messages and self.messages[-1]["role"] == "assistant":
+                    self.messages = self.messages[:-1]
+        finally:
+            async with self:
+                self.streaming = False
+                self.last_model = model
+
+
+def message_bubble(msg: dict[str, str]) -> rx.Component:
+    is_user = msg["role"] == "user"
+    return rx.box(
+        rx.text(msg["content"], white_space="pre-wrap"),
+        background=rx.cond(is_user, "var(--accent-3)", "var(--gray-3)"),
+        padding="0.75em 1em",
+        border_radius="12px",
+        max_width="80%",
+        align_self=rx.cond(is_user, "flex-end", "flex-start"),
+    )
+
+
+def model_picker() -> rx.Component:
+    return rx.vstack(
+        rx.hstack(
+            rx.select(
+                State.models,
+                value=State.model,
+                on_change=State.set_model,
+                width="100%",
+            ),
+            rx.button(
+                "Refresh",
+                on_click=State.load_models,
+                variant="soft",
+            ),
+            width="100%",
+        ),
+        rx.hstack(
+            rx.input(
+                placeholder="Custom model id (e.g. orcarouter/your-router)",
+                value=State.custom_model,
+                on_change=State.set_custom_model,
+                width="100%",
+            ),
+            rx.button("Use", on_click=State.apply_custom_model, variant="soft"),
+            width="100%",
+        ),
+        rx.hstack(
+            rx.checkbox(
+                "Enable fallback route",
+                checked=State.use_fallback_route,
+                on_change=State.toggle_fallback_route,
+            ),
+            rx.cond(
+                State.use_fallback_route,
+                rx.input(
+                    value=State.fallback_models_csv,
+                    on_change=State.set_fallback_models_csv,
+                    placeholder="comma-separated fallback models",
+                    width="100%",
+                ),
+            ),
+            width="100%",
+        ),
+        rx.text(State.models_source, size="1", color="gray"),
+        width="100%",
+        spacing="2",
+    )
+
+
+def chat_panel() -> rx.Component:
+    return rx.vstack(
+        rx.foreach(State.messages, message_bubble),
+        rx.cond(
+            State.streaming,
+            rx.text("...", color="gray"),
+        ),
+        rx.cond(
+            State.error != "",
+            rx.callout(State.error, icon="triangle_alert", color_scheme="red"),
+        ),
+        width="100%",
+        align="stretch",
+        spacing="3",
+        min_height="40vh",
+    )
+
+
+def input_bar() -> rx.Component:
+    return rx.hstack(
+        rx.input(
+            placeholder="Ask anything...",
+            value=State.prompt,
+            on_change=State.set_prompt,
+            width="100%",
+        ),
+        rx.button(
+            "Send",
+            on_click=State.submit,
+            loading=State.streaming,
+        ),
+        rx.button(
+            "Clear",
+            on_click=State.clear_chat,
+            variant="soft",
+        ),
+        width="100%",
+    )
+
+
+def footer() -> rx.Component:
+    return rx.hstack(
+        rx.text(
+            "Last call: ",
+            rx.cond(State.last_model != "", State.last_model, "--"),
+            "  |  in/out tokens: ",
+            State.last_input_tokens.to_string(),
+            "/",
+            State.last_output_tokens.to_string(),
+            size="1",
+            color="gray",
+        ),
+        rx.spacer(),
+        rx.link(
+            "OrcaRouter docs",
+            href="https://docs.orcarouter.ai",
+            is_external=True,
+            size="1",
+        ),
+        width="100%",
+    )
+
+
+def index() -> rx.Component:
+    return rx.container(
+        rx.vstack(
+            rx.heading("OrcaRouter chat", size="6"),
+            rx.text(
+                "OpenAI-compatible chat against ",
+                rx.code("api.orcarouter.ai/v1"),
+                ". Switch the router/model from the dropdown -- same API key, "
+                "same endpoint.",
+                size="2",
+                color="gray",
+            ),
+            model_picker(),
+            rx.divider(),
+            chat_panel(),
+            input_bar(),
+            footer(),
+            spacing="4",
+            width="100%",
+        ),
+        size="3",
+        padding_y="2em",
+    )
+
+
+app = rx.App(theme=rx.theme(accent_color="violet"))
+app.add_page(index, route="/", on_load=State.load_models)
diff --git a/orcarouter_chat/requirements.txt b/orcarouter_chat/requirements.txt
new file mode 100644
index 00000000..f6b400d2
--- /dev/null
+++ b/orcarouter_chat/requirements.txt
@@ -0,0 +1,4 @@
+reflex>=0.8.0
+openai>=1.55.3
+httpx>=0.27.0
+python-dotenv>=1.0.0
diff --git a/orcarouter_chat/rxconfig.py b/orcarouter_chat/rxconfig.py
new file mode 100644
index 00000000..e1abb3b9
--- /dev/null
+++ b/orcarouter_chat/rxconfig.py
@@ -0,0 +1,6 @@
+import reflex as rx
+
+config = rx.Config(
+    app_name="orcarouter_chat",
+    env_file=".env",
+)

From ba0bb8bf19486332e38522f2d704890c099ef2ca Mon Sep 17 00:00:00 2001
From: "zhenjun.chen" <zhenkun.wang@dotcunited.com>
Date: Sat, 30 May 2026 15:54:25 +0800
Subject: [PATCH 2/2] Address Greptile review and add favicon

- load_models: run as background task (release state lock during HTTP fetch)
- Enter key submits via rx.form (was: button-only)
- pinned custom models persist across catalog refreshes
- assets/favicon.ico: include reflex default
---
 orcarouter_chat/assets/favicon.ico            | Bin 0 -> 4286 bytes
 .../orcarouter_chat/orcarouter_chat.py        | 112 ++++++++++++------
 2 files changed, 76 insertions(+), 36 deletions(-)
 create mode 100644 orcarouter_chat/assets/favicon.ico

diff --git a/orcarouter_chat/assets/favicon.ico b/orcarouter_chat/assets/favicon.ico
new file mode 100644
index 0000000000000000000000000000000000000000..166ae995eaa63fc96771410a758282dc30e925cf
GIT binary patch
literal 4286
zcmeHL>rYc>81ELdEe;}zmYd}cUgmJRfwjUwD1`#s5KZP>mMqza#Viv|_7|8f+0+bX
zHuqusuw-7Ca`DTu#4U4^o2bjO#K>4%N?Wdi*wZ3Vx%~Ef4}D1`U_EM<ED`eKIp@9o
zp65Bw<qbOBQ~XU%)``Emx+tAauhZ$)6CBbN5Mo^Y;oQQXF-IT%Pq;&UB^J~Bj=dja
zgx_&57F)a2m^@!dxyH|D2{|w4LZzIOd!-Cr6Yg1_;kWm~`;Qy9gYeos@CEf)>Rg3u
z#2#M|V>}}q-@<vp;pM&w_f25f58U*rm>IaO@{9R}d*u7f&~5HfxSkmHVcazU#i30H
zAGxQ<ed9tizB_yrXFofRQ-_b?!nda|(KD#(Ao-*e{t){bzx)QLJ~@hWpVr{y$4B98
zzlMN&2*Q_gZ8)jWcf#f$$h%JW9CBC1W7E^i@m@hGW<0}CY;*R@@1**;yB|uI3$Jb5
zip|eN!W0#QtYs0nbn+}P<b^mh9Iu@Bc6qo*L1XRL*v@k*Qr00iIt~XbsxadohHnvm
zzmxIa<;FYP@=>5Spe!j9`KuGqR@aExK`-}sH1jvqoIp<GYFHC9sD~a0$|~=}KcMpO
z%g#k!bUaGdrXhD_EZWXI;eQ<dHwph+D>3C7Vm)9Tu=UPE;j^esN~a6^a$ZILngo;^
zGLXl(ZFyY&U!li`6}y-hUQ99v?s`U4O!kgog74FPw-9g+V)qs!jFGEQyvBf><<X4)
z20)EJ?eQNPe<sG#`-N7xTd%=(u^o=zI*7}#6Sj+&;rN~MmsWgGwhMc=8u6|%AA2@$
z!_}srFw;N!@bMq9T8(8(Y%(nIDX=7FqL}$mV#wrkhKdr7nGNZ%rmTnk*A|RBS+_eK
z@c!+D!n)(@Ub<e&oDY>U|E2vRmx|+(VI~S=lT?@~C5pvZOd`x{Q_+3tG6H=gtdWcf
z)+7-Zp=UqH^J4sk<ladXkZUKo1YeQhRKYRUoT7wOI4^bJZttkdIo>^>_G-Ufn-2Hz
z2mN12|C{5}U`^eCQu<l=+M2RKMOo@bSomI^z6rLUo8h;)aO-*(l<PM3!Colz!-Lo@
z*WAM&tbeAcSnMw<$56*#=xM$JSIbp6Tdu**cyv(qwEcl@j_<d;j;a@5#@=ibDqq-w
zD~&&5TJ+6FtiML)Uv>Fz=F%wp@}SzA1MHEaM^CtJs<{}Tzu$bx2orTKiedgmtVGM{
zdd#vX`&cuiec|My_KW;y{Ryz2kFu9}=~us6hvx1ZqQCk(d+>HP>ks>mmHCjjDh{pe
zKQkKpk0SeDX#XMqf$}QV{z=xrN!mQczJAvud@;zFqaU1ocq==Py)qsa=8UKrt!J7r
z{RsTo^rgtZo%$rak)DN*D)!(Y^$@yL6Nd=#eu&?unzhH8yq>v{gkt8xcG3S%H)-y_
zqQ1|v|JT$0R~Y}omg2Y+nDvR+K|kzR5i^fmKF>j~N;A35Vr`JWh4yRqKl#P|qlx?`
z@|CmBiP}<RpdN|oD7g<x6VgyB@|52{KRN;Jr_XD)-^Y85djC4|1vcoO<#&w1w#YT?
zD|6URDPdaVIa{n_zsy?pJet3+S8WmZ;c#&;=l#52O){@;u$I>ysYO%m2{eBG6&ix5
zr#u((F2{vb=W4jNmTQh3M^F2o80T49?w>*rv0mt)-o1y!{hRk`E#UVPdna6jnz`rw
dKpn)r^--YJZpr;bYU`N~>#v3X5BRU&{{=gv-{1fM

literal 0
HcmV?d00001

diff --git a/orcarouter_chat/orcarouter_chat/orcarouter_chat.py b/orcarouter_chat/orcarouter_chat/orcarouter_chat.py
index 93137bf1..06114797 100644
--- a/orcarouter_chat/orcarouter_chat/orcarouter_chat.py
+++ b/orcarouter_chat/orcarouter_chat/orcarouter_chat.py
@@ -115,6 +115,7 @@ class State(rx.State):
 
     models: list[str] = list(FALLBACK_MODELS)
     model: str = FALLBACK_MODELS[0]
+    pinned_models: list[str] = []
     custom_model: str = ""
     use_fallback_route: bool = False
     fallback_models_csv: str = "openai/gpt-5.5, anthropic/claude-opus-4.7"
@@ -129,10 +130,20 @@ class State(rx.State):
     last_output_tokens: int = 0
     models_source: str = "fallback"
 
-    @rx.event
+    @rx.event(background=True)
     async def load_models(self):
         """Pull the live model catalog from OrcaRouter; fall back to the curated
-        flagship list if the network is unavailable so the demo always boots."""
+        flagship list if the network is unavailable so the demo always boots.
+
+        Runs as a background task so the 10s HTTP fetch never holds the state
+        lock -- the UI stays responsive while the catalog loads.
+        """
+        async with self:
+            pinned_snapshot = list(self.pinned_models)
+            current_model = self.model
+
+        live_merged: list[str] | None = None
+        error_msg = ""
         try:
             async with httpx.AsyncClient(timeout=10.0) as client:
                 resp = await client.get(ORCAROUTER_PRICING_URL)
@@ -145,21 +156,35 @@ async def load_models(self):
                 if "model_name" in e and is_chat_model(e["model_name"], e)
             ]
             if live:
-                merged = ["orcarouter/auto", *sorted(m for m in live if m != "orcarouter/auto")]
-                self.models = merged
-                self.models_source = (
-                    f"live ({len(merged)} models from https://www.orcarouter.ai/models)"
-                )
-                if self.model not in merged:
-                    self.model = merged[0]
-                return
+                live_merged = [
+                    "orcarouter/auto",
+                    *sorted(m for m in live if m != "orcarouter/auto"),
+                ]
         except Exception as exc:  # noqa: BLE001 - demo path, surface the reason in UI
-            self.error = f"Could not load live model catalog: {exc}. Using fallback list."
-        self.models = list(FALLBACK_MODELS)
-        self.models_source = (
-            f"fallback ({len(FALLBACK_MODELS)} flagship models; "
-            "see https://www.orcarouter.ai/models for the full catalog)"
-        )
+            error_msg = f"Could not load live model catalog: {exc}. Using fallback list."
+
+        if live_merged is not None:
+            merged = live_merged
+            source = f"live ({len(merged)} models from https://www.orcarouter.ai/models)"
+        else:
+            merged = list(FALLBACK_MODELS)
+            source = (
+                f"fallback ({len(FALLBACK_MODELS)} flagship models; "
+                "see https://www.orcarouter.ai/models for the full catalog)"
+            )
+
+        for p in pinned_snapshot:
+            if p not in merged:
+                merged.append(p)
+
+        new_model = current_model if current_model in merged else merged[0]
+
+        async with self:
+            self.models = merged
+            self.model = new_model
+            self.models_source = source
+            if error_msg:
+                self.error = error_msg
 
     @rx.event
     def set_prompt(self, value: str):
@@ -175,11 +200,15 @@ def set_custom_model(self, value: str):
 
     @rx.event
     def apply_custom_model(self):
-        if self.custom_model.strip():
-            self.model = self.custom_model.strip()
-            if self.model not in self.models:
-                self.models = [self.model, *self.models]
-            self.custom_model = ""
+        candidate = self.custom_model.strip()
+        if not candidate:
+            return
+        if candidate not in self.pinned_models:
+            self.pinned_models = [*self.pinned_models, candidate]
+        if candidate not in self.models:
+            self.models = [candidate, *self.models]
+        self.model = candidate
+        self.custom_model = ""
 
     @rx.event
     def toggle_fallback_route(self, checked: bool):
@@ -197,6 +226,10 @@ def clear_chat(self):
         self.last_input_tokens = 0
         self.last_output_tokens = 0
 
+    @rx.event
+    def submit_from_form(self, _form_data: dict[str, Any]):
+        return State.submit
+
     @rx.event(background=True)
     async def submit(self):
         async with self:
@@ -371,23 +404,30 @@ def chat_panel() -> rx.Component:
 
 
 def input_bar() -> rx.Component:
-    return rx.hstack(
-        rx.input(
-            placeholder="Ask anything...",
-            value=State.prompt,
-            on_change=State.set_prompt,
+    return rx.form(
+        rx.hstack(
+            rx.input(
+                name="prompt",
+                placeholder="Ask anything...",
+                value=State.prompt,
+                on_change=State.set_prompt,
+                width="100%",
+            ),
+            rx.button(
+                "Send",
+                type="submit",
+                loading=State.streaming,
+            ),
+            rx.button(
+                "Clear",
+                on_click=State.clear_chat,
+                variant="soft",
+                type="button",
+            ),
             width="100%",
         ),
-        rx.button(
-            "Send",
-            on_click=State.submit,
-            loading=State.streaming,
-        ),
-        rx.button(
-            "Clear",
-            on_click=State.clear_chat,
-            variant="soft",
-        ),
+        on_submit=State.submit_from_form,
+        reset_on_submit=False,
         width="100%",
     )