zeroshotbuilders · flylo · May 12, 2026 · May 12, 2026 · May 12, 2026 · May 12, 2026
diff --git a/.ai/ai-agents.md b/.ai/ai-agents.md
@@ -10,7 +10,7 @@ multiple implementations:
 - `service_openai.py`: production implementation using the OpenAI Agents SDK
 - `agent_service.py` (`AiAgentServiceLocal`): mocked implementation for testing non-AI portions of workflows
   (orchestration, task management, error handling, etc)
-- `service_ollama.py`: hits a local Ollama deployment for development/testing with local models
+- `service_openai_compat.py`: hits any OpenAI-compatible API (Ollama, OpenRouter, etc.)
 
 ## Factory
 
@@ -21,8 +21,9 @@ from zeroshot_agentic_workflows import AiAgentConfig, AiAgentFactory, AiAgentPro
 
 config = AiAgentConfig(
     local=False,
-    provider=AiAgentProvider.OLLAMA,
-    ollama_base_url="http://localhost:11434",
+    provider=AiAgentProvider.OPENAI_COMPAT,
+    openai_compat_base_url="http://localhost:11434/v1",
+    openai_compat_api_key="ollama",
     default_model="qwen2.5:latest",
 )
 factory = AiAgentFactory(config)

diff --git a/.ai/skills/testing-guide.md b/.ai/skills/testing-guide.md
@@ -14,7 +14,7 @@ Read these docs for full details:
 ### Test Tiers
 - **Unit** (`tests/unit/`): always runs, no I/O
 - **Integration** (`tests/integration/`): `--integration` flag, real Postgres/Redis via testcontainers
-- **Eval** (`tests/evals/`): `--eval` flag, real LLM inference via Ollama
+- **Eval** (`tests/evals/`): `--eval` flag, real LLM inference via an OpenAI-compatible API
 
 ### Testcontainers
 ```python

diff --git a/.ai/testing.md b/.ai/testing.md
@@ -8,7 +8,7 @@ Tests are organized into three tiers, each gated by a CLI flag:
 |------|-----------|------|---------------|
 | Unit | `tests/unit/` | *(always runs)* | Pure logic, no I/O |
 | Integration | `tests/integration/` | `--integration` | Real Postgres/Redis via testcontainers |
-| Eval | `tests/evals/` | `--eval` | Real LLM inference via Ollama |
+| Eval | `tests/evals/` | `--eval` | Real LLM inference via an OpenAI-compatible API |
 
 Run them:
 ```bash

diff --git a/packages/agent-experiments/assets/config.yaml b/packages/agent-experiments/assets/config.yaml
@@ -1,3 +1,3 @@
-provider: ollama
+provider: openai_compat
 defaultModel: "qwen2.5:latest"
 port: 3000
diff --git a/packages/agent-experiments/tests/evals/conftest.py b/packages/agent-experiments/tests/evals/conftest.py
@@ -12,11 +12,12 @@
 
 @pytest_asyncio.fixture(scope="module", loop_scope="module")
 async def salary_agent():
-    """Create a SalaryExtractionAgent wired to local Ollama."""
+    """Create a SalaryExtractionAgent wired to a local OpenAI-compatible API."""
     config = AiAgentConfig(
         local=False,
-        provider=AiAgentProvider.OLLAMA,
-        ollama_base_url="http://localhost:11434",
+        provider=AiAgentProvider.OPENAI_COMPAT,
+        openai_compat_base_url="http://localhost:11434/v1",
+        openai_compat_api_key="ollama",
         default_model="qwen2.5:latest",
     )
     factory = AiAgentFactory(config)

diff --git a/packages/agent-experiments/tests/evals/test_salary_extraction.py b/packages/agent-experiments/tests/evals/test_salary_extraction.py
@@ -1,12 +1,12 @@
 """Salary extraction eval suite.
 
-These tests exercise real LLM inference via Ollama and are skipped
-by default.  Run with:
+These tests exercise real LLM inference via an OpenAI-compatible API
+and are skipped by default.  Run with:
 
     uv run pytest --eval packages/agent-experiments/tests/evals/
 
 Requires:
-  - Ollama running locally with ``qwen2.5:latest`` pulled
+  - An OpenAI-compatible API running locally (e.g. Ollama with ``qwen2.5:latest`` pulled)
   - PDF fixtures generated (run generate_fixtures.py first)
 """
 

diff --git a/packages/agentic-workflows/src/zeroshot_agentic_workflows/__init__.py b/packages/agentic-workflows/src/zeroshot_agentic_workflows/__init__.py
@@ -21,6 +21,7 @@
     generate_tools_reference,
     parse_prompt_frontmatter,
 )
+from .service_openai_compat import AiAgentServiceOpenAICompat
 from .session import (
     CONVERSATION_SESSION_REPOSITORY,
     ConversationItemModel,
@@ -46,6 +47,7 @@
     "AiAgentProvider",
     "AiAgentService",
     "AiAgentServiceLocal",
+    "AiAgentServiceOpenAICompat",
     "AiSessionFactory",
     "ConsensusRunResult",
     "ConsensusStrategy",

diff --git a/packages/agentic-workflows/src/zeroshot_agentic_workflows/agent_service.py b/packages/agentic-workflows/src/zeroshot_agentic_workflows/agent_service.py
@@ -74,15 +74,16 @@ async def create_and_run(
 
 class AiAgentProvider(StrEnum):
     OPENAI = "openai"
-    OLLAMA = "ollama"
+    OPENAI_COMPAT = "openai_compat"
 
 
 @dataclass(frozen=True, slots=True)
 class AiAgentConfig:
     local: bool
     provider: AiAgentProvider = AiAgentProvider.OPENAI
     openai_api_token: str | None = None
-    ollama_base_url: str = "http://localhost:11434"
+    openai_compat_base_url: str | None = None
+    openai_compat_api_key: str | None = None
     default_model: str | None = None
 
 

diff --git a/packages/agentic-workflows/src/zeroshot_agentic_workflows/factory.py b/packages/agentic-workflows/src/zeroshot_agentic_workflows/factory.py
@@ -1,8 +1,8 @@
 from __future__ import annotations
 
 from .agent_service import AiAgentConfig, AiAgentProvider, AiAgentService, AiAgentServiceLocal
-from .service_ollama import AiAgentServiceOllama
 from .service_openai import AiAgentServiceOpenai
+from .service_openai_compat import AiAgentServiceOpenAICompat
 
 
 class AiAgentFactory:
@@ -15,10 +15,15 @@ def make_agent_service(self) -> AiAgentService:
         if self._config.local:
             return AiAgentServiceLocal.get_instance()
 
-        if self._config.provider == AiAgentProvider.OLLAMA:
-            return AiAgentServiceOllama(
-                base_url=self._config.ollama_base_url,
-                default_model=self._config.default_model or "qwen2.5:14b",
+        if self._config.provider == AiAgentProvider.OPENAI_COMPAT:
+            if not self._config.openai_compat_base_url:
+                raise ValueError(
+                    "openai_compat_base_url is required for the OpenAI-compatible provider"
+                )
+            return AiAgentServiceOpenAICompat(
+                base_url=self._config.openai_compat_base_url,
+                api_key=self._config.openai_compat_api_key or "",
+                default_model=self._config.default_model or "",
             )
 
         if self._config.provider == AiAgentProvider.OPENAI:
@@ -32,11 +37,16 @@ def make_agent_service(self) -> AiAgentService:
         raise ValueError(f"Unknown provider: {self._config.provider}")
 
     @staticmethod
-    def make_ollama_service(
-        base_url: str = "http://localhost:11434",
-        default_model: str = "qwen2.5:14b",
-    ) -> AiAgentServiceOllama:
-        return AiAgentServiceOllama(base_url=base_url, default_model=default_model)
+    def make_openai_compat_service(
+        base_url: str,
+        api_key: str,
+        default_model: str,
+    ) -> AiAgentServiceOpenAICompat:
+        return AiAgentServiceOpenAICompat(
+            base_url=base_url,
+            api_key=api_key,
+            default_model=default_model,
+        )
 
     @staticmethod
     def make_openai_service(

diff --git a/...oshot_agentic_workflows/service_ollama.py → ...gentic_workflows/service_openai_compat.py b/...oshot_agentic_workflows/service_ollama.py → ...gentic_workflows/service_openai_compat.py
@@ -13,19 +13,20 @@
 logger = logging.getLogger(__name__)
 
 
-class AiAgentServiceOllama:
-    """Ollama implementation via OpenAI-compatible API."""
+class AiAgentServiceOpenAICompat:
+    """OpenAI-compatible API implementation (Ollama, OpenRouter, etc.)."""
 
     def __init__(
         self,
-        base_url: str = "http://localhost:11434",
-        default_model: str = "qwen2.5:14b",
+        base_url: str,
+        api_key: str,
+        default_model: str,
     ) -> None:
         self._base_url = base_url
         self._default_model = default_model
         self._client = AsyncOpenAI(
-            base_url=f"{base_url}/v1",
-            api_key="ollama",
+            base_url=base_url,
+            api_key=api_key,
         )
 
     def create_agent(self, config: AgentConfig[T]) -> AgentType[T]:

diff --git a/packages/agentic-workflows/tests/unit/test_factory.py b/packages/agentic-workflows/tests/unit/test_factory.py
@@ -29,11 +29,24 @@ def test_openai_provider_requires_token(self) -> None:
         with pytest.raises(ValueError, match="openai_api_token"):
             factory.make_agent_service()
 
-    def test_static_ollama_factory(self) -> None:
-        from zeroshot_agentic_workflows.service_ollama import AiAgentServiceOllama
+    def test_static_openai_compat_factory(self) -> None:
+        from zeroshot_agentic_workflows.service_openai_compat import AiAgentServiceOpenAICompat
 
-        service = AiAgentFactory.make_ollama_service()
-        assert isinstance(service, AiAgentServiceOllama)
+        service = AiAgentFactory.make_openai_compat_service(
+            base_url="http://localhost:11434/v1",
+            api_key="test",
+            default_model="qwen2.5:14b",
+        )
+        assert isinstance(service, AiAgentServiceOpenAICompat)
+
+    def test_openai_compat_provider_requires_base_url(self) -> None:
+        config = AiAgentConfig(
+            local=False,
+            provider=AiAgentProvider.OPENAI_COMPAT,
+        )
+        factory = AiAgentFactory(config)
+        with pytest.raises(ValueError, match="openai_compat_base_url"):
+            factory.make_agent_service()
 
 
 class TestAiSessionFactory:

diff --git a/uv.lock b/uv.lock