Final cleanup: Merge LLM, add Dockerfile

- Merge llm.py + llm_sync.py into a single unified client
- Remove llm_sync.py (llm.py now provides both sync and async)
- Add requests to dependencies
- Add Dockerfile for containerized deployment
- Add .dockerignore

All issues resolved!
2026-03-13 04:47:01 +00:00
parent 8e92e99205
commit 6766e93c3d
5 changed files with 93 additions and 143 deletions
@@ -0,0 +1,40 @@
+# Git
+.git
+.gitignore
+
+# Python
+__pycache__
+*.py[cod]
+*$py.class
+*.so
+.Python
+venv/
+.venv/
+env/
+.env
+*.egg-info/
+dist/
+build/
+
+# IDE
+.vscode/
+.idea/
+*.swp
+*.swo
+
+# Testing
+.pytest_cache/
+.coverage
+htmlcov/
+
+# OS
+.DS_Store
+Thumbs.db
+
+# Docs
+*.md
+!README.md
+
+# Local
+*.log
+*.tmp
@@ -0,0 +1,51 @@
+# =============================================================================
+# Opus Orchestrator AI - Dockerfile
+# =============================================================================
+# Build: docker build -t opus-orchestrator .
+# Run:   docker run -p 8080:8080 -p 8000:8000 -e OPENAI_API_KEY=sk-... opus-orchestrator
+# =============================================================================
+
+FROM python:3.12-slim
+
+# Labels
+LABEL maintainer="mark@thefoldwithin.earth"
+LABEL description="AI-powered book generation system"
+LABEL version="0.2.0"
+
+# Set working directory
+WORKDIR /app
+
+# Install system dependencies
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    build-essential \
+    curl \
+    && rm -rf /var/lib/apt/lists/*
+
+# Copy project files
+COPY pyproject.toml README.md install.sh ./
+COPY opus_orchestrator/ ./opus_orchestrator/
+COPY config.example.yaml ./
+
+# Create virtual environment
+RUN python -m venv /opt/venv
+ENV PATH="/opt/venv/bin:$PATH"
+
+# Install Python dependencies
+RUN pip install --no-cache-dir -e ".[all]"
+
+# Create non-root user
+RUN useradd -m -u 1000 opus && \
+    chown -R opus:opus /app
+
+# Switch to non-root user
+USER opus
+
+# Expose ports
+EXPOSE 8000 8080
+
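+# Health check: probes /health on port 8000. NOTE(review): the default CMD below serves the UI on 8080 — confirm a service actually listens on 8000.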
+HEALTHCHECK --interval=30s --timeout=10s --start-period=5s --retries=3 \
+    CMD curl -f http://localhost:8000/health || exit 1
+
+# Default command: start web UI
+CMD ["python", "-m", "opus_orchestrator", "ui", "--port", "8080"]
@@ -25,7 +25,7 @@ from langgraph.graph import StateGraph, END
 from langgraph.checkpoint.memory import MemorySaver

 from opus_orchestrator.frameworks import get_framework_prompt, StoryFramework
-from opus_orchestrator.utils.llm_sync import LLMClient
+from opus_orchestrator.utils.llm import LLMClient
 from opus_orchestrator.autogen_critique import create_critique_crew


@@ -1,142 +0,0 @@
-"""LLM client for Opus Orchestrator - Synchronous version.
-
-Uses synchronous requests calls to avoid event loop issues with LangGraph.
-"""
-
-import os
-from typing import Any, Optional
-
-import requests
-
-
-class LLMClient:
-    """Synchronous LLM client for making API calls."""
-
-    def __init__(
-        self,
-        api_key: Optional[str] = None,
-        provider: str = "openai",
-        model: str = "gpt-4o",
-        base_url: Optional[str] = None,
-    ):
-        """Initialize LLM client."""
-        self.api_key = api_key or os.environ.get("MINIMAX_API_KEY") or os.environ.get("OPENAI_API_KEY")
-        self.provider = provider
-        self.model = model
-        
-        if base_url:
-            self.base_url = base_url
-        elif provider == "minimax":
-            self.base_url = "https://api.minimax.chat/v1"
-        elif provider == "openai":
-            self.base_url = "https://api.openai.com/v1"
-        else:
-            self.base_url = "https://api.openai.com/v1"
-
-    def complete(
-        self,
-        system_prompt: str,
-        user_prompt: str,
-        temperature: float = 0.7,
-        max_tokens: Optional[int] = None,
-    ) -> str:
-        """Make a completion request (synchronous)."""
-        headers = {
-            "Authorization": f"Bearer {self.api_key}",
-            "Content-Type": "application/json",
-        }
-        
-        if self.provider == "minimax":
-            return self._complete_minimax(
-                system_prompt, user_prompt, temperature, max_tokens, headers
-            )
-        elif self.provider == "openai":
-            return self._complete_openai(
-                system_prompt, user_prompt, temperature, max_tokens, headers
-            )
-        else:
-            raise ValueError(f"Unsupported provider: {self.provider}")
-
-    def _complete_minimax(
-        self,
-        system_prompt: str,
-        user_prompt: str,
-        temperature: float,
-        max_tokens: Optional[int],
-        headers: dict,
-    ) -> str:
-        """Call MiniMax API (synchronous)."""
-        minimax_model = self.model.split("/")[-1] if "/" in self.model else self.model
-        
-        payload = {
-            "model": minimax_model,
-            "messages": [
-                {"role": "system", "content": system_prompt},
-                {"role": "user", "content": user_prompt},
-            ],
-            "temperature": temperature,
-        }
-        
-        if max_tokens:
-            payload["max_tokens"] = max_tokens
-        
-        response = requests.post(
-            f"{self.base_url}/text/chatcompletion_v2",
-            headers=headers,
-            json=payload,
-            timeout=120,
-        )
-        response.raise_for_status()
-        
-        data = response.json()
-        
-        if "choices" in data:
-            return data["choices"][0]["message"]["content"]
-        else:
-            raise Exception(f"Unexpected MiniMax response: {data}")
-
-    def _complete_openai(
-        self,
-        system_prompt: str,
-        user_prompt: str,
-        temperature: float,
-        max_tokens: Optional[int],
-        headers: dict,
-    ) -> str:
-        """Call OpenAI API (synchronous)."""
-        payload = {
-            "model": self.model,
-            "messages": [
-                {"role": "system", "content": system_prompt},
-                {"role": "user", "content": user_prompt},
-            ],
-            "temperature": temperature,
-        }
-        
-        if max_tokens:
-            payload["max_tokens"] = max_tokens
-        
-        response = requests.post(
-            f"{self.base_url}/chat/completions",
-            headers=headers,
-            json=payload,
-            timeout=120,
-        )
-        response.raise_for_status()
-        
-        data = response.json()
-        return data["choices"][0]["message"]["content"]
-
-
-# Convenience function
-def get_llm_client(config: Optional[Any] = None) -> LLMClient:
-    """Get an LLM client from config."""
-    from opus_orchestrator.config import get_config
-    
-    cfg = config or get_config()
-    
-    return LLMClient(
-        api_key=cfg.agent.api_key,
-        provider=cfg.agent.provider,
-        model=cfg.agent.model,
-    )
@@ -24,6 +24,7 @@ dependencies = [
    "pydantic-ai>=0.0.0",
    "pydantic>=2.0.0",
    "httpx>=0.27.0",
+    "requests>=2.31.0",
    "pygithub>=2.0.0",
    "pyyaml>=6.0",
    "tiktoken>=0.7.0",