feat: Add Minimax API compatibility to Emissary LLM

2026-05-25 19:06:12 +00:00
parent f546e3d8d8
commit 3a2ed2e22b
1 changed files with 46 additions and 13 deletions
@@ -150,20 +150,52 @@ def chat():
    # 1. EMISSARY (Left Hemisphere) generates a response
    emissary_text = ""
    emissary_model = "Mock-Emissary"
    try:
-        emissary_resp = requests.post(EMISSARY_URL, json={
+        minimax_key = os.environ.get("MINIMAX_API_KEY")
-            "model": "deepseek-coder-v2:lite",
+        if minimax_key:
-            "messages": [{"role": "user", "content": prompt}],
+            emissary_model = "MiniMax-M2.7"
-            "stream": False
+            emissary_resp = requests.post(
-        }, timeout=5)
+                "https://api.minimax.io/anthropic/v1/messages", 
-        if emissary_resp.status_code == 200:
+                headers={
-            emissary_data = emissary_resp.json()
+                    "x-api-key": minimax_key,
-            emissary_text = emissary_data.get("message", {}).get("content", "")
+                    "anthropic-version": "2023-06-01",
                    "content-type": "application/json"
                },
                json={
                    "model": "MiniMax-M2.7",
                    "max_tokens": 1024,
                    "messages": [{"role": "user", "content": prompt}]
                },
                timeout=15
            )
            if emissary_resp.status_code == 200:
                emissary_data = emissary_resp.json()
                content_blocks = emissary_data.get("content", [])
                text_blocks = [b.get("text", "") for b in content_blocks if b.get("type") == "text"]
                emissary_text = "".join(text_blocks)
                thinking_blocks = [b.get("thinking", "") for b in content_blocks if b.get("type") == "thinking"]
                if thinking_blocks:
                    emissary_text = f"<i style='color:#666; font-size:0.9em'>[Thinking: {''.join(thinking_blocks).strip()}]</i>\n\n" + emissary_text
            else:
                raise Exception(f"Minimax Error: {emissary_resp.text}")
        else:
-            raise Exception("LLM offline")
+            # Fallback to Ollama
-    except Exception:
+            emissary_model = "deepseek-coder-v2:lite"
-        # Fallback to Mock Emissary if LLM is not running
+            emissary_resp = requests.post(EMISSARY_URL, json={
-        emissary_text = f"[MOCK EMISSARY] I have generated a discrete token response to: '{prompt}'. In a production environment, my static window would be injected with the Master's K_anchor tensors."
+                "model": "deepseek-coder-v2:lite",
                "messages": [{"role": "user", "content": prompt}],
                "stream": False
            }, timeout=5)
            if emissary_resp.status_code == 200:
                emissary_data = emissary_resp.json()
                emissary_text = emissary_data.get("message", {}).get("content", "")
            else:
                raise Exception("LLM offline")
    except Exception as e:
        # Fallback to Mock Emissary if LLMs are not running
        emissary_text = f"[MOCK EMISSARY] Backend unavailable ({str(e)}). But my mathematical phase is stable."
    # 2. MASTER (Right Hemisphere) Integrates the tokens
    # We mathematically tie the Token Clock to the stream of words
@@ -205,7 +237,8 @@ def chat():
            'collapsed': collapsed
        },
        'emissary': {
-            'response': emissary_text
+            'response': emissary_text,
            'model': emissary_model
        }
    })