Add pluggable LLM support with Gemini provider

- Add LLMProvider registry (llm/registry.py) that builds a provider from
  env vars (LLM_PROVIDER, GEMINI_API_KEY, GEMINI_MODEL)
- Add GeminiLLMProvider using the google-genai SDK
- Wire build_llm_provider() into CLI and web pipeline route (replacing llm=None)
- Wrap pass 2 and pass 4 LLM calls in per-combo try/except so API errors
  skip individual combos rather than aborting the whole run
- Add gemini optional dep to pyproject.toml; Dockerfile installs [web,gemini]
- Document env vars in .env.example and README
- Lower requires-python to >=3.10 to match installed system Python

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
2026-02-18 22:04:35 -06:00
parent f1b3c75190
commit 20dae0dce3
10 changed files with 204 additions and 40 deletions

View File

@@ -0,0 +1,57 @@
"""Gemini LLM provider via google-genai SDK."""
from __future__ import annotations
import json
import re
from physcom.llm.base import LLMProvider
from physcom.llm.prompts import PHYSICS_ESTIMATION_PROMPT, PLAUSIBILITY_REVIEW_PROMPT
class GeminiLLMProvider(LLMProvider):
    """LLM provider backed by Google Gemini.

    Uses the google-genai SDK (optional dependency, install with
    ``pip install 'physcom[gemini]'``) to fill in the two LLM hooks of
    :class:`LLMProvider`: numeric physics estimation and a free-text
    plausibility review.
    """

    def __init__(self, api_key: str, model: str = "gemini-2.0-flash") -> None:
        """Create a Gemini client.

        Args:
            api_key: Google AI Studio API key.
            model: Gemini model name; defaults to a fast/cheap model.

        Raises:
            ImportError: if the optional google-genai SDK is not installed.
        """
        try:
            from google import genai
        except ImportError as exc:
            # Chain explicitly so the original import failure stays visible.
            raise ImportError(
                "google-genai is required: pip install 'physcom[gemini]'"
            ) from exc
        self._client = genai.Client(api_key=api_key)
        self._model = model

    def estimate_physics(
        self, combination_description: str, metrics: list[str]
    ) -> dict[str, float]:
        """Ask Gemini for a score per metric; returns metric -> float."""
        prompt = PHYSICS_ESTIMATION_PROMPT.format(
            description=combination_description,
            metrics=", ".join(metrics),
        )
        response = self._client.models.generate_content(
            model=self._model, contents=prompt
        )
        # response.text may be None (e.g. blocked/empty candidate);
        # _parse_json tolerates that and falls back to defaults.
        return self._parse_json(response.text, metrics)

    def review_plausibility(
        self, combination_description: str, scores: dict[str, float]
    ) -> str:
        """Ask Gemini for a short free-text review of the given scores."""
        scores_str = "\n".join(f"- {k}: {v:.3f}" for k, v in scores.items())
        prompt = PLAUSIBILITY_REVIEW_PROMPT.format(
            description=combination_description,
            scores=scores_str,
        )
        response = self._client.models.generate_content(
            model=self._model, contents=prompt
        )
        # Guard against a None text (blocked/empty response) instead of
        # crashing on .strip().
        return (response.text or "").strip()

    def _parse_json(self, text: str | None, metrics: list[str]) -> dict[str, float]:
        """Strip markdown fences and parse JSON; fall back to 0.5 per metric on error.

        Only keys listed in *metrics* are kept; values are coerced to float.
        Any parse failure — including valid JSON that is not an object,
        which previously escaped the except clause as AttributeError —
        yields the neutral 0.5 default for every metric.
        """
        cleaned = re.sub(r"```(?:json)?\s*", "", text or "").strip().rstrip("`").strip()
        try:
            data = json.loads(cleaned)
            if not isinstance(data, dict):
                # e.g. the model returned a bare list/number.
                raise ValueError("expected a JSON object")
            return {k: float(v) for k, v in data.items() if k in metrics}
        except (json.JSONDecodeError, ValueError, TypeError):
            return {m: 0.5 for m in metrics}

View File

@@ -0,0 +1,30 @@
"""Build an LLMProvider from environment variables."""
from __future__ import annotations
import os
from physcom.llm.base import LLMProvider
def build_llm_provider() -> LLMProvider | None:
    """Return an LLMProvider based on env vars, or None if not configured.

    Environment variables:
        LLM_PROVIDER   — provider name ('gemini'; more can be added)
        GEMINI_API_KEY — required when LLM_PROVIDER=gemini
        GEMINI_MODEL   — optional Gemini model name (default: gemini-2.0-flash)

    Raises:
        ValueError: on an unknown provider name, or when the selected
            provider is missing its required credentials.
    """
    name = os.environ.get("LLM_PROVIDER", "").strip().lower()
    if not name:
        # LLM support is opt-in: an unset/empty LLM_PROVIDER means "disabled".
        return None
    if name != "gemini":
        raise ValueError(f"Unknown LLM_PROVIDER: {name!r}. Supported: gemini")

    key = os.environ.get("GEMINI_API_KEY", "")
    if not key:
        raise ValueError("LLM_PROVIDER=gemini requires GEMINI_API_KEY to be set")

    # Imported lazily so the optional google-genai dependency is only
    # needed when Gemini is actually selected.
    from physcom.llm.providers.gemini import GeminiLLMProvider

    return GeminiLLMProvider(
        api_key=key,
        model=os.environ.get("GEMINI_MODEL", "gemini-2.0-flash"),
    )