Add Flask web UI, Docker Compose, core engine + tests

- physcom core: CLI, 5-pass pipeline, SQLite repo, 37 tests
- physcom_web: Flask app with HTMX for entity/domain/pipeline/results CRUD
- Docker Compose: web + cli services sharing a named volume for the DB
- Clean up local settings to use wildcard permissions

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
Simonson, Andrew
2026-02-18 13:59:53 -06:00
parent 6e0f82835a
commit 8118a62242
54 changed files with 3505 additions and 1 deletions

72
tests/test_pipeline.py Normal file
View File

@@ -0,0 +1,72 @@
"""Tests for the multi-pass pipeline."""
from physcom.engine.constraint_resolver import ConstraintResolver
from physcom.engine.scorer import Scorer
from physcom.engine.pipeline import Pipeline
from physcom.llm.providers.mock import MockLLMProvider
def test_pass1_filters_impossible_combos(seeded_repo):
"""Pass 1 should block known-impossible combinations (e.g., solar sail + walking)."""
domain = seeded_repo.get_domain("urban_commuting")
resolver = ConstraintResolver()
scorer = Scorer(domain)
pipeline = Pipeline(seeded_repo, resolver, scorer)
result = pipeline.run(domain, ["platform", "power_source"], passes=[1])
assert result.total_generated == 81
assert result.pass1_blocked > 0
assert result.pass1_valid + result.pass1_conditional + result.pass1_blocked == 81
def test_pass123_produces_scored_results(seeded_repo):
"""Passes 1-3 should produce a scored shortlist."""
domain = seeded_repo.get_domain("urban_commuting")
resolver = ConstraintResolver()
scorer = Scorer(domain)
pipeline = Pipeline(seeded_repo, resolver, scorer)
result = pipeline.run(
domain, ["platform", "power_source"],
score_threshold=0.01, passes=[1, 2, 3, 5],
)
assert result.pass2_estimated > 0
assert result.pass3_above_threshold > 0
def test_pass4_with_mock_llm(seeded_repo):
"""Pass 4 should annotate with LLM review."""
domain = seeded_repo.get_domain("urban_commuting")
resolver = ConstraintResolver()
scorer = Scorer(domain)
mock_llm = MockLLMProvider(default_estimates={
"speed": 50.0, "cost_efficiency": 0.5, "safety": 0.6,
"availability": 0.7, "range_fuel": 200.0,
})
pipeline = Pipeline(seeded_repo, resolver, scorer, llm=mock_llm)
result = pipeline.run(
domain, ["platform", "power_source"],
score_threshold=0.01, passes=[1, 2, 3, 4, 5],
)
assert result.pass4_reviewed > 0
def test_blocked_combos_not_scored(seeded_repo):
"""Blocked combinations should not make it to scoring."""
domain = seeded_repo.get_domain("urban_commuting")
resolver = ConstraintResolver()
scorer = Scorer(domain)
pipeline = Pipeline(seeded_repo, resolver, scorer)
result = pipeline.run(
domain, ["platform", "power_source"],
score_threshold=0.0, passes=[1, 2, 3, 5],
)
# Estimated count should be less than total (blocked ones filtered)
assert result.pass2_estimated < result.total_generated
assert result.pass2_estimated == result.pass1_valid + result.pass1_conditional