# Real Stack Interoperability

Source: examples/real_stack_interoperability.py

## Introduction

Run one packaged problem from design-research-problems through a public design-research-agents baseline and validate the exported events.csv contract with design-research-analysis’s artifact-first integration API.

## Technical Implementation

  1. Bootstrap sibling src/ directories from the local workspace when present.

  2. Execute a one-run study that uses a packaged optimization problem together with SeededRandomBaselineAgent.

  3. Export canonical artifacts and validate the event table through the analysis package’s artifact-first integration contract.

  1from __future__ import annotations
  2
  3import importlib
  4import sys
  5from pathlib import Path
  6
  7import design_research_experiments as drex
  8
  9
 10def _bootstrap_sibling_sources() -> None:
 11    """Add sibling package `src/` directories when the repos are checked out locally."""
 12    workspace_root = Path(__file__).resolve().parents[2]
 13    for repo_name in (
 14        "design-research-problems",
 15        "design-research-agents",
 16        "design-research-analysis",
 17    ):
 18        src_path = workspace_root / repo_name / "src"
 19        src_path_text = str(src_path)
 20        if src_path.exists() and src_path_text not in sys.path:
 21            sys.path.insert(0, src_path_text)
 22
 23
 24def _load_stack_modules() -> dict[str, object] | None:
 25    """Import sibling stack packages when available from the local workspace."""
 26    _bootstrap_sibling_sources()
 27    try:
 28        problems_module = importlib.import_module("design_research_problems")
 29        importlib.import_module("design_research_agents")
 30    except ImportError as exc:
 31        print(f"Real stack example skipped: {exc}")
 32        return None
 33
 34    try:
 35        analysis_module = importlib.import_module("design_research_analysis")
 36        analysis_integration = importlib.import_module("design_research_analysis.integration")
 37    except ImportError as exc:
 38        print(f"Real stack example skipped: {exc}")
 39        return None
 40
 41    return {
 42        "problems": problems_module,
 43        "analysis": analysis_module,
 44        "analysis_integration": analysis_integration,
 45    }
 46
 47
 48def main() -> None:
 49    """Run one real interoperability path across the sibling libraries."""
 50    modules = _load_stack_modules()
 51    if modules is None:
 52        return
 53
 54    problems_module = modules["problems"]
 55    analysis_module = modules["analysis"]
 56    analysis_integration = modules["analysis_integration"]
 57    problem_id = "gmpb_default_dynamic_min"
 58    packaged_problem = problems_module.get_problem(problem_id)
 59    problem_packet = drex.resolve_problem(problem_id)
 60
 61    study = drex.Study(
 62        study_id="real-stack-interoperability",
 63        title="Real stack interoperability",
 64        description="Packaged problem + public agent + validated analysis handoff.",
 65        output_dir=Path("artifacts") / "real-stack-interoperability",
 66        problem_ids=(problem_id,),
 67        agent_specs=("SeededRandomBaselineAgent",),
 68        outcomes=(
 69            drex.OutcomeSpec(
 70                name="primary_outcome",
 71                source_table="runs",
 72                column="primary_outcome",
 73                aggregation="mean",
 74                primary=True,
 75            ),
 76        ),
 77        run_budget=drex.RunBudget(replicates=1, parallelism=1, max_runs=1),
 78        primary_outcomes=("primary_outcome",),
 79    )
 80    conditions = drex.build_design(study)
 81    run_results = drex.run_study(
 82        study,
 83        conditions=conditions,
 84        problem_registry={problem_id: problem_packet},
 85        show_progress=False,
 86    )
 87    exported_paths = drex.export_analysis_tables(
 88        study,
 89        conditions=conditions,
 90        run_results=run_results,
 91        output_dir=study.output_dir / "analysis",
 92        validate_with_analysis_package=True,
 93    )
 94    loaded_artifacts = analysis_integration.load_experiment_artifacts(exported_paths["events.csv"])
 95    report = analysis_integration.validate_experiment_events(exported_paths["events.csv"])
 96    primary_metric_rows = analysis_module.build_condition_metric_table(
 97        loaded_artifacts["runs.csv"],
 98        metric="primary_outcome",
 99        condition_column="agent_id",
100        conditions=loaded_artifacts["conditions.csv"],
101        evaluations=loaded_artifacts["evaluations.csv"],
102    )
103    run_result = run_results[0]
104
105    print("Problem ID:", packaged_problem.metadata.problem_id)
106    print("Problem family:", packaged_problem.metadata.kind.value)
107    print("Agent:", study.agent_specs[0])
108    print("Completed runs:", len(run_results))
109    print("Run status:", run_result.status.value)
110    print("Output keys:", ", ".join(sorted(run_result.outputs)))
111    print("Primary outcome:", run_result.metrics.get("primary_outcome"))
112    print("Metric rows:", len(primary_metric_rows))
113    print("Event rows valid:", report.is_valid, f"(rows={report.n_rows})")
114    print("Exported artifacts:", ", ".join(path.name for path in exported_paths.values()))
115
116
# Entry point: allow the walkthrough to be executed directly as a script.
if __name__ == "__main__":
    main()

## Expected Results

Run Command

PYTHONPATH=src python examples/real_stack_interoperability.py

The script prints the packaged problem identity, one successful run result, and the exported artifact filenames after the event table passes validation.