soderlind · January 11, 2026 23:35
diff --git a/README.md b/README.md
diff --git a/copilot-ralph.py b/copilot-ralph.py
 #!/usr/bin/env python3
 """
 Ralph loop wrapper for GitHub Copilot CLI (programmatic mode).

 It repeatedly runs Copilot with a prompt that targets exactly ONE PRD story,
 then enforces these completion conditions:

 - PRD: all stories are passes=true
 - Tests: story tests pass before flipping passes=true
 - Final tests: final_tests pass before completing
 - Repo state: git working tree is clean (no diff / no uncommitted changes)

 The wrapper persists state in:
 - prd.json (source of truth)
 - progress.txt (append-only transcript)
 - .ralph/state.json (resume metadata)

 Usage example:
  ./copilot-ralph.py --prd prd.json --progress progress.txt --max-iterations 30
 """

 from __future__ import annotations

 import argparse
 import json
 import os
 import subprocess
 import sys
 import time
 from datetime import datetime, timezone
 from pathlib import Path
 from typing import Any, Dict, List, Optional, Tuple

 DEFAULT_COMPLETION = "COMPLETE"


 def now_iso() -> str:
    return datetime.now(timezone.utc).isoformat().replace("+00:00", "Z")


 def log(msg: str) -> None:
    # Always flush so long-running steps don't appear "stuck".
    print(f"[{now_iso()}] {msg}", flush=True)


 def run_streaming(
    cmd: List[str] | str,
    *,
    cwd: Optional[Path] = None,
    check: bool = True,
    label: Optional[str] = None,
 ) -> Tuple[int, str]:
    """Run a command and stream combined stdout/stderr to the terminal.

    Returns (exit_code, combined_output).
    """
    start = time.time()
    proc = subprocess.Popen(
        cmd,
        cwd=str(cwd) if cwd else None,
        text=True,
        stdout=subprocess.PIPE,
        stderr=subprocess.STDOUT,
        shell=isinstance(cmd, str),
    )

    assert proc.stdout is not None
    lines: List[str] = []
    prefix = f"[{label}] " if label else ""

    for line in proc.stdout:
        # Stream to terminal and keep for logs/progress.txt
        lines.append(line.rstrip("\n"))
        print(prefix + line, end="", flush=True)

    rc = proc.wait()
    elapsed = time.time() - start
    if label:
        log(f"{label} finished with exit code {rc} in {elapsed:.1f}s")
    if check and rc != 0:
        raise subprocess.CalledProcessError(rc, cmd, output="\n".join(lines))
    return rc, "\n".join(lines).strip()


 def sh(cmd: List[str], cwd: Optional[Path] = None, check: bool = True) -> subprocess.CompletedProcess:
    return subprocess.run(
        cmd,
        cwd=str(cwd) if cwd else None,
        text=True,
        capture_output=True,
        check=check,
    )


 def sh_shell(command: str, cwd: Optional[Path] = None, check: bool = True) -> subprocess.CompletedProcess:
    # Run via shell for convenience (quotes/pipes). Keep commands trusted.
    return subprocess.run(
        command,
        cwd=str(cwd) if cwd else None,
        text=True,
        capture_output=True,
        check=check,
        shell=True,
    )


 def git_clean() -> bool:
    p = sh(["git", "status", "--porcelain"], check=True)
    return p.stdout.strip() == ""


 def git_porcelain() -> str:
    return sh(["git", "status", "--porcelain"], check=True).stdout.strip()


 def git_diff_stat() -> str:
    return sh(["git", "diff", "--stat"], check=True).stdout.strip()


 def git_branch() -> str:
    p = sh(["git", "rev-parse", "--abbrev-ref", "HEAD"], check=True)
    return p.stdout.strip()


 def ensure_git_repo() -> None:
    sh(["git", "rev-parse", "--is-inside-work-tree"], check=True)


 def load_json(path: Path) -> Dict[str, Any]:
    return json.loads(path.read_text(encoding="utf-8"))


 def save_json(path: Path, data: Dict[str, Any]) -> None:
    path.write_text(json.dumps(data, indent=2, ensure_ascii=False) + "\n", encoding="utf-8")


 def pick_next_story(prd: Dict[str, Any]) -> Optional[Dict[str, Any]]:
    stories = prd.get("stories", [])
    failing = [s for s in stories if not s.get("passes", False)]
    if not failing:
        return None
    failing.sort(key=lambda s: (int(s.get("priority", 9999)), str(s.get("id", ""))))
    return failing[0]


 def union_tests(prd: Dict[str, Any]) -> List[str]:
    seen: List[str] = []
    for s in prd.get("stories", []):
        for t in (s.get("tests") or []):
            if t not in seen:
                seen.append(t)
    return seen


 def run_tests(commands: List[str]) -> Tuple[bool, str]:
    logs: List[str] = []
    for cmd in commands:
        log(f"Running tests: {cmd}")
        logs.append(f"$ {cmd}")
        try:
            _, combined = run_streaming(cmd, check=True, label="tests")
            if combined:
                logs.append(combined)
        except subprocess.CalledProcessError as e:
            combined = (getattr(e, "output", None) or "").strip()
            if combined:
                logs.append(combined)
            logs.append(f"[FAIL] {cmd} exited with {e.returncode}")
            return False, "\n".join(logs)
    return True, "\n".join(logs)


 def append_progress(progress_path: Path, text: str) -> None:
    progress_path.parent.mkdir(parents=True, exist_ok=True)
    with progress_path.open("a", encoding="utf-8") as f:
        f.write(text.rstrip() + "\n")


 def stage_all() -> None:
    sh(["git", "add", "-A"], check=True)


 def commit_if_needed(message: str) -> bool:
    if git_clean():
        return False
    stage_all()
    args = ["git", "commit", "-m", message]
    if os.getenv("RALPH_NO_VERIFY", "").strip() == "1":
        args.append("--no-verify")
    sh(args, check=True)
    return True


 def build_prompt(
    prd: Dict[str, Any],
    story: Dict[str, Any],
    progress_tail: str,
    completion_token: str,
 ) -> str:
    acceptance = "\n".join([f"- {a}" for a in (story.get("acceptance") or [])])
    tests = "\n".join([f"- {t}" for t in (story.get("tests") or [])])

    return f"""You are acting as an autonomous coding agent inside a git repo.

 GOAL
 Implement exactly ONE PRD story per iteration: {story.get("id")} - {story.get("title")}

 ACCEPTANCE CRITERIA
 {acceptance if acceptance.strip() else "- (none provided)"}

 TESTS TO PASS FOR THIS STORY
 {tests if tests.strip() else "- (no tests listed; do not mark passing without adding tests in prd.json)"}

 RULES (NON-NEGOTIABLE)
 1) Work ONLY on this story. Do not start other stories.
 2) Make the smallest set of changes that satisfy acceptance criteria.
 3) Update prd.json: set this story's passes=true ONLY when tests pass.
 4) Ensure repository is left clean (no uncommitted changes) by committing your work.
 5) Do not emit the token {completion_token} unless ALL stories in prd.json are passes=true AND all final tests pass AND git is clean.

 CONTEXT
 - Current branch: {git_branch()}
 - Git status:
 {git_porcelain() or "(clean)"}
 - Diff stat:
 {git_diff_stat() or "(none)"}

 RECENT PROGRESS LOG (tail)
 {progress_tail}

 OUTPUT FORMAT
 - Start with a short plan.
 - Then do the work.
 - End with:
  - "STORY_DONE" if you believe this story is done (tests passing + committed + prd.json updated).
  - Or "STORY_BLOCKED: <reason>" if you cannot proceed.
 - Only end with {completion_token} if absolutely all conditions are met.
 """


 def build_final_tests_fix_prompt(
    prd: Dict[str, Any],
    test_log: str,
    progress_tail: str,
    completion_token: str,
 ) -> str:
    final_tests = prd.get("final_tests") or union_tests(prd)
    tests_list = "\n".join([f"- {t}" for t in final_tests])
    # Truncate test log to last 80 lines to avoid overly long prompts
    test_log_lines = test_log.splitlines()
    if len(test_log_lines) > 80:
        test_log = "\n".join(test_log_lines[-80:])

    return f"""You are acting as an autonomous coding agent inside a git repo.

 GOAL
 All PRD stories are marked as passing, but the FINAL TESTS are failing. Fix the failing tests.

 FAILING TESTS
 {tests_list}

 TEST OUTPUT (failures)
 {test_log}

 RULES (NON-NEGOTIABLE)
 1) Analyze the test failures and fix the underlying code issues.
 2) Do NOT modify the tests unless they are clearly incorrect.
 3) Make the smallest set of changes that fix the failures.
 4) Ensure repository is left clean (no uncommitted changes) by committing your work.
 5) Do not emit the token {completion_token} unless all final tests pass AND git is clean.

 CONTEXT
 - Current branch: {git_branch()}
 - Git status:
 {git_porcelain() or "(clean)"}
 - Diff stat:
 {git_diff_stat() or "(none)"}

 RECENT PROGRESS LOG (tail)
 {progress_tail}

 OUTPUT FORMAT
 - Start with a short analysis of what's failing and why.
 - Then fix the code.
 - Commit your changes.
 - End with "FIXES_APPLIED" if you believe the fixes are done.
 - Only end with {completion_token} if all final tests pass AND git is clean.
 """


 def call_copilot(copilot_bin: str, prompt: str, extra_args: List[str]) -> str:
    # Copilot CLI programmatic mode: copilot -p "prompt"
    cmd = [copilot_bin, "-p", prompt] + extra_args
    log("Calling Copilot (programmatic mode)...")
    try:
        rc, combined = run_streaming(cmd, check=False, label="copilot")
    except FileNotFoundError:
        return f"[ERROR] Copilot binary not found: {copilot_bin}"
    if rc != 0:
        combined = (combined + f"\n\n[ERROR] copilot exited with {rc}").strip()
    return combined


 def main() -> int:
    ap = argparse.ArgumentParser()
    ap.add_argument("--prd", type=Path, default=Path("prd.json"))
    ap.add_argument("--progress", type=Path, default=Path("progress.txt"))
    ap.add_argument("--state", type=Path, default=Path(".ralph/state.json"))
    ap.add_argument("--max-iterations", type=int, default=20)
    ap.add_argument("--sleep", type=float, default=0.3)
    ap.add_argument("--completion-token", type=str, default=DEFAULT_COMPLETION)
    ap.add_argument("--copilot-bin", type=str, default="copilot")
    ap.add_argument(
        "--copilot-arg",
        action="append",
        default=[],
        help="Extra args passed through to copilot (repeatable).",
    )
    args = ap.parse_args()

    log("Starting Ralph loop")
    ensure_git_repo()

    log(f"Using PRD: {args.prd}")
    log(f"Using progress log: {args.progress}")
    log(f"Using state file: {args.state}")
    log(f"Max iterations: {args.max_iterations}")
    log(f"Completion token: {args.completion_token}")

    args.state.parent.mkdir(parents=True, exist_ok=True)

    if not git_clean():
        print(
            "Refusing to start: git working tree is not clean.\nRun: git status --porcelain",
            file=sys.stderr,
        )
        return 2

    if args.state.exists():
        state = load_json(args.state)
    else:
        state = {"created_at": now_iso(), "runs": 0}
        save_json(args.state, state)
        log("Created new state file")

    for i in range(1, args.max_iterations + 1):
        log(f"Iteration {i}/{args.max_iterations}: loading PRD")
        prd = load_json(args.prd)
        story = pick_next_story(prd)

        if story is None:
            log("All stories passing; running final tests")
            final_tests = prd.get("final_tests") or union_tests(prd)
            ok, final_test_log = run_tests(final_tests)
            if not ok:
                append_progress(args.progress, f"[{now_iso()}] FINAL_TESTS_FAIL\n{final_test_log}\n")
                log(f"Final tests failed; calling Copilot to fix (iteration {i})")

                # Get progress tail for context
                if args.progress.exists():
                    tail = args.progress.read_text(encoding="utf-8").splitlines()[-30:]
                    progress_tail = "\n".join(tail)
                else:
                    progress_tail = "(none yet)"

                fix_prompt = build_final_tests_fix_prompt(
                    prd, final_test_log, progress_tail, args.completion_token
                )
                copilot_out = call_copilot(args.copilot_bin, fix_prompt, args.copilot_arg)
                append_progress(
                    args.progress,
                    f"[{now_iso()}] ITERATION {i} FINAL_TESTS_FIX\n{copilot_out}\n",
                )
                log("Copilot run complete; continuing loop")
                time.sleep(args.sleep)
                continue

            # Commit tracking files before final clean check
            log("Final tests passed; committing any tracking changes")
            commit_if_needed("ralph: update progress and state")

            if not git_clean():
                append_progress(args.progress, f"[{now_iso()}] FINAL_NOT_CLEAN\n{git_porcelain()}\n")
                log("Repo not clean at final check; refusing to complete")
                time.sleep(args.sleep)
                continue

            append_progress(
                args.progress,
                f"[{now_iso()}] ALL_PASS + FINAL_TESTS_PASS + CLEAN => {args.completion_token}\n",
            )
            log("All completion conditions met")
            print(args.completion_token, flush=True)
            state["runs"] = int(state.get("runs", 0)) + 1
            state["last_completed_at"] = now_iso()
            save_json(args.state, state)
            return 0

        if args.progress.exists():
            tail = args.progress.read_text(encoding="utf-8").splitlines()[-30:]
            progress_tail = "\n".join(tail)
        else:
            progress_tail = "(none yet)"

        prompt = build_prompt(prd, story, progress_tail, args.completion_token)
        log(f"Selected story {story.get('id')}: {story.get('title')}")
        print(f"\n=== ITERATION {i}/{args.max_iterations} | Story {story.get('id')} ===", flush=True)

        copilot_out = call_copilot(args.copilot_bin, prompt, args.copilot_arg)
        log("Copilot run complete; appending transcript to progress.txt")

        append_progress(
            args.progress,
            f"[{now_iso()}] ITERATION {i} STORY {story.get('id')} ({story.get('title')})\n"
            f"{copilot_out}\n",
        )

        prd2 = load_json(args.prd)
        story2 = next((s for s in prd2.get("stories", []) if s.get("id") == story.get("id")), None)
        if not story2:
            append_progress(args.progress, f"[{now_iso()}] ERROR: story disappeared from prd.json\n")
            print("Story disappeared from PRD; fix PRD and re-run.")
            return 3

        tests = story2.get("tests") or []
        if not tests:
            append_progress(args.progress, f"[{now_iso()}] ERROR: story has no tests; refusing to mark pass.\n")
            log("Story has no tests listed in PRD; add tests and re-run")
            time.sleep(args.sleep)
            continue

        log(f"Running story tests for {story2.get('id')}")
        ok, test_log = run_tests(tests)
        if not ok:
            append_progress(args.progress, f"[{now_iso()}] TESTS_FAIL for {story2.get('id')}\n{test_log}\n")
            log("Tests failed; continuing loop")
            time.sleep(args.sleep)
            continue

        story2["passes"] = True
        save_json(args.prd, prd2)

        commit_msg = f"ralph: {story2.get('id')} {story2.get('title')}"
        log(f"Tests passed; committing changes: {commit_msg}")
        commit_if_needed(commit_msg)

        if not git_clean():
            append_progress(args.progress, f"[{now_iso()}] ERROR: repo not clean after commit.\n{git_porcelain()}\n")
            log("Repo not clean after commit; fix manually")
            return 5

        append_progress(args.progress, f"[{now_iso()}] STORY_PASS {story2.get('id')} (tests pass + committed + clean)\n")

        state["runs"] = int(state.get("runs", 0)) + 1
        state["last_iteration_at"] = now_iso()
        state["last_story"] = story2.get("id")
        save_json(args.state, state)

        time.sleep(args.sleep)

    print(f"Did not finish within max iterations ({args.max_iterations}).")
    return 1


 if __name__ == "__main__":
    raise SystemExit(main())
diff --git a/prd.json b/prd.json
 {
  "project": "Ralph Demo: Todo List",
  "final_tests": [
    "npm test",
    "npm run build"
  ],
  "stories": [
    {
      "id": "S1",
      "priority": 1,
      "title": "Core Todo functionality (CRUD + filters)",
      "acceptance": [
        "User can add a todo with a title; empty titles are rejected with a friendly message.",
        "User can toggle complete/incomplete; completed todos are visually distinct (e.g., strikethrough).",
        "User can delete a todo; it disappears immediately.",
        "User can filter between All / Active / Completed; filter updates the list immediately."
      ],
      "tests": [
        "npm test -- --runInBand"
      ],
      "passes": true
    },
    {
      "id": "S2",
      "priority": 2,
      "title": "Persistence (localStorage)",
      "acceptance": [
        "Todos persist across page reloads using localStorage.",
        "Filter selection persists for the session (or localStorage if you prefer).",
        "App handles corrupted localStorage data by resetting gracefully."
      ],
      "tests": [
        "npm test -- --runInBand"
      ],
      "passes": true
    },
    {
      "id": "S3",
      "priority": 3,
      "title": "Vite setup (dev + build)",
      "acceptance": [
        "Add Vite as dev dependency for bundling.",
        "Create index.html in project root that mounts the app.",
        "Create src/main.jsx as entry point that renders TodoApp.",
        "Add 'dev' script: 'vite' and 'build' script: 'vite build'.",
        "Running 'npm run dev' starts a dev server (default Vite port is fine).",
        "Running 'npm run build' succeeds."
      ],
      "tests": [
        "npm run build"
      ],
      "passes": true
    },
    {
      "id": "S4",
      "priority": 4,
      "title": "UI polish (styling + small UX)",
      "acceptance": [
        "Create src/styles.css with clean, modern styling; app centered with reasonable max-width.",
        "Style input, buttons, list; completed todos have strikethrough + muted color.",
        "Filter buttons show active state.",
        "Add a 'Clear Completed' button that appears only when there are completed todos.",
        "Show remaining items count with correct pluralization (1 item / N items).",
        "Import styles.css in main.jsx.",
        "Build succeeds."
      ],
      "tests": [
        "npm run build"
      ],
      "passes": true
    }
  ]
 }
diff --git a/run.sh b/run.sh
 #!/usr/bin/env bash
 set -euo pipefail

 # Bootstrap runner for the Ralph loop.
 # Tests are defined in prd.json and executed by ./copilot-ralph.py.

 # If progress.txt does not exist, create it
 if [ ! -f progress.txt ]; then
 	echo "Creating progress.txt..."
 	touch progress.txt
 fi

 # Initialize git repo if not already initialized
 if ! git rev-parse --is-inside-work-tree &>/dev/null; then
    echo "Initializing git repository..."
    git init
    git add -A
    git commit -m "Initial commit"
 fi

 # Install dependencies if possible.
 # If this is a brand-new empty repo, there may be no package.json yet.
 # In that case, skip install so the agent can create the project files.
 if [ -f package.json ]; then
    if [ ! -d node_modules ]; then
        echo "Installing dependencies..."
        if command -v pnpm &>/dev/null; then
            pnpm install
        else
            npm install
        fi
    fi
 else
    echo "No package.json found; skipping dependency install (agent will create project files)."
 fi

 # Ensure clean working tree (Ralph refuses to start otherwise)
 if [ -n "$(git status --porcelain)" ]; then
    echo "Working tree not clean; committing changes before Ralph run..."
    git add -A
    if [ "${RALPH_NO_VERIFY:-}" = "1" ]; then
        git commit -m "chore: prep for ralph run" --no-verify
    else
        git commit -m "chore: prep for ralph run"
    fi
 fi
 ./copilot-ralph.py --prd prd.json --progress progress.txt --max-iterations 30 \
    --copilot-arg="--allow-all-tools" \
    --copilot-arg="--allow-all-paths"
	#!/usr/bin/env python3
	"""
	Ralph loop wrapper for GitHub Copilot CLI (programmatic mode).

	It repeatedly runs Copilot with a prompt that targets exactly ONE PRD story,
	then enforces these completion conditions:

	- PRD: all stories are passes=true
	- Tests: story tests pass before flipping passes=true
	- Final tests: final_tests pass before completing
	- Repo state: git working tree is clean (no diff / no uncommitted changes)

	The wrapper persists state in:
	- prd.json (source of truth)
	- progress.txt (append-only transcript)
	- .ralph/state.json (resume metadata)

	Usage example:
	./copilot-ralph.py --prd prd.json --progress progress.txt --max-iterations 30
	"""

	from __future__ import annotations

	import argparse
	import json
	import os
	import subprocess
	import sys
	import time
	from datetime import datetime, timezone
	from pathlib import Path
	from typing import Any, Dict, List, Optional, Tuple

	DEFAULT_COMPLETION = "COMPLETE"


	def now_iso() -> str:
	return datetime.now(timezone.utc).isoformat().replace("+00:00", "Z")


	def log(msg: str) -> None:
	# Always flush so long-running steps don't appear "stuck".
	print(f"[{now_iso()}] {msg}", flush=True)


	def run_streaming(
	cmd: List[str] \| str,
	*,
	cwd: Optional[Path] = None,
	check: bool = True,
	label: Optional[str] = None,
	) -> Tuple[int, str]:
	"""Run a command and stream combined stdout/stderr to the terminal.

	Returns (exit_code, combined_output).
	"""
	start = time.time()
	proc = subprocess.Popen(
	cmd,
	cwd=str(cwd) if cwd else None,
	text=True,
	stdout=subprocess.PIPE,
	stderr=subprocess.STDOUT,
	shell=isinstance(cmd, str),
	)

	assert proc.stdout is not None
	lines: List[str] = []
	prefix = f"[{label}] " if label else ""

	for line in proc.stdout:
	# Stream to terminal and keep for logs/progress.txt
	lines.append(line.rstrip("\n"))
	print(prefix + line, end="", flush=True)

	rc = proc.wait()
	elapsed = time.time() - start
	if label:
	log(f"{label} finished with exit code {rc} in {elapsed:.1f}s")
	if check and rc != 0:
	raise subprocess.CalledProcessError(rc, cmd, output="\n".join(lines))
	return rc, "\n".join(lines).strip()


	def sh(cmd: List[str], cwd: Optional[Path] = None, check: bool = True) -> subprocess.CompletedProcess:
	return subprocess.run(
	cmd,
	cwd=str(cwd) if cwd else None,
	text=True,
	capture_output=True,
	check=check,
	)


	def sh_shell(command: str, cwd: Optional[Path] = None, check: bool = True) -> subprocess.CompletedProcess:
	# Run via shell for convenience (quotes/pipes). Keep commands trusted.
	return subprocess.run(
	command,
	cwd=str(cwd) if cwd else None,
	text=True,
	capture_output=True,
	check=check,
	shell=True,
	)


	def git_clean() -> bool:
	p = sh(["git", "status", "--porcelain"], check=True)
	return p.stdout.strip() == ""


	def git_porcelain() -> str:
	return sh(["git", "status", "--porcelain"], check=True).stdout.strip()


	def git_diff_stat() -> str:
	return sh(["git", "diff", "--stat"], check=True).stdout.strip()


	def git_branch() -> str:
	p = sh(["git", "rev-parse", "--abbrev-ref", "HEAD"], check=True)
	return p.stdout.strip()


	def ensure_git_repo() -> None:
	sh(["git", "rev-parse", "--is-inside-work-tree"], check=True)


	def load_json(path: Path) -> Dict[str, Any]:
	return json.loads(path.read_text(encoding="utf-8"))


	def save_json(path: Path, data: Dict[str, Any]) -> None:
	path.write_text(json.dumps(data, indent=2, ensure_ascii=False) + "\n", encoding="utf-8")


	def pick_next_story(prd: Dict[str, Any]) -> Optional[Dict[str, Any]]:
	stories = prd.get("stories", [])
	failing = [s for s in stories if not s.get("passes", False)]
	if not failing:
	return None
	failing.sort(key=lambda s: (int(s.get("priority", 9999)), str(s.get("id", ""))))
	return failing[0]


	def union_tests(prd: Dict[str, Any]) -> List[str]:
	seen: List[str] = []
	for s in prd.get("stories", []):
	for t in (s.get("tests") or []):
	if t not in seen:
	seen.append(t)
	return seen


	def run_tests(commands: List[str]) -> Tuple[bool, str]:
	logs: List[str] = []
	for cmd in commands:
	log(f"Running tests: {cmd}")
	logs.append(f"$ {cmd}")
	try:
	_, combined = run_streaming(cmd, check=True, label="tests")
	if combined:
	logs.append(combined)
	except subprocess.CalledProcessError as e:
	combined = (getattr(e, "output", None) or "").strip()
	if combined:
	logs.append(combined)
	logs.append(f"[FAIL] {cmd} exited with {e.returncode}")
	return False, "\n".join(logs)
	return True, "\n".join(logs)


	def append_progress(progress_path: Path, text: str) -> None:
	progress_path.parent.mkdir(parents=True, exist_ok=True)
	with progress_path.open("a", encoding="utf-8") as f:
	f.write(text.rstrip() + "\n")


	def stage_all() -> None:
	sh(["git", "add", "-A"], check=True)


	def commit_if_needed(message: str) -> bool:
	if git_clean():
	return False
	stage_all()
	args = ["git", "commit", "-m", message]
	if os.getenv("RALPH_NO_VERIFY", "").strip() == "1":
	args.append("--no-verify")
	sh(args, check=True)
	return True


	def build_prompt(
	prd: Dict[str, Any],
	story: Dict[str, Any],
	progress_tail: str,
	completion_token: str,
	) -> str:
	acceptance = "\n".join([f"- {a}" for a in (story.get("acceptance") or [])])
	tests = "\n".join([f"- {t}" for t in (story.get("tests") or [])])

	return f"""You are acting as an autonomous coding agent inside a git repo.

	GOAL
	Implement exactly ONE PRD story per iteration: {story.get("id")} - {story.get("title")}

	ACCEPTANCE CRITERIA
	{acceptance if acceptance.strip() else "- (none provided)"}

	TESTS TO PASS FOR THIS STORY
	{tests if tests.strip() else "- (no tests listed; do not mark passing without adding tests in prd.json)"}

	RULES (NON-NEGOTIABLE)
	1) Work ONLY on this story. Do not start other stories.
	2) Make the smallest set of changes that satisfy acceptance criteria.
	3) Update prd.json: set this story's passes=true ONLY when tests pass.
	4) Ensure repository is left clean (no uncommitted changes) by committing your work.
	5) Do not emit the token {completion_token} unless ALL stories in prd.json are passes=true AND all final tests pass AND git is clean.

	CONTEXT
	- Current branch: {git_branch()}
	- Git status:
	{git_porcelain() or "(clean)"}
	- Diff stat:
	{git_diff_stat() or "(none)"}

	RECENT PROGRESS LOG (tail)
	{progress_tail}

	OUTPUT FORMAT
	- Start with a short plan.
	- Then do the work.
	- End with:
	- "STORY_DONE" if you believe this story is done (tests passing + committed + prd.json updated).
	- Or "STORY_BLOCKED: <reason>" if you cannot proceed.
	- Only end with {completion_token} if absolutely all conditions are met.
	"""


	def build_final_tests_fix_prompt(
	prd: Dict[str, Any],
	test_log: str,
	progress_tail: str,
	completion_token: str,
	) -> str:
	final_tests = prd.get("final_tests") or union_tests(prd)
	tests_list = "\n".join([f"- {t}" for t in final_tests])
	# Truncate test log to last 80 lines to avoid overly long prompts
	test_log_lines = test_log.splitlines()
	if len(test_log_lines) > 80:
	test_log = "\n".join(test_log_lines[-80:])

	return f"""You are acting as an autonomous coding agent inside a git repo.

	GOAL
	All PRD stories are marked as passing, but the FINAL TESTS are failing. Fix the failing tests.

	FAILING TESTS
	{tests_list}

	TEST OUTPUT (failures)
	{test_log}

	RULES (NON-NEGOTIABLE)
	1) Analyze the test failures and fix the underlying code issues.
	2) Do NOT modify the tests unless they are clearly incorrect.
	3) Make the smallest set of changes that fix the failures.
	4) Ensure repository is left clean (no uncommitted changes) by committing your work.
	5) Do not emit the token {completion_token} unless all final tests pass AND git is clean.

	CONTEXT
	- Current branch: {git_branch()}
	- Git status:
	{git_porcelain() or "(clean)"}
	- Diff stat:
	{git_diff_stat() or "(none)"}

	RECENT PROGRESS LOG (tail)
	{progress_tail}

	OUTPUT FORMAT
	- Start with a short analysis of what's failing and why.
	- Then fix the code.
	- Commit your changes.
	- End with "FIXES_APPLIED" if you believe the fixes are done.
	- Only end with {completion_token} if all final tests pass AND git is clean.
	"""


	def call_copilot(copilot_bin: str, prompt: str, extra_args: List[str]) -> str:
	# Copilot CLI programmatic mode: copilot -p "prompt"
	cmd = [copilot_bin, "-p", prompt] + extra_args
	log("Calling Copilot (programmatic mode)...")
	try:
	rc, combined = run_streaming(cmd, check=False, label="copilot")
	except FileNotFoundError:
	return f"[ERROR] Copilot binary not found: {copilot_bin}"
	if rc != 0:
	combined = (combined + f"\n\n[ERROR] copilot exited with {rc}").strip()
	return combined


	def main() -> int:
	ap = argparse.ArgumentParser()
	ap.add_argument("--prd", type=Path, default=Path("prd.json"))
	ap.add_argument("--progress", type=Path, default=Path("progress.txt"))
	ap.add_argument("--state", type=Path, default=Path(".ralph/state.json"))
	ap.add_argument("--max-iterations", type=int, default=20)
	ap.add_argument("--sleep", type=float, default=0.3)
	ap.add_argument("--completion-token", type=str, default=DEFAULT_COMPLETION)
	ap.add_argument("--copilot-bin", type=str, default="copilot")
	ap.add_argument(
	"--copilot-arg",
	action="append",
	default=[],
	help="Extra args passed through to copilot (repeatable).",
	)
	args = ap.parse_args()

	log("Starting Ralph loop")
	ensure_git_repo()

	log(f"Using PRD: {args.prd}")
	log(f"Using progress log: {args.progress}")
	log(f"Using state file: {args.state}")
	log(f"Max iterations: {args.max_iterations}")
	log(f"Completion token: {args.completion_token}")

	args.state.parent.mkdir(parents=True, exist_ok=True)

	if not git_clean():
	print(
	"Refusing to start: git working tree is not clean.\nRun: git status --porcelain",
	file=sys.stderr,
	)
	return 2

	if args.state.exists():
	state = load_json(args.state)
	else:
	state = {"created_at": now_iso(), "runs": 0}
	save_json(args.state, state)
	log("Created new state file")

	for i in range(1, args.max_iterations + 1):
	log(f"Iteration {i}/{args.max_iterations}: loading PRD")
	prd = load_json(args.prd)
	story = pick_next_story(prd)

	if story is None:
	log("All stories passing; running final tests")
	final_tests = prd.get("final_tests") or union_tests(prd)
	ok, final_test_log = run_tests(final_tests)
	if not ok:
	append_progress(args.progress, f"[{now_iso()}] FINAL_TESTS_FAIL\n{final_test_log}\n")
	log(f"Final tests failed; calling Copilot to fix (iteration {i})")

	# Get progress tail for context
	if args.progress.exists():
	tail = args.progress.read_text(encoding="utf-8").splitlines()[-30:]
	progress_tail = "\n".join(tail)
	else:
	progress_tail = "(none yet)"

	fix_prompt = build_final_tests_fix_prompt(
	prd, final_test_log, progress_tail, args.completion_token
	)
	copilot_out = call_copilot(args.copilot_bin, fix_prompt, args.copilot_arg)
	append_progress(
	args.progress,
	f"[{now_iso()}] ITERATION {i} FINAL_TESTS_FIX\n{copilot_out}\n",
	)
	log("Copilot run complete; continuing loop")
	time.sleep(args.sleep)
	continue

	# Commit tracking files before final clean check
	log("Final tests passed; committing any tracking changes")
	commit_if_needed("ralph: update progress and state")

	if not git_clean():
	append_progress(args.progress, f"[{now_iso()}] FINAL_NOT_CLEAN\n{git_porcelain()}\n")
	log("Repo not clean at final check; refusing to complete")
	time.sleep(args.sleep)
	continue

	append_progress(
	args.progress,
	f"[{now_iso()}] ALL_PASS + FINAL_TESTS_PASS + CLEAN => {args.completion_token}\n",
	)
	log("All completion conditions met")
	print(args.completion_token, flush=True)
	state["runs"] = int(state.get("runs", 0)) + 1
	state["last_completed_at"] = now_iso()
	save_json(args.state, state)
	return 0

	if args.progress.exists():
	tail = args.progress.read_text(encoding="utf-8").splitlines()[-30:]
	progress_tail = "\n".join(tail)
	else:
	progress_tail = "(none yet)"

	prompt = build_prompt(prd, story, progress_tail, args.completion_token)
	log(f"Selected story {story.get('id')}: {story.get('title')}")
	print(f"\n=== ITERATION {i}/{args.max_iterations} \| Story {story.get('id')} ===", flush=True)

	copilot_out = call_copilot(args.copilot_bin, prompt, args.copilot_arg)
	log("Copilot run complete; appending transcript to progress.txt")

	append_progress(
	args.progress,
	f"[{now_iso()}] ITERATION {i} STORY {story.get('id')} ({story.get('title')})\n"
	f"{copilot_out}\n",
	)

	prd2 = load_json(args.prd)
	story2 = next((s for s in prd2.get("stories", []) if s.get("id") == story.get("id")), None)
	if not story2:
	append_progress(args.progress, f"[{now_iso()}] ERROR: story disappeared from prd.json\n")
	print("Story disappeared from PRD; fix PRD and re-run.")
	return 3

	tests = story2.get("tests") or []
	if not tests:
	append_progress(args.progress, f"[{now_iso()}] ERROR: story has no tests; refusing to mark pass.\n")
	log("Story has no tests listed in PRD; add tests and re-run")
	time.sleep(args.sleep)
	continue

	log(f"Running story tests for {story2.get('id')}")
	ok, test_log = run_tests(tests)
	if not ok:
	append_progress(args.progress, f"[{now_iso()}] TESTS_FAIL for {story2.get('id')}\n{test_log}\n")
	log("Tests failed; continuing loop")
	time.sleep(args.sleep)
	continue

	story2["passes"] = True
	save_json(args.prd, prd2)

	commit_msg = f"ralph: {story2.get('id')} {story2.get('title')}"
	log(f"Tests passed; committing changes: {commit_msg}")
	commit_if_needed(commit_msg)

	if not git_clean():
	append_progress(args.progress, f"[{now_iso()}] ERROR: repo not clean after commit.\n{git_porcelain()}\n")
	log("Repo not clean after commit; fix manually")
	return 5

	append_progress(args.progress, f"[{now_iso()}] STORY_PASS {story2.get('id')} (tests pass + committed + clean)\n")

	state["runs"] = int(state.get("runs", 0)) + 1
	state["last_iteration_at"] = now_iso()
	state["last_story"] = story2.get("id")
	save_json(args.state, state)

	time.sleep(args.sleep)

	print(f"Did not finish within max iterations ({args.max_iterations}).")
	return 1


	if __name__ == "__main__":
	raise SystemExit(main())
	{
	"project": "Ralph Demo: Todo List",
	"final_tests": [
	"npm test",
	"npm run build"
	],
	"stories": [
	{
	"id": "S1",
	"priority": 1,
	"title": "Core Todo functionality (CRUD + filters)",
	"acceptance": [
	"User can add a todo with a title; empty titles are rejected with a friendly message.",
	"User can toggle complete/incomplete; completed todos are visually distinct (e.g., strikethrough).",
	"User can delete a todo; it disappears immediately.",
	"User can filter between All / Active / Completed; filter updates the list immediately."
	],
	"tests": [
	"npm test -- --runInBand"
	],
	"passes": true
	},
	{
	"id": "S2",
	"priority": 2,
	"title": "Persistence (localStorage)",
	"acceptance": [
	"Todos persist across page reloads using localStorage.",
	"Filter selection persists for the session (or localStorage if you prefer).",
	"App handles corrupted localStorage data by resetting gracefully."
	],
	"tests": [
	"npm test -- --runInBand"
	],
	"passes": true
	},
	{
	"id": "S3",
	"priority": 3,
	"title": "Vite setup (dev + build)",
	"acceptance": [
	"Add Vite as dev dependency for bundling.",
	"Create index.html in project root that mounts the app.",
	"Create src/main.jsx as entry point that renders TodoApp.",
	"Add 'dev' script: 'vite' and 'build' script: 'vite build'.",
	"Running 'npm run dev' starts a dev server (default Vite port is fine).",
	"Running 'npm run build' succeeds."
	],
	"tests": [
	"npm run build"
	],
	"passes": true
	},
	{
	"id": "S4",
	"priority": 4,
	"title": "UI polish (styling + small UX)",
	"acceptance": [
	"Create src/styles.css with clean, modern styling; app centered with reasonable max-width.",
	"Style input, buttons, list; completed todos have strikethrough + muted color.",
	"Filter buttons show active state.",
	"Add a 'Clear Completed' button that appears only when there are completed todos.",
	"Show remaining items count with correct pluralization (1 item / N items).",
	"Import styles.css in main.jsx.",
	"Build succeeds."
	],
	"tests": [
	"npm run build"
	],
	"passes": true
	}
	]
	}
	#!/usr/bin/env bash
	set -euo pipefail

	# Bootstrap runner for the Ralph loop.
	# Tests are defined in prd.json and executed by ./copilot-ralph.py.

	# If progress.txt does not exist, create it
	if [ ! -f progress.txt ]; then
	echo "Creating progress.txt..."
	touch progress.txt
	fi

	# Initialize git repo if not already initialized
	if ! git rev-parse --is-inside-work-tree &>/dev/null; then
	echo "Initializing git repository..."
	git init
	git add -A
	git commit -m "Initial commit"
	fi

	# Install dependencies if possible.
	# If this is a brand-new empty repo, there may be no package.json yet.
	# In that case, skip install so the agent can create the project files.
	if [ -f package.json ]; then
	if [ ! -d node_modules ]; then
	echo "Installing dependencies..."
	if command -v pnpm &>/dev/null; then
	pnpm install
	else
	npm install
	fi
	fi
	else
	echo "No package.json found; skipping dependency install (agent will create project files)."
	fi

	# Ensure clean working tree (Ralph refuses to start otherwise)
	if [ -n "$(git status --porcelain)" ]; then
	echo "Working tree not clean; committing changes before Ralph run..."
	git add -A
	if [ "${RALPH_NO_VERIFY:-}" = "1" ]; then
	git commit -m "chore: prep for ralph run" --no-verify
	else
	git commit -m "chore: prep for ralph run"
	fi
	fi
	./copilot-ralph.py --prd prd.json --progress progress.txt --max-iterations 30 \
	--copilot-arg="--allow-all-tools" \
	--copilot-arg="--allow-all-paths"