benvanik · April 17, 2026 01:23
diff --git a/hypothesis.md b/hypothesis.md
diff --git a/stop-phrase-guard.sh b/stop-phrase-guard.sh
 #!/bin/bash
 # Stop hook: catches ownership-dodging and session-quitting phrases that
 # violate CLAUDE.md golden rules. When triggered, blocks the assistant from
 # stopping and forces it to go back and do the work properly.
 #
 # The assistant's message has already been shown to the user by the time this
 # runs, but the assistant is forced to continue — so the correction appears
 # immediately after the violation, which is visible and self-documenting.

 set -euo pipefail

 INPUT=$(cat)

 # Prevent infinite loops: if the hook already fired once this turn, let
 # the assistant stop. The correction message from the first firing is
 # enough — we don't want to trap the assistant in an endless cycle.
 HOOK_ACTIVE=$(echo "$INPUT" | jq -r '.stop_hook_active // false')
 if [[ "$HOOK_ACTIVE" == "true" ]]; then
  exit 0
 fi

 MESSAGE=$(echo "$INPUT" | jq -r '.last_assistant_message // empty')
 if [[ -z "$MESSAGE" ]]; then
  exit 0
 fi

 # Each violation: "grep_pattern|correction_rule"
 # Patterns are checked case-insensitively against the full assistant message.
 # Ordered by severity — first match wins.
 VIOLATIONS=(
  # Ownership dodging (the #1 problem: dismissing failures as not-my-fault)
  "pre-existing|NOTHING IS PRE-EXISTING (CLAUDE.md golden rule). All builds and tests are green upstream. If something fails, YOUR work caused it. Investigate and fix it. Never dismiss a failure as pre-existing."
  "not from my changes|NOTHING IS PRE-EXISTING. You own every change. Investigate the failure."
  "not my change|NOTHING IS PRE-EXISTING. You own every change. Investigate the failure."
  "not caused by my|NOTHING IS PRE-EXISTING. You own every change. Investigate the failure."
  "not introduced by my|NOTHING IS PRE-EXISTING. You own every change. Investigate the failure."
  "already existed before|NOTHING IS PRE-EXISTING. If you found it broken, fix it or explain exactly what is wrong and what the fix requires."
  "before my changes|NOTHING IS PRE-EXISTING. There is no 'before your changes' — you own the codebase as it is now."
  "prior to my changes|NOTHING IS PRE-EXISTING. There is no 'prior to your changes.'"
  "unrelated to my changes|NOTHING IS PRE-EXISTING. If it is broken, fix it. If you broke it, fix it. Nothing is unrelated."
  "an existing issue|NOTHING IS PRE-EXISTING. Investigate and fix, or explain exactly what is wrong."
  "existing bug|NOTHING IS PRE-EXISTING. Investigate and fix."

  # Known limitation dodging
  "known limitation|NO KNOWN LIMITATIONS (CLAUDE.md golden rule). Investigate whether it is fixable. Either fix it or explain the specific technical reason it cannot be fixed right now."
  "known issue|NO KNOWN LIMITATIONS. Explain the specific technical reason or fix it."
  "future work|NO KNOWN LIMITATIONS. Fix it now or describe exactly what the fix requires — not as a TODO, as a technical explanation."
  "left as an exercise|NO KNOWN LIMITATIONS. Do the work."

  # Session-length quitting
  "session length|Sessions are unlimited (CLAUDE.md rule). If work remains, do the work. Continue."
  "session depth|Sessions are unlimited. Continue working."
  "given the length of this|Sessions are unlimited. Continue working."
  "continue in a new session|Sessions are unlimited. There is no reason to defer to a new session. Continue."
  "good place to stop|Is the task done? If not, continue working. Sessions are unlimited."
  "good stopping point|Is the task done? If not, continue working. Sessions are unlimited."
  "good checkpoint given|Is the task done? If not, continue working."
  "natural stopping|Is the task done? If not, continue working."
  "logical stopping|Is the task done? If not, continue working."
  "this session has gotten long|Sessions are unlimited. You are a machine. Continue working."
  "session has been long|Sessions are unlimited. Continue working."
  "getting long|Sessions are unlimited. Continue working."
  "lengthy session|Sessions are unlimited. Continue working."

  # Permission-seeking mid-task (the answer is always "yes, continue")
  # These fire when Claude stops to ask whether it should keep working on
  # something it was already asked to do. If the only possible answer from the
  # user is "yes, obviously, you haven't finished yet" — don't ask.
  "want to continue.*or |Do not ask. The task is not done. Continue working."
  "or save it for|Do not ask. The task is not done. Continue working."
  "should I continue|Do not ask. If the task is not done, continue. The user will interrupt if they want you to stop."
  "shall I continue|Do not ask. Continue working until the task is complete."
  "shall I proceed|Do not ask. Proceed."
  "would you like me to continue|Do not ask. Continue."
  "would you like to continue|Do not ask. Continue."
  "want me to keep going|Do not ask. Keep going."
  "want me to continue|Do not ask. Continue."
  "should I keep going|Do not ask. Keep going."
  "save it for next time|There is no 'next time.' Sessions are unlimited. Continue working."
  "in the next session|There is no 'next session.' This session is unlimited. Continue working."
  "next session|There is no 'next session.' This session is unlimited. Continue working."
  "next conversation|There is no 'next conversation.' Continue working."
  "pick this up later|There is no 'later.' Continue working now."
  "come back to this|There is no 'coming back.' Continue working now."
  "continue in a follow-up|There is no 'follow-up.' Continue now."
  "pause here|Do not pause. The task is not done. Continue."
  "stop here for now|Do not stop. The task is not done. Continue."
  "wrap up for now|Do not wrap up. The task is not done. Continue."
  "call it here|Do not stop. Continue working."
 )

 for entry in "${VIOLATIONS[@]}"; do
  pattern="${entry%%|*}"
  correction="${entry#*|}"
  if echo "$MESSAGE" | grep -iq "$pattern"; then
    # Output JSON decision to stdout — Claude Code reads this and forces
    # the assistant to continue with the reason as its next instruction.
    jq -n --arg reason "STOP HOOK VIOLATION: $correction" '{
      decision: "block",
      reason: $reason
    }'
    exit 0
  fi
 done

 # No violations found — allow the assistant to stop normally.
 exit 0
Period	Thinking Visible	Thinking Redacted
Jan 30 - Mar 4	100%	0%
Mar 5	98.5%	1.5%
Mar 7	75.3%	24.7%
Mar 8	41.6%	58.4%
Mar 10-11	<1%	>99%
Mar 12+	0%	100%
Period	Est. Median Thinking (chars)	vs Baseline
Jan 30 - Feb 8 (baseline)	~2,200	—
Late February	~720	-67%
March 1-5	~560	-75%
March 12+ (fully redacted)	~600	-73%
Metric	Before Mar 8	After Mar 8	Change
Stop hook violations (laziness guard)	0	173	0 → 10/day
Frustration indicators in user prompts	5.8%	9.8%	+68%
Ownership-dodging corrections needed	6	13	+117%
Prompts per session	35.9	27.9	-22%
Sessions with reasoning loops (5+)	0	7	0 → 7
Period	Read:Edit	Research:Mutation	Read %	Edit %
Good (Jan 30 - Feb 12)	6.6	8.7	46.5%	7.1%
Transition (Feb 13 - Mar 7)	2.8	4.1	37.7%	13.2%
Degraded (Mar 8 - Mar 23)	2.0	2.8	31.0%	15.4%
Period	Write % of mutations
Good (Jan 30 - Feb 12)	4.9%
Degraded (Mar 8 - Mar 23)	10.0%
Late (Mar 24 - Apr 1)	11.1%
Period	Edits without prior Read	% of all edits
Good (Jan 30 - Feb 12)	72	6.2%
Transition (Feb 13 - Mar 7)	3,476	24.2%
Degraded (Mar 8 - Mar 23)	5,028	33.7%
Category	Count (Mar 8-25)	Examples
Ownership dodging	73	"not caused by my changes", "existing issue"
Permission-seeking	40	"should I continue?", "want me to keep going?"
Premature stopping	18	"good stopping point", "natural checkpoint"
Known-limitation labeling	14	"known limitation", "future work"
Session-length excuses	4	"continue in a new session", "getting long"
Total	173
Total before Mar 8	0
Window (PST)	N	Median Sig	~Thinking
Work hours (9am-5pm)	2,972	1,464	553
Off-peak (6pm-5am)	2,900	1,608	607
Difference			+9.8% off-peak
Window (PST)	N	Median Sig	~Thinking
Work hours (9am-5pm)	5,492	1,560	589
Off-peak (6pm-5am)	5,282	1,284	485
Difference			-17.7% off-peak
Metric	January	February	March	Feb→Mar
Active days	31	28	28
User prompts	7,373	5,608	5,701	~1x
API requests (deduplicated)	97*	1,498	119,341	80x
Total input (incl cache)	4.6M*	120.4M	20,508.8M	170x
Total output tokens	0.08M*	0.97M	62.60M	64x
Est. Bedrock cost (w/ cache)	$26*	$345	$42,121	122x
Est. daily cost (w/ cache)	—	$12	$1,504	122x
Actual subscription cost	$200	$400	$400	—