Implement Spec 001: Core UI & Camera Feed with PyObjC
This commit is contained in:
18
.cursor/commands/speckit.specify.md
Normal file
18
.cursor/commands/speckit.specify.md
Normal file
@@ -0,0 +1,18 @@
|
|||||||
|
---
|
||||||
|
description: Create a feature specification
|
||||||
|
---
|
||||||
|
|
||||||
|
Create a specification for:
|
||||||
|
|
||||||
|
$ARGUMENTS
|
||||||
|
|
||||||
|
## Steps
|
||||||
|
|
||||||
|
1. Generate short name (2-4 words, kebab-case)
|
||||||
|
2. Find next spec number from `specs/`
|
||||||
|
3. Create `specs/NNN-short-name.md`
|
||||||
|
4. Include clear acceptance criteria
|
||||||
|
5. Add completion signal:
|
||||||
|
```
|
||||||
|
**Output when complete:** `<promise>DONE</promise>`
|
||||||
|
```
|
||||||
6
.gitignore
vendored
Normal file
6
.gitignore
vendored
Normal file
@@ -0,0 +1,6 @@
|
|||||||
|
.env
|
||||||
|
.venv/
|
||||||
|
__pycache__/
|
||||||
|
*.pyc
|
||||||
|
.DS_Store
|
||||||
|
.specify/
|
||||||
5
AGENTS.md
Normal file
5
AGENTS.md
Normal file
@@ -0,0 +1,5 @@
|
|||||||
|
# Agent Instructions
|
||||||
|
|
||||||
|
**Read:** `.specify/memory/constitution.md`
|
||||||
|
|
||||||
|
That file is your source of truth for this project.
|
||||||
5
CLAUDE.md
Normal file
5
CLAUDE.md
Normal file
@@ -0,0 +1,5 @@
|
|||||||
|
# Agent Instructions
|
||||||
|
|
||||||
|
**Read:** `.specify/memory/constitution.md`
|
||||||
|
|
||||||
|
That file is your source of truth for this project.
|
||||||
18
PROMPT_build.md
Normal file
18
PROMPT_build.md
Normal file
@@ -0,0 +1,18 @@
|
|||||||
|
# Ralph Build Mode
|
||||||
|
|
||||||
|
Read `.specify/memory/constitution.md` first.
|
||||||
|
|
||||||
|
## Your Task
|
||||||
|
|
||||||
|
1. Check `specs/` folder
|
||||||
|
2. Find highest priority INCOMPLETE spec
|
||||||
|
3. Implement completely
|
||||||
|
4. Run tests, verify acceptance criteria
|
||||||
|
5. Commit and push
|
||||||
|
6. Output `<promise>DONE</promise>` when done
|
||||||
|
|
||||||
|
## Rules
|
||||||
|
|
||||||
|
- ONE spec per iteration
|
||||||
|
- Do NOT output the magic phrase until the spec is truly complete
|
||||||
|
- If blocked: explain why in `ralph_history.txt`, then exit without outputting the phrase
|
||||||
11
PROMPT_plan.md
Normal file
11
PROMPT_plan.md
Normal file
@@ -0,0 +1,11 @@
|
|||||||
|
# Ralph Planning Mode
|
||||||
|
|
||||||
|
Read `.specify/memory/constitution.md` first.
|
||||||
|
|
||||||
|
## Your Task
|
||||||
|
|
||||||
|
1. Analyze specs in `specs/`
|
||||||
|
2. Create `IMPLEMENTATION_PLAN.md` with prioritized tasks
|
||||||
|
3. Output `<promise>DONE</promise>` when done
|
||||||
|
|
||||||
|
Delete IMPLEMENTATION_PLAN.md to return to direct spec mode.
|
||||||
108
main.py
Normal file
108
main.py
Normal file
@@ -0,0 +1,108 @@
|
|||||||
|
import sys
|
||||||
|
import cv2
|
||||||
|
import numpy as np
|
||||||
|
from PIL import Image
|
||||||
|
import objc
|
||||||
|
from AppKit import (
|
||||||
|
NSApplication, NSApp, NSWindow, NSView, NSImageView, NSButton,
|
||||||
|
NSStackView, NSImage, NSBitmapImageRep, NSBackingStoreBuffered,
|
||||||
|
NSWindowStyleMaskTitled, NSWindowStyleMaskClosable,
|
||||||
|
NSWindowStyleMaskResizable, NSWindowStyleMaskMiniaturizable,
|
||||||
|
NSTimer, NSMakeSize, NSMakeRect, NSObject, NSLog,
|
||||||
|
NSUserInterfaceLayoutOrientationVertical, NSLayoutAttributeCenterX,
|
||||||
|
NSLayoutAttributeCenterY, NSLayoutAttributeWidth, NSLayoutAttributeHeight,
|
||||||
|
NSLayoutAttributeTop, NSLayoutAttributeBottom, NSLayoutAttributeLeading,
|
||||||
|
NSLayoutAttributeTrailing
|
||||||
|
)
|
||||||
|
from Foundation import NSObject, NSTimer, NSDate
|
||||||
|
|
||||||
|
class ItemSenseApp(NSObject):
    """Application delegate showing a live camera preview above a Capture button.

    The delegate owns the window, the OpenCV capture handle (``self.cap``) and
    the repeating timer (``self.timer``) that refreshes the preview.
    """

    def applicationDidFinishLaunching_(self, notification):
        """Build the UI, open camera 0 and start the ~30 FPS refresh timer."""
        style_mask = (
            NSWindowStyleMaskTitled
            | NSWindowStyleMaskClosable
            | NSWindowStyleMaskResizable
            | NSWindowStyleMaskMiniaturizable
        )
        self.window = NSWindow.alloc().initWithContentRect_styleMask_backing_defer_(
            NSMakeRect(0, 0, 800, 600),
            style_mask,
            NSBackingStoreBuffered,
            False,
        )
        self.window.setTitle_("ItemSense")
        self.window.center()

        # Main content view (StackView for layout)
        self.stack_view = NSStackView.alloc().init()
        self.stack_view.setOrientation_(NSUserInterfaceLayoutOrientationVertical)
        self.stack_view.setSpacing_(10)
        self.stack_view.setEdgeInsets_((10, 10, 10, 10))
        self.window.setContentView_(self.stack_view)

        # Image View for Camera Feed
        self.image_view = NSImageView.alloc().init()
        self.image_view.setImageScaling_(0)  # NSImageScaleProportionallyDown
        self.stack_view.addView_inGravity_(self.image_view, 1)  # Top gravity

        # Capture Button
        self.capture_button = NSButton.buttonWithTitle_target_action_(
            "Capture", self, "captureClicked:"
        )
        self.stack_view.addView_inGravity_(self.capture_button, 3)  # Bottom gravity

        self.window.makeKeyAndOrderFront_(None)

        # Initialize Camera
        self.cap = cv2.VideoCapture(0)
        if not self.cap.isOpened():
            NSLog("Error: Could not open camera")

        # Start Timer for 30 FPS
        self.timer = NSTimer.scheduledTimerWithTimeInterval_target_selector_userInfo_repeats_(
            1.0 / 30.0, self, "updateFrame:", None, True
        )

    def applicationShouldTerminateAfterLastWindowClosed_(self, sender):
        """Quit the application when its only window is closed."""
        return True

    def applicationWillTerminate_(self, notification):
        """Stop the refresh timer and release the camera."""
        # Invalidate first so no updateFrame_ callback can run against a
        # capture handle that is being released.
        timer = getattr(self, "timer", None)
        if timer is not None:
            timer.invalidate()

        cap = getattr(self, "cap", None)
        if cap is not None and cap.isOpened():
            cap.release()

    def updateFrame_(self, timer):
        """Timer callback: read one camera frame and display it.

        Does nothing when the camera is unavailable or the read fails.
        """
        cap = getattr(self, "cap", None)
        if cap is None or not cap.isOpened():
            return

        ok, frame = cap.read()
        if not ok:
            return

        # OpenCV delivers BGR; the PPM payload below is RGB.
        rgb_frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        height, width = rgb_frame.shape[:2]

        # Wrap the raw pixels in a binary PPM (P6) container: a short text
        # header followed by uncompressed RGB bytes, so no encoding work is
        # needed per frame. This relies on NSImage being able to decode PPM.
        header = f"P6 {width} {height} 255 ".encode()
        data = header + rgb_frame.tobytes()
        ns_data = objc.lookUpClass("NSData").dataWithBytes_length_(data, len(data))
        ns_image = NSImage.alloc().initWithData_(ns_data)

        # Keep the previous frame on screen if this one could not be decoded.
        if ns_image is None:
            return
        self.image_view.setImage_(ns_image)

    def captureClicked_(self, sender):
        """Action for the Capture button; currently only logs the click."""
        print("Capture clicked")
|
||||||
|
|
||||||
|
if __name__ == "__main__":
    # Create (or fetch) the process-wide application object.
    app = NSApplication.sharedApplication()

    # The delegate is held in a module-level name so it stays alive for the
    # whole run loop.
    delegate = ItemSenseApp.alloc().init()
    app.setDelegate_(delegate)

    # Bring the app to the foreground, then hand control to the Cocoa run loop.
    NSApp.activateIgnoringOtherApps_(True)
    app.run()
|
||||||
5
requirements.txt
Normal file
5
requirements.txt
Normal file
@@ -0,0 +1,5 @@
|
|||||||
|
pyobjc-framework-Cocoa
|
||||||
|
opencv-python
|
||||||
|
pillow
|
||||||
|
openai
|
||||||
|
python-dotenv
|
||||||
635
scripts/ralph-loop-codex.sh
Executable file
635
scripts/ralph-loop-codex.sh
Executable file
@@ -0,0 +1,635 @@
|
|||||||
|
#!/bin/bash
|
||||||
|
#
|
||||||
|
# Ralph Loop for OpenAI Codex CLI
|
||||||
|
#
|
||||||
|
# Based on Geoffrey Huntley's Ralph Wiggum methodology.
|
||||||
|
# Combined with SpecKit-style specifications.
|
||||||
|
#
|
||||||
|
# Usage:
|
||||||
|
# ./scripts/ralph-loop-codex.sh # Build mode (unlimited)
|
||||||
|
# ./scripts/ralph-loop-codex.sh 20 # Build mode (max 20 iterations)
|
||||||
|
# ./scripts/ralph-loop-codex.sh plan # Planning mode (optional)
|
||||||
|
#
|
||||||
|
|
||||||
|
set -e
|
||||||
|
set -o pipefail
|
||||||
|
|
||||||
|
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
|
||||||
|
PROJECT_DIR="$(dirname "$SCRIPT_DIR")"
|
||||||
|
LOG_DIR="$PROJECT_DIR/logs"
|
||||||
|
CONSTITUTION="$PROJECT_DIR/.specify/memory/constitution.md"
|
||||||
|
RLM_DIR="$PROJECT_DIR/rlm"
|
||||||
|
RLM_TRACE_DIR="$RLM_DIR/trace"
|
||||||
|
RLM_QUERIES_DIR="$RLM_DIR/queries"
|
||||||
|
RLM_ANSWERS_DIR="$RLM_DIR/answers"
|
||||||
|
RLM_INDEX="$RLM_DIR/index.tsv"
|
||||||
|
|
||||||
|
# Configuration
|
||||||
|
MAX_ITERATIONS=0 # 0 = unlimited
|
||||||
|
MODE="build"
|
||||||
|
RLM_CONTEXT_FILE=""
|
||||||
|
CODEX_CMD="${CODEX_CMD:-codex}"
|
||||||
|
TAIL_LINES=5
|
||||||
|
TAIL_RENDERED_LINES=0
|
||||||
|
ROLLING_OUTPUT_LINES=5
|
||||||
|
ROLLING_OUTPUT_INTERVAL=10
|
||||||
|
ROLLING_RENDERED_LINES=0
|
||||||
|
|
||||||
|
# Colors
|
||||||
|
RED='\033[0;31m'
|
||||||
|
GREEN='\033[0;32m'
|
||||||
|
YELLOW='\033[1;33m'
|
||||||
|
BLUE='\033[0;34m'
|
||||||
|
PURPLE='\033[0;35m'
|
||||||
|
CYAN='\033[0;36m'
|
||||||
|
NC='\033[0m'
|
||||||
|
|
||||||
|
mkdir -p "$LOG_DIR"
|
||||||
|
|
||||||
|
# Check constitution for YOLO setting
|
||||||
|
YOLO_ENABLED=true
|
||||||
|
if [[ -f "$CONSTITUTION" ]]; then
|
||||||
|
if grep -q "YOLO Mode.*DISABLED" "$CONSTITUTION" 2>/dev/null; then
|
||||||
|
YOLO_ENABLED=false
|
||||||
|
fi
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Print command-line usage, the available modes and the optional RLM
# workspace layout to stdout.
show_help() {
    # Quoted delimiter: the help text is literal and needs no expansion.
    cat <<'HELP'
Ralph Loop for OpenAI Codex CLI

Usage:
  ./scripts/ralph-loop-codex.sh              # Build mode, unlimited
  ./scripts/ralph-loop-codex.sh 20           # Build mode, max 20 iterations
  ./scripts/ralph-loop-codex.sh plan         # Planning mode (OPTIONAL)
  ./scripts/ralph-loop-codex.sh --rlm-context ./rlm/context.txt
  ./scripts/ralph-loop-codex.sh --rlm ./rlm/context.txt

Modes:
  build (default)   Pick incomplete spec and implement
  plan              Create IMPLEMENTATION_PLAN.md (OPTIONAL)

Work Source:
  Agent reads specs/*.md and picks the highest priority incomplete spec.

YOLO Mode: Uses --dangerously-bypass-approvals-and-sandbox

RLM Mode (optional):
  --rlm-context <file>  Treat a large context file as external environment.
                        The agent should read slices instead of loading it all.
  --rlm [file]          Shortcut for --rlm-context (defaults to rlm/context.txt)

RLM workspace (when enabled):
  - rlm/trace/                    Prompt snapshots + outputs per iteration
  - rlm/index.tsv                 Index of all iterations (timestamp, prompt, log, status)
  - rlm/queries/ and rlm/answers/ For optional recursive sub-queries

HELP
}
|
||||||
|
|
||||||
|
# Show the last $TAIL_LINES lines of a log file.
#   $1  path to the log file (silently ignored if it does not exist)
#   $2  label used in the heading (default: "Codex")
# Writes to /dev/tty when it is writable, otherwise to stdout. On a tty the
# previously rendered block is erased first, using TAIL_RENDERED_LINES.
print_latest_output() {
    local log_path="$1"
    local source_label="${2:-Codex}"
    local sink="/dev/tty"

    if [[ ! -f "$log_path" ]]; then
        return 0
    fi

    [[ -w "$sink" ]] || sink="/dev/stdout"

    # Move the cursor up over the block drawn by the previous call and clear
    # everything below it.
    if [[ "$sink" == "/dev/tty" && "$TAIL_RENDERED_LINES" -gt 0 ]]; then
        printf "\033[%dA\033[J" "$TAIL_RENDERED_LINES" > "$sink"
    fi

    {
        echo "Latest ${source_label} output (last ${TAIL_LINES} lines):"
        tail -n "$TAIL_LINES" "$log_path"
    } > "$sink"

    # Heading line plus the tail lines; remembered for the next erase.
    if [[ "$sink" == "/dev/tty" ]]; then
        TAIL_RENDERED_LINES=$((TAIL_LINES + 1))
    fi
}
|
||||||
|
|
||||||
|
# Periodically redraw the last $ROLLING_OUTPUT_LINES lines of a log file.
#   $1  path to the log file (returns immediately if it does not exist)
#   $2  label used in the heading (default: "Codex")
# Loops forever, sleeping $ROLLING_OUTPUT_INTERVAL seconds between redraws;
# the caller is expected to run it in the background and kill it.
watch_latest_output() {
    local log_path="$1"
    local source_label="${2:-Codex}"
    local sink="/dev/stdout"
    # How the cursor is saved/restored between redraws: none | tput | ansi
    local cursor_mode="none"
    local stamp

    [[ -f "$log_path" ]] || return 0

    if [[ -w /dev/tty ]]; then
        sink="/dev/tty"
        if command -v tput &>/dev/null; then
            cursor_mode="tput"
        else
            cursor_mode="ansi"
        fi
    fi

    # Save the cursor position once; every redraw returns to it.
    case "$cursor_mode" in
        tput)
            tput cr > "$sink"
            tput sc > "$sink"
            ;;
        ansi)
            printf "\r\0337" > "$sink"
            ;;
    esac

    while true; do
        stamp=$(date '+%Y-%m-%d %H:%M:%S')

        # Restore the saved position and clear to the end of the screen.
        case "$cursor_mode" in
            tput)
                tput rc > "$sink"
                tput ed > "$sink"
                tput cr > "$sink"
                ;;
            ansi)
                printf "\0338\033[J\r" > "$sink"
                ;;
        esac

        {
            echo -e "${CYAN}[$stamp] Latest ${source_label} output (last ${ROLLING_OUTPUT_LINES} lines):${NC}"
            if [[ -s "$log_path" ]]; then
                tail -n "$ROLLING_OUTPUT_LINES" "$log_path" 2>/dev/null || true
            else
                echo "(no output yet)"
            fi
            echo ""
        } > "$sink"

        sleep "$ROLLING_OUTPUT_INTERVAL"
    done
}
|
||||||
|
|
||||||
|
# Parse arguments
#   plan [N]               planning mode; N iterations (default 1)
#   N                      build mode with at most N iterations
#   --rlm-context <file>   enable RLM mode with the given context file
#   --rlm [file]           same, defaulting to rlm/context.txt
#   -h | --help            print usage and exit
while [[ $# -gt 0 ]]; do
    case "$1" in
        plan)
            MODE="plan"
            if [[ "${2:-}" =~ ^[0-9]+$ ]]; then
                MAX_ITERATIONS="$2"
                shift 2
            else
                MAX_ITERATIONS=1
                shift
            fi
            ;;
        --rlm-context)
            # Without this check `shift 2` fails when the value is missing
            # and `set -e` ends the script with no explanation.
            if [[ $# -lt 2 ]]; then
                echo -e "${RED}Error: --rlm-context requires a file argument${NC}"
                show_help
                exit 1
            fi
            RLM_CONTEXT_FILE="$2"
            shift 2
            ;;
        --rlm)
            # The file is optional; anything that looks like another flag is
            # left for the next loop pass.
            if [[ -n "${2:-}" && "${2:0:1}" != "-" ]]; then
                RLM_CONTEXT_FILE="$2"
                shift 2
            else
                RLM_CONTEXT_FILE="rlm/context.txt"
                shift
            fi
            ;;
        -h|--help)
            show_help
            exit 0
            ;;
        [0-9]*)
            # The glob only checks the first character; reject values such as
            # "20abc" here instead of failing later in an integer comparison.
            if [[ ! "$1" =~ ^[0-9]+$ ]]; then
                echo -e "${RED}Invalid iteration count: $1${NC}"
                show_help
                exit 1
            fi
            MODE="build"
            MAX_ITERATIONS="$1"
            shift
            ;;
        *)
            echo -e "${RED}Unknown argument: $1${NC}"
            show_help
            exit 1
            ;;
    esac
done
|
||||||
|
|
||||||
|
cd "$PROJECT_DIR"
|
||||||
|
|
||||||
|
# Validate RLM context file (if provided)
|
||||||
|
if [ -n "$RLM_CONTEXT_FILE" ] && [ ! -f "$RLM_CONTEXT_FILE" ]; then
|
||||||
|
echo -e "${RED}Error: RLM context file not found: $RLM_CONTEXT_FILE${NC}"
|
||||||
|
echo "Create it first (example):"
|
||||||
|
echo " mkdir -p rlm && printf \"%s\" \"<your long context>\" > $RLM_CONTEXT_FILE"
|
||||||
|
exit 1
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Initialize RLM workspace (optional)
|
||||||
|
if [ -n "$RLM_CONTEXT_FILE" ]; then
|
||||||
|
mkdir -p "$RLM_TRACE_DIR" "$RLM_QUERIES_DIR" "$RLM_ANSWERS_DIR"
|
||||||
|
if [ ! -f "$RLM_INDEX" ]; then
|
||||||
|
echo -e "timestamp\tmode\titeration\tprompt\tlog\toutput\tstatus" > "$RLM_INDEX"
|
||||||
|
fi
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Session log (captures ALL output)
|
||||||
|
SESSION_LOG="$LOG_DIR/ralph_codex_${MODE}_session_$(date '+%Y%m%d_%H%M%S').log"
|
||||||
|
exec > >(tee -a "$SESSION_LOG") 2>&1
|
||||||
|
|
||||||
|
# Check if Codex CLI is available
|
||||||
|
if ! command -v "$CODEX_CMD" &> /dev/null; then
|
||||||
|
echo -e "${RED}Error: Codex CLI not found${NC}"
|
||||||
|
echo ""
|
||||||
|
echo "Install Codex CLI:"
|
||||||
|
echo " npm install -g @openai/codex"
|
||||||
|
echo ""
|
||||||
|
echo "Then authenticate:"
|
||||||
|
echo " codex login"
|
||||||
|
exit 1
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Determine prompt file
|
||||||
|
if [ "$MODE" = "plan" ]; then
|
||||||
|
PROMPT_FILE="PROMPT_plan.md"
|
||||||
|
else
|
||||||
|
PROMPT_FILE="PROMPT_build.md"
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Create prompt files if they don't exist (same as ralph-loop.sh)
|
||||||
|
if [ ! -f "PROMPT_build.md" ]; then
|
||||||
|
echo -e "${YELLOW}Creating PROMPT_build.md...${NC}"
|
||||||
|
cat > "PROMPT_build.md" << 'BUILDEOF'
|
||||||
|
# Ralph Build Mode
|
||||||
|
|
||||||
|
Based on Geoffrey Huntley's Ralph Wiggum methodology.
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 0: Orient
|
||||||
|
|
||||||
|
Read `.specify/memory/constitution.md` to understand project principles and constraints.
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 1: Discover Work Items
|
||||||
|
|
||||||
|
Search for incomplete work from these sources (in order):
|
||||||
|
|
||||||
|
1. **specs/ folder** — Look for `.md` files NOT marked `## Status: COMPLETE`
|
||||||
|
2. **IMPLEMENTATION_PLAN.md** — If exists, find unchecked `- [ ]` tasks
|
||||||
|
3. **GitHub Issues** — Check for open issues (if this is a GitHub repo)
|
||||||
|
4. **Any task tracker** — Jira, Linear, etc. if configured
|
||||||
|
|
||||||
|
Pick the **HIGHEST PRIORITY** incomplete item:
|
||||||
|
- Lower numbers = higher priority (001 before 010)
|
||||||
|
- `[HIGH]` before `[MEDIUM]` before `[LOW]`
|
||||||
|
- Bugs/blockers before features
|
||||||
|
|
||||||
|
Before implementing, search the codebase to verify it's not already done.
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 1b: Re-Verification Mode (No Incomplete Work Found)
|
||||||
|
|
||||||
|
**If ALL specs appear complete**, don't just exit — do a quality check:
|
||||||
|
|
||||||
|
1. **Randomly pick** one completed spec from `specs/`
|
||||||
|
2. **Strictly re-verify** ALL its acceptance criteria:
|
||||||
|
- Run the actual tests mentioned in the spec
|
||||||
|
- Manually verify each criterion is truly met
|
||||||
|
- Check edge cases
|
||||||
|
- Look for regressions
|
||||||
|
3. **If any criterion fails**: Unmark the spec as complete and fix it
|
||||||
|
4. **If all pass**: Output `<promise>DONE</promise>` to confirm quality
|
||||||
|
|
||||||
|
This ensures the codebase stays healthy even when "nothing to do."
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 2: Implement
|
||||||
|
|
||||||
|
Implement the selected spec/task completely:
|
||||||
|
- Follow the spec's requirements exactly
|
||||||
|
- Write clean, maintainable code
|
||||||
|
- Add tests as needed
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 3: Validate
|
||||||
|
|
||||||
|
Run the project's test suite and verify:
|
||||||
|
- All tests pass
|
||||||
|
- No lint errors
|
||||||
|
- The spec's acceptance criteria are 100% met
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 4: Commit & Update
|
||||||
|
|
||||||
|
1. Mark the spec/task as complete (add `## Status: COMPLETE` to spec file)
|
||||||
|
2. `git add -A`
|
||||||
|
3. `git commit` with a descriptive message
|
||||||
|
4. `git push`
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Completion Signal
|
||||||
|
|
||||||
|
**CRITICAL:** Only output the magic phrase when the work is 100% complete.
|
||||||
|
|
||||||
|
Check:
|
||||||
|
- [ ] Implementation matches all requirements
|
||||||
|
- [ ] All tests pass
|
||||||
|
- [ ] All acceptance criteria verified
|
||||||
|
- [ ] Changes committed and pushed
|
||||||
|
- [ ] Spec marked as complete
|
||||||
|
|
||||||
|
**If ALL checks pass, output:** `<promise>DONE</promise>`
|
||||||
|
|
||||||
|
**If ANY check fails:** Fix the issue and try again. Do NOT output the magic phrase.
|
||||||
|
BUILDEOF
|
||||||
|
fi
|
||||||
|
|
||||||
|
if [ ! -f "PROMPT_plan.md" ]; then
|
||||||
|
echo -e "${YELLOW}Creating PROMPT_plan.md...${NC}"
|
||||||
|
cat > "PROMPT_plan.md" << 'PLANEOF'
|
||||||
|
# Ralph Planning Mode (OPTIONAL)
|
||||||
|
|
||||||
|
This mode is OPTIONAL. Most projects work fine directly from specs.
|
||||||
|
|
||||||
|
Only use this when you want a detailed breakdown of specs into smaller tasks.
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 0: Orient
|
||||||
|
|
||||||
|
0a. Read `.specify/memory/constitution.md` for project principles.
|
||||||
|
|
||||||
|
0b. Study `specs/` to learn all feature specifications.
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 1: Gap Analysis
|
||||||
|
|
||||||
|
Compare specs against current codebase:
|
||||||
|
- What's fully implemented?
|
||||||
|
- What's partially done?
|
||||||
|
- What's not started?
|
||||||
|
- What has issues or bugs?
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 2: Create Plan
|
||||||
|
|
||||||
|
Create `IMPLEMENTATION_PLAN.md` with a prioritized task list:
|
||||||
|
|
||||||
|
```markdown
|
||||||
|
# Implementation Plan
|
||||||
|
|
||||||
|
> Auto-generated breakdown of specs into tasks.
|
||||||
|
> Delete this file to return to working directly from specs.
|
||||||
|
|
||||||
|
## Priority Tasks
|
||||||
|
|
||||||
|
- [ ] [HIGH] Task description - from spec NNN
|
||||||
|
- [ ] [HIGH] Task description - from spec NNN
|
||||||
|
- [ ] [MEDIUM] Task description
|
||||||
|
- [ ] [LOW] Task description
|
||||||
|
|
||||||
|
## Completed
|
||||||
|
|
||||||
|
- [x] Completed task
|
||||||
|
```
|
||||||
|
|
||||||
|
Prioritize by:
|
||||||
|
1. Dependencies (do prerequisites first)
|
||||||
|
2. Impact (high-value features first)
|
||||||
|
3. Complexity (mix easy wins with harder tasks)
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Completion Signal
|
||||||
|
|
||||||
|
When the plan is complete and saved:
|
||||||
|
|
||||||
|
`<promise>DONE</promise>`
|
||||||
|
PLANEOF
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Build Codex flags for exec mode
|
||||||
|
CODEX_FLAGS="exec"
|
||||||
|
if [ "$YOLO_ENABLED" = true ]; then
|
||||||
|
CODEX_FLAGS="$CODEX_FLAGS --dangerously-bypass-approvals-and-sandbox"
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Get current branch
|
||||||
|
CURRENT_BRANCH=$(git branch --show-current 2>/dev/null || echo "main")
|
||||||
|
|
||||||
|
# Check for work sources - count .md files in specs/
|
||||||
|
HAS_SPECS=false
|
||||||
|
SPEC_COUNT=0
|
||||||
|
if [ -d "specs" ]; then
|
||||||
|
SPEC_COUNT=$(find specs -maxdepth 1 -name "*.md" -type f 2>/dev/null | wc -l)
|
||||||
|
[ "$SPEC_COUNT" -gt 0 ] && HAS_SPECS=true
|
||||||
|
fi
|
||||||
|
|
||||||
|
echo ""
|
||||||
|
echo -e "${GREEN}━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━${NC}"
|
||||||
|
echo -e "${GREEN} RALPH LOOP (Codex) STARTING ${NC}"
|
||||||
|
echo -e "${GREEN}━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━${NC}"
|
||||||
|
echo ""
|
||||||
|
echo -e "${BLUE}Mode:${NC} $MODE"
|
||||||
|
echo -e "${BLUE}Prompt:${NC} $PROMPT_FILE"
|
||||||
|
echo -e "${BLUE}Branch:${NC} $CURRENT_BRANCH"
|
||||||
|
echo -e "${YELLOW}YOLO:${NC} $([ "$YOLO_ENABLED" = true ] && echo "ENABLED" || echo "DISABLED")"
|
||||||
|
[ -n "$RLM_CONTEXT_FILE" ] && echo -e "${BLUE}RLM:${NC} $RLM_CONTEXT_FILE"
|
||||||
|
[ -n "$SESSION_LOG" ] && echo -e "${BLUE}Log:${NC} $SESSION_LOG"
|
||||||
|
[ $MAX_ITERATIONS -gt 0 ] && echo -e "${BLUE}Max:${NC} $MAX_ITERATIONS iterations"
|
||||||
|
echo ""
|
||||||
|
echo -e "${BLUE}Work source:${NC}"
|
||||||
|
if [ "$HAS_SPECS" = true ]; then
|
||||||
|
echo -e " ${GREEN}✓${NC} specs/ folder ($SPEC_COUNT specs)"
|
||||||
|
else
|
||||||
|
echo -e " ${RED}✗${NC} specs/ folder (no .md files found)"
|
||||||
|
fi
|
||||||
|
echo ""
|
||||||
|
echo -e "${CYAN}Using: $CODEX_CMD $CODEX_FLAGS${NC}"
|
||||||
|
echo -e "${CYAN}Agent must output <promise>DONE</promise> when complete.${NC}"
|
||||||
|
echo ""
|
||||||
|
echo -e "${YELLOW}Press Ctrl+C to stop the loop${NC}"
|
||||||
|
echo ""
|
||||||
|
|
||||||
|
ITERATION=0
|
||||||
|
CONSECUTIVE_FAILURES=0
|
||||||
|
MAX_CONSECUTIVE_FAILURES=3
|
||||||
|
|
||||||
|
while true; do
|
||||||
|
# Check max iterations
|
||||||
|
if [ $MAX_ITERATIONS -gt 0 ] && [ $ITERATION -ge $MAX_ITERATIONS ]; then
|
||||||
|
echo -e "${GREEN}Reached max iterations: $MAX_ITERATIONS${NC}"
|
||||||
|
break
|
||||||
|
fi
|
||||||
|
|
||||||
|
ITERATION=$((ITERATION + 1))
|
||||||
|
TIMESTAMP=$(date '+%Y-%m-%d %H:%M:%S')
|
||||||
|
|
||||||
|
echo ""
|
||||||
|
echo -e "${PURPLE}════════════════════ LOOP $ITERATION ════════════════════${NC}"
|
||||||
|
echo -e "${BLUE}[$TIMESTAMP]${NC} Starting iteration $ITERATION"
|
||||||
|
echo ""
|
||||||
|
|
||||||
|
# Log file for this iteration
|
||||||
|
LOG_FILE="$LOG_DIR/ralph_codex_${MODE}_iter_${ITERATION}_$(date '+%Y%m%d_%H%M%S').log"
|
||||||
|
OUTPUT_FILE="$LOG_DIR/ralph_codex_output_iter_${ITERATION}_$(date '+%Y%m%d_%H%M%S').txt"
|
||||||
|
RLM_STATUS="unknown"
|
||||||
|
: > "$LOG_FILE"
|
||||||
|
WATCH_PID=""
|
||||||
|
|
||||||
|
if [ "$ROLLING_OUTPUT_INTERVAL" -gt 0 ] && [ "$ROLLING_OUTPUT_LINES" -gt 0 ] && [ -t 1 ] && [ -w /dev/tty ]; then
|
||||||
|
watch_latest_output "$LOG_FILE" "Codex" &
|
||||||
|
WATCH_PID=$!
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Optional RLM context block appended to prompt at runtime
|
||||||
|
EFFECTIVE_PROMPT_FILE="$PROMPT_FILE"
|
||||||
|
if [ -n "$RLM_CONTEXT_FILE" ]; then
|
||||||
|
EFFECTIVE_PROMPT_FILE="$LOG_DIR/ralph_codex_prompt_iter_${ITERATION}_$(date '+%Y%m%d_%H%M%S').md"
|
||||||
|
cat "$PROMPT_FILE" > "$EFFECTIVE_PROMPT_FILE"
|
||||||
|
cat >> "$EFFECTIVE_PROMPT_FILE" << EOF
|
||||||
|
|
||||||
|
---
|
||||||
|
## RLM Context (Optional)
|
||||||
|
|
||||||
|
You have access to a large context file at:
|
||||||
|
**$RLM_CONTEXT_FILE**
|
||||||
|
|
||||||
|
Treat this file as an external environment. Do NOT paste the whole file into the prompt.
|
||||||
|
Instead, inspect it programmatically and recursively:
|
||||||
|
|
||||||
|
- Use small slices:
|
||||||
|
\`\`\`bash
|
||||||
|
sed -n 'START,ENDp' "$RLM_CONTEXT_FILE"
|
||||||
|
\`\`\`
|
||||||
|
- Or Python snippets:
|
||||||
|
\`\`\`bash
|
||||||
|
python - <<'PY'
|
||||||
|
from pathlib import Path
|
||||||
|
p = Path("$RLM_CONTEXT_FILE")
|
||||||
|
print(p.read_text().splitlines()[START:END])
|
||||||
|
PY
|
||||||
|
\`\`\`
|
||||||
|
- Use search:
|
||||||
|
\`\`\`bash
|
||||||
|
rg -n "pattern" "$RLM_CONTEXT_FILE"
|
||||||
|
\`\`\`
|
||||||
|
|
||||||
|
Goal: decompose the task into smaller sub-queries and only load the pieces you need.
|
||||||
|
This mirrors the Recursive Language Model approach from https://arxiv.org/html/2512.24601v1
|
||||||
|
|
||||||
|
## RLM Workspace (Optional)
|
||||||
|
|
||||||
|
Past loop outputs are preserved on disk:
|
||||||
|
- Iteration logs: \`logs/\`
|
||||||
|
- Prompt/output snapshots: \`rlm/trace/\`
|
||||||
|
- Iteration index: \`rlm/index.tsv\`
|
||||||
|
|
||||||
|
Use these as an external memory store (search/slice as needed).
|
||||||
|
If you need a recursive sub-query, write a focused prompt in \`rlm/queries/\`,
|
||||||
|
run:
|
||||||
|
\`./scripts/rlm-subcall.sh --query rlm/queries/<file>.md\`
|
||||||
|
and store the result in \`rlm/answers/\`.
|
||||||
|
EOF
|
||||||
|
RLM_PROMPT_SNAPSHOT="$RLM_TRACE_DIR/iter_${ITERATION}_prompt.md"
|
||||||
|
cp "$EFFECTIVE_PROMPT_FILE" "$RLM_PROMPT_SNAPSHOT"
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Run Codex with exec mode, reading prompt from stdin with "-"
|
||||||
|
# Use --output-last-message to capture the final response for checking
|
||||||
|
echo -e "${BLUE}Running: cat $EFFECTIVE_PROMPT_FILE | $CODEX_CMD $CODEX_FLAGS - --output-last-message $OUTPUT_FILE${NC}"
|
||||||
|
echo ""
|
||||||
|
|
||||||
|
# Run Codex once and classify the outcome of this iteration.
# Sets CODEX_EXIT, RLM_STATUS, DETECTED_SIGNAL and CONSECUTIVE_FAILURES.
CODEX_EXIT=0
# Capture the pipeline status immediately (pipefail makes it reflect a Codex
# failure); any later command would overwrite $?.
# $CODEX_FLAGS is intentionally unquoted so it splits into separate arguments.
cat "$EFFECTIVE_PROMPT_FILE" | "$CODEX_CMD" $CODEX_FLAGS - --output-last-message "$OUTPUT_FILE" 2>&1 | tee "$LOG_FILE" || CODEX_EXIT=$?

# Stop the background watcher, if one was started, before printing results.
if [ -n "$WATCH_PID" ]; then
    kill "$WATCH_PID" 2>/dev/null || true
    wait "$WATCH_PID" 2>/dev/null || true
fi

if [ "$CODEX_EXIT" -eq 0 ]; then
    echo ""
    echo -e "${GREEN}✓ Codex execution completed${NC}"

    # Look for the completion promise (DONE or ALL_DONE), first in the
    # last-message file, then in the full log. `|| true` keeps a no-match
    # grep from tripping `set -e` under pipefail.
    PROMISE_PATTERN='<promise>(ALL_)?DONE</promise>'
    DETECTED_SIGNAL=""
    if [ -f "$OUTPUT_FILE" ]; then
        DETECTED_SIGNAL=$(grep -oE "$PROMISE_PATTERN" "$OUTPUT_FILE" | tail -1) || true
    fi
    if [ -z "$DETECTED_SIGNAL" ]; then
        DETECTED_SIGNAL=$(grep -oE "$PROMISE_PATTERN" "$LOG_FILE" | tail -1) || true
    fi

    if [ -n "$DETECTED_SIGNAL" ]; then
        echo -e "${GREEN}✓ Completion signal detected: ${DETECTED_SIGNAL}${NC}"
        echo -e "${GREEN}✓ Task completed successfully!${NC}"
        CONSECUTIVE_FAILURES=0
        RLM_STATUS="done"

        # Planning is a one-shot task: stop as soon as the plan is reported
        # done, whichever file carried the signal.
        if [ "$MODE" = "plan" ]; then
            echo ""
            echo -e "${GREEN}Planning complete!${NC}"
            break
        fi
    else
        echo -e "${YELLOW}⚠ No completion signal found${NC}"
        echo -e "${YELLOW} Agent did not output <promise>DONE</promise> or <promise>ALL_DONE</promise>${NC}"
        echo -e "${YELLOW} Retrying in next iteration...${NC}"
        CONSECUTIVE_FAILURES=$((CONSECUTIVE_FAILURES + 1))
        RLM_STATUS="incomplete"
        print_latest_output "$LOG_FILE" "Codex"

        if [ "$CONSECUTIVE_FAILURES" -ge "$MAX_CONSECUTIVE_FAILURES" ]; then
            echo ""
            echo -e "${RED}⚠ $MAX_CONSECUTIVE_FAILURES consecutive iterations without completion.${NC}"
            echo -e "${RED} The agent may be stuck. Check logs:${NC}"
            echo -e "${RED} - $LOG_FILE${NC}"
            echo -e "${RED} - $OUTPUT_FILE${NC}"
            # Reset so the warning repeats only after another full streak.
            CONSECUTIVE_FAILURES=0
        fi
    fi
else
    echo -e "${RED}✗ Codex execution failed (exit code: $CODEX_EXIT)${NC}"
    echo -e "${YELLOW}Check log: $LOG_FILE${NC}"
    CONSECUTIVE_FAILURES=$((CONSECUTIVE_FAILURES + 1))
    RLM_STATUS="error"
    print_latest_output "$LOG_FILE" "Codex"
fi
|
||||||
|
|
||||||
|
# Record iteration in RLM index (optional)
# Copies this iteration's log (and last-message file, when present) into the
# trace directory and appends one tab-separated row to the index.
if [ -n "$RLM_CONTEXT_FILE" ]; then
    RLM_PROMPT_PATH="${RLM_PROMPT_SNAPSHOT:-}"
    RLM_OUTPUT_SNAPSHOT="$RLM_TRACE_DIR/iter_${ITERATION}_output.log"
    cp "$LOG_FILE" "$RLM_OUTPUT_SNAPSHOT"

    # Reset every iteration: otherwise an iteration that produced no output
    # file would record the previous iteration's snapshot path.
    RLM_LAST_MESSAGE_SNAPSHOT=""
    if [ -f "$OUTPUT_FILE" ]; then
        RLM_LAST_MESSAGE_SNAPSHOT="$RLM_TRACE_DIR/iter_${ITERATION}_last_message.txt"
        cp "$OUTPUT_FILE" "$RLM_LAST_MESSAGE_SNAPSHOT"
    fi

    # Prefer the last-message snapshot; fall back to the full log snapshot.
    RLM_OUTPUT_PATH="${RLM_LAST_MESSAGE_SNAPSHOT:-$RLM_OUTPUT_SNAPSHOT}"

    # printf writes the fields verbatim; `echo -e` would interpret any
    # backslash sequences contained in the paths.
    printf '%s\t%s\t%s\t%s\t%s\t%s\t%s\n' \
        "$TIMESTAMP" "$MODE" "$ITERATION" "$RLM_PROMPT_PATH" \
        "$LOG_FILE" "$RLM_OUTPUT_PATH" "$RLM_STATUS" >> "$RLM_INDEX"
fi
|
||||||
|
|
||||||
|
# Push changes after each iteration
|
||||||
|
git push origin "$CURRENT_BRANCH" 2>/dev/null || {
|
||||||
|
if git log origin/$CURRENT_BRANCH..HEAD --oneline 2>/dev/null | grep -q .; then
|
||||||
|
git push -u origin "$CURRENT_BRANCH" 2>/dev/null || true
|
||||||
|
fi
|
||||||
|
}
|
||||||
|
|
||||||
|
# Brief pause between iterations
|
||||||
|
echo ""
|
||||||
|
echo -e "${BLUE}Waiting 2s before next iteration...${NC}"
|
||||||
|
sleep 2
|
||||||
|
done
|
||||||
|
|
||||||
|
echo ""
|
||||||
|
echo -e "${GREEN}━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━${NC}"
|
||||||
|
echo -e "${GREEN} RALPH LOOP (Codex) FINISHED ($ITERATION iterations) ${NC}"
|
||||||
|
echo -e "${GREEN}━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━${NC}"
|
||||||
688
scripts/ralph-loop.sh
Executable file
688
scripts/ralph-loop.sh
Executable file
@@ -0,0 +1,688 @@
|
|||||||
|
#!/bin/bash
|
||||||
|
#
|
||||||
|
# Ralph Loop for Claude Code
|
||||||
|
#
|
||||||
|
# Based on Geoffrey Huntley's Ralph Wiggum methodology:
|
||||||
|
# https://github.com/ghuntley/how-to-ralph-wiggum
|
||||||
|
#
|
||||||
|
# Combined with SpecKit-style specifications.
|
||||||
|
#
|
||||||
|
# Key principles:
|
||||||
|
# - Each iteration picks ONE task/spec to work on
|
||||||
|
# - Agent works until acceptance criteria are met
|
||||||
|
# - Only outputs <promise>DONE</promise> when truly complete
|
||||||
|
# - Bash loop checks for magic phrase before continuing
|
||||||
|
# - Fresh context window each iteration
|
||||||
|
#
|
||||||
|
# Work sources (in priority order):
|
||||||
|
# 1. IMPLEMENTATION_PLAN.md (if exists) - pick highest priority task
|
||||||
|
# 2. specs/ folder - pick highest priority incomplete spec
|
||||||
|
#
|
||||||
|
# Usage:
|
||||||
|
# ./scripts/ralph-loop.sh # Build mode (unlimited)
|
||||||
|
# ./scripts/ralph-loop.sh 20 # Build mode (max 20 iterations)
|
||||||
|
# ./scripts/ralph-loop.sh plan # Planning mode (creates IMPLEMENTATION_PLAN.md)
|
||||||
|
#
|
||||||
|
|
||||||
|
set -e
|
||||||
|
set -o pipefail
|
||||||
|
|
||||||
|
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
|
||||||
|
PROJECT_DIR="$(dirname "$SCRIPT_DIR")"
|
||||||
|
LOG_DIR="$PROJECT_DIR/logs"
|
||||||
|
CONSTITUTION="$PROJECT_DIR/.specify/memory/constitution.md"
|
||||||
|
RLM_DIR="$PROJECT_DIR/rlm"
|
||||||
|
RLM_TRACE_DIR="$RLM_DIR/trace"
|
||||||
|
RLM_QUERIES_DIR="$RLM_DIR/queries"
|
||||||
|
RLM_ANSWERS_DIR="$RLM_DIR/answers"
|
||||||
|
RLM_INDEX="$RLM_DIR/index.tsv"
|
||||||
|
|
||||||
|
# Configuration
|
||||||
|
MAX_ITERATIONS=0 # 0 = unlimited
|
||||||
|
MODE="build"
|
||||||
|
CLAUDE_CMD="${CLAUDE_CMD:-claude}"
|
||||||
|
YOLO_FLAG="--dangerously-skip-permissions"
|
||||||
|
RLM_CONTEXT_FILE=""
|
||||||
|
TAIL_LINES=5
|
||||||
|
TAIL_RENDERED_LINES=0
|
||||||
|
ROLLING_OUTPUT_LINES=5
|
||||||
|
ROLLING_OUTPUT_INTERVAL=10
|
||||||
|
ROLLING_RENDERED_LINES=0
|
||||||
|
|
||||||
|
# Colors
|
||||||
|
RED='\033[0;31m'
|
||||||
|
GREEN='\033[0;32m'
|
||||||
|
YELLOW='\033[1;33m'
|
||||||
|
BLUE='\033[0;34m'
|
||||||
|
PURPLE='\033[0;35m'
|
||||||
|
CYAN='\033[0;36m'
|
||||||
|
NC='\033[0m'
|
||||||
|
|
||||||
|
mkdir -p "$LOG_DIR"
|
||||||
|
|
||||||
|
# Check constitution for YOLO setting
|
||||||
|
YOLO_ENABLED=true
|
||||||
|
if [[ -f "$CONSTITUTION" ]]; then
|
||||||
|
if grep -q "YOLO Mode.*DISABLED" "$CONSTITUTION" 2>/dev/null; then
|
||||||
|
YOLO_ENABLED=false
|
||||||
|
fi
|
||||||
|
fi
|
||||||
|
|
||||||
|
show_help() {
|
||||||
|
cat <<EOF
|
||||||
|
Ralph Loop for Claude Code
|
||||||
|
|
||||||
|
Based on Geoffrey Huntley's Ralph Wiggum methodology + SpecKit specs.
|
||||||
|
https://github.com/ghuntley/how-to-ralph-wiggum
|
||||||
|
|
||||||
|
Usage:
|
||||||
|
./scripts/ralph-loop.sh # Build mode, unlimited iterations
|
||||||
|
./scripts/ralph-loop.sh 20 # Build mode, max 20 iterations
|
||||||
|
./scripts/ralph-loop.sh plan # Planning mode (optional)
|
||||||
|
./scripts/ralph-loop.sh --rlm-context ./rlm/context.txt
|
||||||
|
./scripts/ralph-loop.sh --rlm ./rlm/context.txt
|
||||||
|
|
||||||
|
Modes:
|
||||||
|
build (default) Pick spec/task and implement
|
||||||
|
plan Create IMPLEMENTATION_PLAN.md from specs (OPTIONAL)
|
||||||
|
|
||||||
|
Work Sources (checked in order):
|
||||||
|
1. IMPLEMENTATION_PLAN.md - If exists, pick highest priority task
|
||||||
|
2. specs/ folder - Otherwise, pick highest priority incomplete spec
|
||||||
|
|
||||||
|
The plan mode is OPTIONAL. Most projects can work directly from specs.
|
||||||
|
|
||||||
|
RLM Mode (optional):
|
||||||
|
--rlm-context <file> Treat a large context file as external environment.
|
||||||
|
The agent should read slices instead of loading it all.
|
||||||
|
--rlm [file] Shortcut for --rlm-context (defaults to rlm/context.txt)
|
||||||
|
|
||||||
|
How it works:
|
||||||
|
1. Each iteration feeds the mode's prompt file (PROMPT_build.md or PROMPT_plan.md) to Claude via stdin
|
||||||
|
2. Claude picks the HIGHEST PRIORITY incomplete spec/task
|
||||||
|
3. Claude implements, tests, and verifies acceptance criteria
|
||||||
|
4. Claude outputs <promise>DONE</promise> ONLY if criteria are met
|
||||||
|
5. Bash loop checks for the magic phrase
|
||||||
|
6. If found, loop continues to next iteration (fresh context)
|
||||||
|
7. If not found, loop retries
|
||||||
|
|
||||||
|
RLM workspace (when enabled):
|
||||||
|
- rlm/trace/ Prompt snapshots + outputs per iteration
|
||||||
|
- rlm/index.tsv Index of all iterations (timestamp, prompt, log, status)
|
||||||
|
- rlm/queries/ and rlm/answers/ For optional recursive sub-queries
|
||||||
|
|
||||||
|
EOF
|
||||||
|
}
|
||||||
|
|
||||||
|
# Print the last $TAIL_LINES lines of a log file, preferring the controlling
# terminal over stdout.
#
# Arguments:
#   $1 - path to the log file; the function is a no-op if it does not exist
#   $2 - label shown in the heading (default: "Claude")
# Globals:
#   TAIL_LINES           (read)       number of trailing lines to show
#   TAIL_RENDERED_LINES  (read/write) lines drawn on the terminal by the
#                                     previous call; used to erase that output
print_latest_output() {
    local log_file="$1"
    local label="${2:-Claude}"
    local target="/dev/tty"

    [ -f "$log_file" ] || return 0

    # `[ -w /dev/tty ]` only consults permission bits, and the device node is
    # typically writable even when the process has no controlling terminal
    # (cron, CI, nohup). Actually opening it is the reliable probe; without
    # this the redirects below fail and `set -e` aborts the whole loop.
    if ! { : > "$target"; } 2>/dev/null; then
        target="/dev/stdout"
    fi

    if [ "$target" = "/dev/tty" ] && [ "$TAIL_RENDERED_LINES" -gt 0 ]; then
        # Cursor up over the previously rendered block, then clear to end of screen.
        printf "\033[%dA\033[J" "$TAIL_RENDERED_LINES" > "$target"
    fi

    {
        echo "Latest ${label} output (last ${TAIL_LINES} lines):"
        tail -n "$TAIL_LINES" "$log_file"
    } > "$target"

    if [ "$target" = "/dev/tty" ]; then
        # Heading line plus the requested number of tail lines.
        TAIL_RENDERED_LINES=$((TAIL_LINES + 1))
    fi
}
|
||||||
|
|
||||||
|
# Continuously redraw a rolling tail of a log file until the caller kills it.
#
# Intended to be started in the background; the loop never returns on its own.
#
# Arguments:
#   $1 - path to the log file; returns immediately if it does not exist
#   $2 - label shown in the heading (default: "Claude")
# Globals (read):
#   ROLLING_OUTPUT_LINES     number of trailing lines to show per refresh
#   ROLLING_OUTPUT_INTERVAL  seconds to sleep between refreshes
#   CYAN, NC                 colour escape sequences
watch_latest_output() {
    local log_file="$1"
    local label="${2:-Claude}"
    local target="/dev/tty"
    local use_tty=false
    local use_tput=false
    local timestamp

    [ -f "$log_file" ] || return 0

    # Probe the terminal by opening it: `[ -w /dev/tty ]` only checks
    # permission bits and can succeed when no controlling terminal exists.
    if { : > "$target"; } 2>/dev/null; then
        use_tty=true
        if command -v tput &>/dev/null; then
            use_tput=true
        fi
    else
        target="/dev/stdout"
    fi

    # Remember where the rolling block starts so each refresh can overwrite it.
    if [ "$use_tty" = true ]; then
        if [ "$use_tput" = true ]; then
            tput cr > "$target"
            tput sc > "$target"
        else
            printf "\r\0337" > "$target"
        fi
    fi

    while true; do
        timestamp=$(date '+%Y-%m-%d %H:%M:%S')

        # Jump back to the saved position and wipe the previous rendering.
        if [ "$use_tty" = true ]; then
            if [ "$use_tput" = true ]; then
                tput rc > "$target"
                tput ed > "$target"
                tput cr > "$target"
            else
                printf "\0338\033[J\r" > "$target"
            fi
        fi

        {
            echo -e "${CYAN}[$timestamp] Latest ${label} output (last ${ROLLING_OUTPUT_LINES} lines):${NC}"
            if [ ! -s "$log_file" ]; then
                echo "(no output yet)"
            else
                # The log may be rotated or truncated mid-read; never fail the watcher.
                tail -n "$ROLLING_OUTPUT_LINES" "$log_file" 2>/dev/null || true
            fi
            echo ""
        } > "$target"

        sleep "$ROLLING_OUTPUT_INTERVAL"
    done
}
|
||||||
|
|
||||||
|
# Parse arguments
|
||||||
|
# Parse command-line arguments.
#
#   plan [N]              planning mode, N iterations (default 1)
#   N                     build mode, at most N iterations
#   --rlm-context <file>  enable RLM mode with the given context file
#   --rlm [file]          same, defaulting to rlm/context.txt
#   -h | --help           print usage and exit
while [[ $# -gt 0 ]]; do
    case "$1" in
        plan)
            MODE="plan"
            if [[ "${2:-}" =~ ^[0-9]+$ ]]; then
                MAX_ITERATIONS="$2"
                shift 2
            else
                MAX_ITERATIONS=1
                shift
            fi
            ;;
        --rlm-context)
            # Without this guard `shift 2` fails when the flag is the last
            # argument, and `set -e` ends the script with no message at all.
            if [[ $# -lt 2 ]]; then
                echo -e "${RED}Error: --rlm-context requires a file argument${NC}"
                show_help
                exit 1
            fi
            RLM_CONTEXT_FILE="${2:-}"
            shift 2
            ;;
        --rlm)
            # The file is optional: only consume the next word if it is not another flag.
            if [[ -n "${2:-}" && "${2:0:1}" != "-" ]]; then
                RLM_CONTEXT_FILE="$2"
                shift 2
            else
                RLM_CONTEXT_FILE="rlm/context.txt"
                shift
            fi
            ;;
        -h|--help)
            show_help
            exit 0
            ;;
        [0-9]*)
            # The glob above also matches values such as "20abc"; those would
            # break every later integer comparison on MAX_ITERATIONS and turn
            # the run into an unlimited loop, so require digits only.
            if [[ ! "$1" =~ ^[0-9]+$ ]]; then
                echo -e "${RED}Unknown argument: $1${NC}"
                show_help
                exit 1
            fi
            MODE="build"
            MAX_ITERATIONS="$1"
            shift
            ;;
        *)
            echo -e "${RED}Unknown argument: $1${NC}"
            show_help
            exit 1
            ;;
    esac
done
|
||||||
|
|
||||||
|
cd "$PROJECT_DIR"
|
||||||
|
|
||||||
|
# Validate RLM context file (if provided)
|
||||||
|
if [ -n "$RLM_CONTEXT_FILE" ] && [ ! -f "$RLM_CONTEXT_FILE" ]; then
|
||||||
|
echo -e "${RED}Error: RLM context file not found: $RLM_CONTEXT_FILE${NC}"
|
||||||
|
echo "Create it first (example):"
|
||||||
|
echo " mkdir -p rlm && printf \"%s\" \"<your long context>\" > $RLM_CONTEXT_FILE"
|
||||||
|
exit 1
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Initialize RLM workspace (optional)
|
||||||
|
if [ -n "$RLM_CONTEXT_FILE" ]; then
|
||||||
|
mkdir -p "$RLM_TRACE_DIR" "$RLM_QUERIES_DIR" "$RLM_ANSWERS_DIR"
|
||||||
|
if [ ! -f "$RLM_INDEX" ]; then
|
||||||
|
echo -e "timestamp\tmode\titeration\tprompt\tlog\toutput\tstatus" > "$RLM_INDEX"
|
||||||
|
fi
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Session log (captures ALL output)
|
||||||
|
SESSION_LOG="$LOG_DIR/ralph_${MODE}_session_$(date '+%Y%m%d_%H%M%S').log"
|
||||||
|
exec > >(tee -a "$SESSION_LOG") 2>&1
|
||||||
|
|
||||||
|
# Check if Claude CLI is available
|
||||||
|
if ! command -v "$CLAUDE_CMD" &> /dev/null; then
|
||||||
|
echo -e "${RED}Error: Claude CLI not found${NC}"
|
||||||
|
echo ""
|
||||||
|
echo "Install Claude Code CLI and authenticate first."
|
||||||
|
echo "https://claude.ai/code"
|
||||||
|
exit 1
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Determine which prompt to use based on mode and available files
|
||||||
|
if [ "$MODE" = "plan" ]; then
|
||||||
|
PROMPT_FILE="PROMPT_plan.md"
|
||||||
|
else
|
||||||
|
PROMPT_FILE="PROMPT_build.md"
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Create/update the build prompt to be flexible about plan vs specs
|
||||||
|
cat > "PROMPT_build.md" << 'BUILDEOF'
|
||||||
|
# Ralph Build Mode
|
||||||
|
|
||||||
|
Based on Geoffrey Huntley's Ralph Wiggum methodology.
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 0: Orient
|
||||||
|
|
||||||
|
Read `.specify/memory/constitution.md` to understand project principles and constraints.
|
||||||
|
|
||||||
|
---
|
||||||
|
BUILDEOF
|
||||||
|
|
||||||
|
# Optional RLM context block
|
||||||
|
# Optional RLM section of the build prompt.
#
# The heredoc delimiter is intentionally unquoted so that $RLM_CONTEXT_FILE is
# expanded into the prompt text. In an unquoted heredoc a backtick still starts
# command substitution, so every literal Markdown backtick is written as \` --
# otherwise the fenced snippets and the inline rlm-subcall.sh command would be
# executed while the prompt is being generated instead of being written to it.
if [ -n "$RLM_CONTEXT_FILE" ]; then
    cat >> "PROMPT_build.md" << EOF

## Phase 0d: RLM Context (Optional)

You have access to a large context file at:
**$RLM_CONTEXT_FILE**

Treat this file as an external environment. Do NOT paste the whole file into the prompt.
Instead, inspect it programmatically and recursively:

- Use small slices:
\`\`\`bash
sed -n 'START,ENDp' "$RLM_CONTEXT_FILE"
\`\`\`
- Or Python snippets:
\`\`\`bash
python - <<'PY'
from pathlib import Path
p = Path("$RLM_CONTEXT_FILE")
print(p.read_text().splitlines()[START:END])
PY
\`\`\`
- Use search:
\`\`\`bash
rg -n "pattern" "$RLM_CONTEXT_FILE"
\`\`\`

Goal: decompose the task into smaller sub-queries and only load the pieces you need.
This mirrors the Recursive Language Model approach from https://arxiv.org/html/2512.24601v1

## RLM Workspace (Optional)

Past loop outputs are preserved on disk:
- Iteration logs: \`logs/\`
- Prompt/output snapshots: \`rlm/trace/\`
- Iteration index: \`rlm/index.tsv\`

Use these as an external memory store (search/slice as needed).
If you need a recursive sub-query, write a focused prompt in \`rlm/queries/\`,
run:
\`./scripts/rlm-subcall.sh --query rlm/queries/<file>.md\`
and store the result in \`rlm/answers/\`.
EOF
fi
|
||||||
|
|
||||||
|
cat >> "PROMPT_build.md" << 'BUILDEOF'
|
||||||
|
|
||||||
|
## Phase 1: Discover Work Items
|
||||||
|
|
||||||
|
Search for incomplete work from these sources (in order):
|
||||||
|
|
||||||
|
1. **specs/ folder** — Look for `.md` files NOT marked `## Status: COMPLETE`
|
||||||
|
2. **IMPLEMENTATION_PLAN.md** — If exists, find unchecked `- [ ]` tasks
|
||||||
|
3. **GitHub Issues** — Check for open issues (if this is a GitHub repo)
|
||||||
|
4. **Any task tracker** — Jira, Linear, etc. if configured
|
||||||
|
|
||||||
|
Pick the **HIGHEST PRIORITY** incomplete item:
|
||||||
|
- Lower numbers = higher priority (001 before 010)
|
||||||
|
- `[HIGH]` before `[MEDIUM]` before `[LOW]`
|
||||||
|
- Bugs/blockers before features
|
||||||
|
|
||||||
|
Before implementing, search the codebase to verify it's not already done.
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 1b: Re-Verification Mode (No Incomplete Work Found)
|
||||||
|
|
||||||
|
**If ALL specs appear complete**, don't just exit — do a quality check:
|
||||||
|
|
||||||
|
1. **Randomly pick** one completed spec from `specs/`
|
||||||
|
2. **Strictly re-verify** ALL its acceptance criteria:
|
||||||
|
- Run the actual tests mentioned in the spec
|
||||||
|
- Manually verify each criterion is truly met
|
||||||
|
- Check edge cases
|
||||||
|
- Look for regressions
|
||||||
|
3. **If any criterion fails**: Unmark the spec as complete and fix it
|
||||||
|
4. **If all pass**: Output `<promise>DONE</promise>` to confirm quality
|
||||||
|
|
||||||
|
This ensures the codebase stays healthy even when "nothing to do."
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 2: Implement
|
||||||
|
|
||||||
|
Implement the selected spec/task completely:
|
||||||
|
- Follow the spec's requirements exactly
|
||||||
|
- Write clean, maintainable code
|
||||||
|
- Add tests as needed
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 3: Validate
|
||||||
|
|
||||||
|
Run the project's test suite and verify:
|
||||||
|
- All tests pass
|
||||||
|
- No lint errors
|
||||||
|
- The spec's acceptance criteria are 100% met
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 4: Commit & Update
|
||||||
|
|
||||||
|
1. Mark the spec/task as complete (add `## Status: COMPLETE` to spec file)
|
||||||
|
2. `git add -A`
|
||||||
|
3. `git commit` with a descriptive message
|
||||||
|
4. `git push`
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Completion Signal
|
||||||
|
|
||||||
|
**CRITICAL:** Only output the magic phrase when the work is 100% complete.
|
||||||
|
|
||||||
|
Check:
|
||||||
|
- [ ] Implementation matches all requirements
|
||||||
|
- [ ] All tests pass
|
||||||
|
- [ ] All acceptance criteria verified
|
||||||
|
- [ ] Changes committed and pushed
|
||||||
|
- [ ] Spec marked as complete
|
||||||
|
|
||||||
|
**If ALL checks pass, output:** `<promise>DONE</promise>`
|
||||||
|
|
||||||
|
**If ANY check fails:** Fix the issue and try again. Do NOT output the magic phrase.
|
||||||
|
BUILDEOF
|
||||||
|
|
||||||
|
# Create planning prompt (only used if plan mode is explicitly requested)
|
||||||
|
cat > "PROMPT_plan.md" << 'PLANEOF'
|
||||||
|
# Ralph Planning Mode (OPTIONAL)
|
||||||
|
|
||||||
|
This mode is OPTIONAL. Most projects work fine directly from specs.
|
||||||
|
|
||||||
|
Only use this when you want a detailed breakdown of specs into smaller tasks.
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 0: Orient
|
||||||
|
|
||||||
|
0a. Read `.specify/memory/constitution.md` for project principles.
|
||||||
|
|
||||||
|
0b. Study `specs/` to learn all feature specifications.
|
||||||
|
|
||||||
|
---
|
||||||
|
PLANEOF
|
||||||
|
|
||||||
|
# Optional RLM context block for planning
|
||||||
|
# Optional RLM section of the planning prompt.
#
# The heredoc delimiter is intentionally unquoted so that $RLM_CONTEXT_FILE is
# expanded. Literal Markdown backticks are escaped as \` because an unquoted
# heredoc would otherwise treat them as command substitution and try to run
# their contents while generating the prompt.
if [ -n "$RLM_CONTEXT_FILE" ]; then
    cat >> "PROMPT_plan.md" << EOF

## Phase 0c: RLM Context (Optional)

You have access to a large context file at:
**$RLM_CONTEXT_FILE**

Treat this file as an external environment. Do NOT paste the whole file into the prompt.
Inspect only the slices you need using shell tools or Python.
This mirrors the Recursive Language Model approach from https://arxiv.org/html/2512.24601v1

## RLM Workspace (Optional)

Past loop outputs are preserved on disk:
- Iteration logs: \`logs/\`
- Prompt/output snapshots: \`rlm/trace/\`
- Iteration index: \`rlm/index.tsv\`

Use these as an external memory store (search/slice as needed).
For recursive sub-queries, use:
\`./scripts/rlm-subcall.sh --query rlm/queries/<file>.md\`
EOF
fi
|
||||||
|
|
||||||
|
cat >> "PROMPT_plan.md" << 'PLANEOF'
|
||||||
|
|
||||||
|
## Phase 1: Gap Analysis
|
||||||
|
|
||||||
|
Compare specs against current codebase:
|
||||||
|
- What's fully implemented?
|
||||||
|
- What's partially done?
|
||||||
|
- What's not started?
|
||||||
|
- What has issues or bugs?
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Phase 2: Create Plan
|
||||||
|
|
||||||
|
Create `IMPLEMENTATION_PLAN.md` with a prioritized task list:
|
||||||
|
|
||||||
|
```markdown
|
||||||
|
# Implementation Plan
|
||||||
|
|
||||||
|
> Auto-generated breakdown of specs into tasks.
|
||||||
|
> Delete this file to return to working directly from specs.
|
||||||
|
|
||||||
|
## Priority Tasks
|
||||||
|
|
||||||
|
- [ ] [HIGH] Task description - from spec NNN
|
||||||
|
- [ ] [HIGH] Task description - from spec NNN
|
||||||
|
- [ ] [MEDIUM] Task description
|
||||||
|
- [ ] [LOW] Task description
|
||||||
|
|
||||||
|
## Completed
|
||||||
|
|
||||||
|
- [x] Completed task
|
||||||
|
```
|
||||||
|
|
||||||
|
Prioritize by:
|
||||||
|
1. Dependencies (do prerequisites first)
|
||||||
|
2. Impact (high-value features first)
|
||||||
|
3. Complexity (mix easy wins with harder tasks)
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Completion Signal
|
||||||
|
|
||||||
|
When the plan is complete and saved:
|
||||||
|
|
||||||
|
`<promise>DONE</promise>`
|
||||||
|
PLANEOF
|
||||||
|
|
||||||
|
# Check prompt file exists
|
||||||
|
if [ ! -f "$PROMPT_FILE" ]; then
|
||||||
|
echo -e "${RED}Error: $PROMPT_FILE not found${NC}"
|
||||||
|
exit 1
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Build Claude flags
|
||||||
|
CLAUDE_FLAGS="-p"
|
||||||
|
if [ "$YOLO_ENABLED" = true ]; then
|
||||||
|
CLAUDE_FLAGS="$CLAUDE_FLAGS $YOLO_FLAG"
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Get current branch
|
||||||
|
CURRENT_BRANCH=$(git branch --show-current 2>/dev/null || echo "main")
|
||||||
|
|
||||||
|
# Check for work sources - count .md files in specs/
|
||||||
|
HAS_PLAN=false
|
||||||
|
HAS_SPECS=false
|
||||||
|
SPEC_COUNT=0
|
||||||
|
[ -f "IMPLEMENTATION_PLAN.md" ] && HAS_PLAN=true
|
||||||
|
if [ -d "specs" ]; then
|
||||||
|
SPEC_COUNT=$(find specs -maxdepth 1 -name "*.md" -type f 2>/dev/null | wc -l)
|
||||||
|
[ "$SPEC_COUNT" -gt 0 ] && HAS_SPECS=true
|
||||||
|
fi
|
||||||
|
|
||||||
|
echo ""
|
||||||
|
echo -e "${GREEN}━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━${NC}"
|
||||||
|
echo -e "${GREEN} RALPH LOOP (Claude Code) STARTING ${NC}"
|
||||||
|
echo -e "${GREEN}━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━${NC}"
|
||||||
|
echo ""
|
||||||
|
echo -e "${BLUE}Mode:${NC} $MODE"
|
||||||
|
echo -e "${BLUE}Prompt:${NC} $PROMPT_FILE"
|
||||||
|
echo -e "${BLUE}Branch:${NC} $CURRENT_BRANCH"
|
||||||
|
echo -e "${YELLOW}YOLO:${NC} $([ "$YOLO_ENABLED" = true ] && echo "ENABLED" || echo "DISABLED")"
|
||||||
|
[ -n "$RLM_CONTEXT_FILE" ] && echo -e "${BLUE}RLM:${NC} $RLM_CONTEXT_FILE"
|
||||||
|
[ -n "$SESSION_LOG" ] && echo -e "${BLUE}Log:${NC} $SESSION_LOG"
|
||||||
|
[ $MAX_ITERATIONS -gt 0 ] && echo -e "${BLUE}Max:${NC} $MAX_ITERATIONS iterations"
|
||||||
|
echo ""
|
||||||
|
echo -e "${BLUE}Work source:${NC}"
|
||||||
|
if [ "$HAS_PLAN" = true ]; then
|
||||||
|
echo -e " ${GREEN}✓${NC} IMPLEMENTATION_PLAN.md (will use this)"
|
||||||
|
else
|
||||||
|
echo -e " ${YELLOW}○${NC} IMPLEMENTATION_PLAN.md (not found, that's OK)"
|
||||||
|
fi
|
||||||
|
if [ "$HAS_SPECS" = true ]; then
|
||||||
|
echo -e " ${GREEN}✓${NC} specs/ folder ($SPEC_COUNT specs)"
|
||||||
|
else
|
||||||
|
echo -e " ${RED}✗${NC} specs/ folder (no .md files found)"
|
||||||
|
fi
|
||||||
|
echo ""
|
||||||
|
echo -e "${CYAN}The loop checks for <promise>DONE</promise> in each iteration.${NC}"
|
||||||
|
echo -e "${CYAN}Agent must verify acceptance criteria before outputting it.${NC}"
|
||||||
|
echo ""
|
||||||
|
echo -e "${YELLOW}Press Ctrl+C to stop the loop${NC}"
|
||||||
|
echo ""
|
||||||
|
|
||||||
|
# ---------------------------------------------------------------------------
# Main iteration loop.
#
# Each pass feeds $PROMPT_FILE to the Claude CLI, captures its output in a
# per-iteration log, looks for the <promise>DONE</promise> completion signal,
# optionally records the iteration in the RLM index, and pushes the branch.
# The loop ends when MAX_ITERATIONS is reached (0 = unlimited) or, in plan
# mode, after the first iteration that emits the completion signal.
# ---------------------------------------------------------------------------
ITERATION=0
CONSECUTIVE_FAILURES=0
MAX_CONSECUTIVE_FAILURES=3
WATCH_PID=""

# Stop the background rolling-output watcher of the current iteration, if any.
stop_output_watcher() {
    if [ -n "${WATCH_PID:-}" ]; then
        kill "$WATCH_PID" 2>/dev/null || true
        wait "$WATCH_PID" 2>/dev/null || true
        WATCH_PID=""
    fi
}

# Background jobs of a non-interactive shell ignore SIGINT, so without this
# trap the watcher would keep writing to the terminal after Ctrl+C.
trap stop_output_watcher EXIT

while true; do
    # Check max iterations
    if [ "$MAX_ITERATIONS" -gt 0 ] && [ "$ITERATION" -ge "$MAX_ITERATIONS" ]; then
        echo -e "${GREEN}Reached max iterations: $MAX_ITERATIONS${NC}"
        break
    fi

    ITERATION=$((ITERATION + 1))
    TIMESTAMP=$(date '+%Y-%m-%d %H:%M:%S')

    echo ""
    echo -e "${PURPLE}════════════════════ LOOP $ITERATION ════════════════════${NC}"
    echo -e "${BLUE}[$TIMESTAMP]${NC} Starting iteration $ITERATION"
    echo ""

    # Log file for this iteration
    LOG_FILE="$LOG_DIR/ralph_${MODE}_iter_${ITERATION}_$(date '+%Y%m%d_%H%M%S').log"
    : > "$LOG_FILE"
    WATCH_PID=""

    # stdout was redirected through `tee` earlier in the script, so `[ -t 1 ]`
    # can never be true here and the watcher would never start. Probe the
    # controlling terminal directly by opening it instead.
    if [ "$ROLLING_OUTPUT_INTERVAL" -gt 0 ] && [ "$ROLLING_OUTPUT_LINES" -gt 0 ] \
        && { : > /dev/tty; } 2>/dev/null; then
        watch_latest_output "$LOG_FILE" "Claude" &
        WATCH_PID=$!
    fi
    RLM_STATUS="unknown"

    # Snapshot prompt (optional RLM workspace)
    if [ -n "$RLM_CONTEXT_FILE" ]; then
        RLM_PROMPT_SNAPSHOT="$RLM_TRACE_DIR/iter_${ITERATION}_prompt.md"
        cp "$PROMPT_FILE" "$RLM_PROMPT_SNAPSHOT"
    fi

    # Run Claude with prompt via stdin, capture output.
    # $CLAUDE_FLAGS is deliberately unquoted: it holds several space-separated flags.
    # `set -o pipefail` makes a non-zero Claude exit select the else branch.
    CLAUDE_OUTPUT=""
    if CLAUDE_OUTPUT=$("$CLAUDE_CMD" $CLAUDE_FLAGS < "$PROMPT_FILE" 2>&1 | tee "$LOG_FILE"); then
        stop_output_watcher
        echo ""
        echo -e "${GREEN}✓ Claude execution completed${NC}"

        # Check if DONE promise was output (accept both DONE and ALL_DONE variants)
        if echo "$CLAUDE_OUTPUT" | grep -qE "<promise>(ALL_)?DONE</promise>"; then
            DETECTED_SIGNAL=$(echo "$CLAUDE_OUTPUT" | grep -oE "<promise>(ALL_)?DONE</promise>" | tail -1)
            echo -e "${GREEN}✓ Completion signal detected: ${DETECTED_SIGNAL}${NC}"
            echo -e "${GREEN}✓ Task completed successfully!${NC}"
            CONSECUTIVE_FAILURES=0
            RLM_STATUS="done"

            # For planning mode, stop after one successful plan
            if [ "$MODE" = "plan" ]; then
                echo ""
                echo -e "${GREEN}Planning complete!${NC}"
                echo -e "${CYAN}Run './scripts/ralph-loop.sh' to start building.${NC}"
                echo -e "${CYAN}Or delete IMPLEMENTATION_PLAN.md to work directly from specs.${NC}"
                break
            fi
        else
            echo -e "${YELLOW}⚠ No completion signal found${NC}"
            echo -e "${YELLOW} Agent did not output <promise>DONE</promise> or <promise>ALL_DONE</promise>${NC}"
            echo -e "${YELLOW} This means acceptance criteria were not met.${NC}"
            echo -e "${YELLOW} Retrying in next iteration...${NC}"
            CONSECUTIVE_FAILURES=$((CONSECUTIVE_FAILURES + 1))
            RLM_STATUS="incomplete"
            print_latest_output "$LOG_FILE" "Claude"

            # Warn (but keep looping) once the agent appears to be stuck.
            if [ "$CONSECUTIVE_FAILURES" -ge "$MAX_CONSECUTIVE_FAILURES" ]; then
                echo ""
                echo -e "${RED}⚠ $MAX_CONSECUTIVE_FAILURES consecutive iterations without completion.${NC}"
                echo -e "${RED} The agent may be stuck. Consider:${NC}"
                echo -e "${RED} - Checking the logs in $LOG_DIR${NC}"
                echo -e "${RED} - Simplifying the current spec${NC}"
                echo -e "${RED} - Manually fixing blocking issues${NC}"
                echo ""
                CONSECUTIVE_FAILURES=0
            fi
        fi
    else
        stop_output_watcher
        echo -e "${RED}✗ Claude execution failed${NC}"
        echo -e "${YELLOW}Check log: $LOG_FILE${NC}"
        CONSECUTIVE_FAILURES=$((CONSECUTIVE_FAILURES + 1))
        RLM_STATUS="error"
        print_latest_output "$LOG_FILE" "Claude"
    fi

    # Record iteration in RLM index (optional)
    if [ -n "$RLM_CONTEXT_FILE" ]; then
        RLM_PROMPT_PATH="${RLM_PROMPT_SNAPSHOT:-}"
        RLM_OUTPUT_SNAPSHOT="$RLM_TRACE_DIR/iter_${ITERATION}_output.log"
        cp "$LOG_FILE" "$RLM_OUTPUT_SNAPSHOT"
        echo -e "${TIMESTAMP}\t${MODE}\t${ITERATION}\t${RLM_PROMPT_PATH}\t${LOG_FILE}\t${RLM_OUTPUT_SNAPSHOT}\t${RLM_STATUS}" >> "$RLM_INDEX"
    fi

    # Push changes after each iteration (if any). If the plain push fails and
    # there are local commits the remote branch lacks, retry with upstream
    # tracking; push failures never abort the loop.
    git push origin "$CURRENT_BRANCH" 2>/dev/null || {
        if git log "origin/$CURRENT_BRANCH..HEAD" --oneline 2>/dev/null | grep -q .; then
            echo -e "${YELLOW}Push failed, creating remote branch...${NC}"
            git push -u origin "$CURRENT_BRANCH" 2>/dev/null || true
        fi
    }

    # Brief pause between iterations
    echo ""
    echo -e "${BLUE}Waiting 2s before next iteration...${NC}"
    sleep 2
done
|
||||||
|
|
||||||
|
echo ""
|
||||||
|
echo -e "${GREEN}━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━${NC}"
|
||||||
|
echo -e "${GREEN} RALPH LOOP FINISHED ($ITERATION iterations) ${NC}"
|
||||||
|
echo -e "${GREEN}━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━${NC}"
|
||||||
41
specs/001-core-ui-camera.md
Normal file
41
specs/001-core-ui-camera.md
Normal file
@@ -0,0 +1,41 @@
|
|||||||
|
# Feature: Core UI and Camera Feed (PyObjC)
|
||||||
|
|
||||||
|
## Status: COMPLETE
|
||||||
|
|
||||||
|
## Description
|
||||||
|
Create the main application window using PyObjC (AppKit) and display a live camera feed. This ensures a native macOS look and feel.
|
||||||
|
|
||||||
|
## Requirements
|
||||||
|
|
||||||
|
1. **App & Window Setup (AppKit)**:
|
||||||
|
- Initialize `NSApplication`.
|
||||||
|
- Create a main `NSWindow` titled "ItemSense".
|
||||||
|
- Size: 800x600 (resizable).
|
||||||
|
- Window should center on screen.
|
||||||
|
|
||||||
|
2. **UI Layout**:
|
||||||
|
- Use `NSStackView` (vertical) or manual constraints to layout:
|
||||||
|
- Top: Video Feed (`NSImageView`).
|
||||||
|
- Bottom: "Capture" button (`NSButton`).
|
||||||
|
|
||||||
|
3. **Camera Feed**:
|
||||||
|
- Use `opencv-python` to capture frames from webcam (index 0).
|
||||||
|
- Convert frames (`cv2` BGR -> RGB) to `NSImage/CGImage`.
|
||||||
|
- Update the `NSImageView` at ~30 FPS using a timer (`NSTimer` or equivalent app loop integration).
|
||||||
|
|
||||||
|
4. **Capture Button**:
|
||||||
|
- Standard macOS Push Button.
|
||||||
|
- Label: "Capture".
|
||||||
|
- Action: Print "Capture clicked" to console.
|
||||||
|
|
||||||
|
5. **Lifecycle**:
|
||||||
|
- Ensure `Cmd+Q` works.
|
||||||
|
- Ensure closing the window terminates the app (or at least the `applicationShouldTerminateAfterLastWindowClosed:` delegate method returns True).
|
||||||
|
|
||||||
|
## Acceptance Criteria
|
||||||
|
|
||||||
|
- [ ] App launches with a native macOS window "ItemSense".
|
||||||
|
- [ ] Live camera feed is visible in the view.
|
||||||
|
- [ ] "Capture" button is visible at the bottom.
|
||||||
|
- [ ] Clicking "Capture" prints to console.
|
||||||
|
- [ ] App exits cleanly on window close or Cmd+Q.
|
||||||
29
specs/002-openai-integration.md
Normal file
29
specs/002-openai-integration.md
Normal file
@@ -0,0 +1,29 @@
|
|||||||
|
# Feature: OpenAI Vision Integration (PyObjC)
|
||||||
|
|
||||||
|
## Description
|
||||||
|
Implement the logic to capture a frame from the AppKit interface and send it to OpenAI's API.
|
||||||
|
|
||||||
|
## Requirements
|
||||||
|
|
||||||
|
1. **Image Handling**:
|
||||||
|
- On "Capture" click:
|
||||||
|
- Stop/Pause the live feed update.
|
||||||
|
- Store the current frame (in memory).
|
||||||
|
- Show "Processing..." (maybe change button text or add a label).
|
||||||
|
|
||||||
|
2. **OpenAI API Call**:
|
||||||
|
- Handle the request asynchronously so the UI thread is never blocked (no spinning beachball).
|
||||||
|
- Run the API request in a background thread (`threading`).
|
||||||
|
- Model: `gpt-5-mini` (fallback `gpt-4o-mini`).
|
||||||
|
- Prompt: "What is this item? Please provide a brief description."
|
||||||
|
|
||||||
|
3. **Response Handling**:
|
||||||
|
- When response returns, schedule a UI update on the main thread (`performSelectorOnMainThread:` or `dispatch_async`).
|
||||||
|
- Print response to console (UI display comes in Spec 003).
|
||||||
|
|
||||||
|
## Acceptance Criteria
|
||||||
|
|
||||||
|
- [ ] UI remains responsive (no beachball) during API call.
|
||||||
|
- [ ] "Processing..." indication is shown.
|
||||||
|
- [ ] Image frame is correctly sent to OpenAI.
|
||||||
|
- [ ] Text response is received and printed to console.
|
||||||
25
specs/003-result-display.md
Normal file
25
specs/003-result-display.md
Normal file
@@ -0,0 +1,25 @@
|
|||||||
|
# Feature: Result Display (PyObjC)
|
||||||
|
|
||||||
|
## Description
|
||||||
|
Display the analysis results natively in the AppKit UI.
|
||||||
|
|
||||||
|
## Requirements
|
||||||
|
|
||||||
|
1. **Result UI**:
|
||||||
|
- Add a scrollable `NSTextView` (within an `NSScrollView`) below the image view.
|
||||||
|
- Initially empty or hidden.
|
||||||
|
|
||||||
|
2. **Workflow**:
|
||||||
|
- **Live Mode**: Camera active, Button says "Capture", Text view hidden/empty.
|
||||||
|
- **Processing Mode**: Live feed paused on the captured frame while a "Processing..." indication is shown (see Spec 002).
|
||||||
|
- **Result Mode**: Camera paused on captured frame, Button says "Scan Another", Text view shows description.
|
||||||
|
|
||||||
|
3. **Data Binding**:
|
||||||
|
- Update the `NSTextView` string with the OpenAI response.
|
||||||
|
- Clicking "Scan Another" resets the UI to **Live Mode**.
|
||||||
|
|
||||||
|
## Acceptance Criteria
|
||||||
|
|
||||||
|
- [ ] App cycles correctly: Capture -> Result -> Scan Another -> Capture.
|
||||||
|
- [ ] Result text is readable in a native macOS scroll view.
|
||||||
|
- [ ] Window resizing layout remains sane.
|
||||||
Reference in New Issue
Block a user