|
@@ -7,6 +7,8 @@
|
|
|
# Usage: run-all.sh <repo-path> "<question>" [headless|tmux|all]
|
|
# Usage: run-all.sh <repo-path> "<question>" [headless|tmux|all]
|
|
|
# Env: CG_BIN codegraph binary (default: command -v codegraph)
|
|
# Env: CG_BIN codegraph binary (default: command -v codegraph)
|
|
|
# AGENT_EVAL_OUT output dir (default: /tmp/agent-eval)
|
|
# AGENT_EVAL_OUT output dir (default: /tmp/agent-eval)
|
|
|
|
|
+# MODEL / EFFORT claude model/effort (default: sonnet / high — the
|
|
|
|
|
+# standing A/B policy; see CLAUDE.md, don't raise)
|
|
|
set -uo pipefail
|
|
set -uo pipefail
|
|
|
|
|
|
|
|
REPO="${1:?usage: run-all.sh <repo-path> \"<question>\" [headless|tmux|all]}"
|
|
REPO="${1:?usage: run-all.sh <repo-path> \"<question>\" [headless|tmux|all]}"
|
|
@@ -39,7 +41,7 @@ headless() {
|
|
|
( cd "$REPO" && claude -p "$Q" \
|
|
( cd "$REPO" && claude -p "$Q" \
|
|
|
--output-format stream-json --verbose \
|
|
--output-format stream-json --verbose \
|
|
|
--permission-mode bypassPermissions \
|
|
--permission-mode bypassPermissions \
|
|
|
- --model opus \
|
|
|
|
|
|
|
+ --model "${MODEL:-sonnet}" --effort "${EFFORT:-high}" \
|
|
|
--max-budget-usd 4 \
|
|
--max-budget-usd 4 \
|
|
|
--strict-mcp-config --mcp-config "$cfg" \
|
|
--strict-mcp-config --mcp-config "$cfg" \
|
|
|
> "$OUT/run-$label.jsonl" 2>"$OUT/run-$label.err" )
|
|
> "$OUT/run-$label.jsonl" 2>"$OUT/run-$label.err" )
|
|
@@ -56,11 +58,11 @@ fi
|
|
|
|
|
|
|
|
if [ "$MODE" = tmux ] || [ "$MODE" = all ]; then
|
|
if [ "$MODE" = tmux ] || [ "$MODE" = all ]; then
|
|
|
echo "############################## INTERACTIVE [with] ##############################"
|
|
echo "############################## INTERACTIVE [with] ##############################"
|
|
|
- CLAUDE_EXTRA_ARGS="--model opus --strict-mcp-config --mcp-config $OUT/mcp-codegraph.json" \
|
|
|
|
|
|
|
+ CLAUDE_EXTRA_ARGS="--model ${MODEL:-sonnet} --effort ${EFFORT:-high} --strict-mcp-config --mcp-config $OUT/mcp-codegraph.json" \
|
|
|
bash "$HARNESS/itrun.sh" "$REPO" "int-with" "$Q" 2>&1 || echo "[itrun WITH failed]"
|
|
bash "$HARNESS/itrun.sh" "$REPO" "int-with" "$Q" 2>&1 || echo "[itrun WITH failed]"
|
|
|
echo
|
|
echo
|
|
|
echo "############################## INTERACTIVE [without] ##############################"
|
|
echo "############################## INTERACTIVE [without] ##############################"
|
|
|
- CLAUDE_EXTRA_ARGS="--model opus --strict-mcp-config --mcp-config $OUT/mcp-empty.json" \
|
|
|
|
|
|
|
+ CLAUDE_EXTRA_ARGS="--model ${MODEL:-sonnet} --effort ${EFFORT:-high} --strict-mcp-config --mcp-config $OUT/mcp-empty.json" \
|
|
|
bash "$HARNESS/itrun.sh" "$REPO" "int-without" "$Q" 2>&1 || echo "[itrun WITHOUT failed]"
|
|
bash "$HARNESS/itrun.sh" "$REPO" "int-without" "$Q" 2>&1 || echo "[itrun WITHOUT failed]"
|
|
|
echo
|
|
echo
|
|
|
fi
|
|
fi
|