mirror of https://github.com/garrytan/gstack.git
simplify: one command for evals — bun run test:evals
Remove test:eval, test:e2e, test:all. Just two commands:
- bun test (free)
- bun run test:evals (everything that costs money)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
parent
b5b2a15ad2
commit
942df42161
|
|
@@ -5,10 +5,7 @@
|
||||||
```bash
|
```bash
|
||||||
bun install # install dependencies
|
bun install # install dependencies
|
||||||
bun test # run free tests (browse + snapshot + skill validation)
|
bun test # run free tests (browse + snapshot + skill validation)
|
||||||
bun run test:evals # run ALL paid evals: LLM judge + Agent SDK E2E (~$4/run)
|
bun run test:evals # run paid evals: LLM judge + Agent SDK E2E (~$4/run)
|
||||||
bun run test:eval # run LLM-as-judge evals only (~$0.15/run)
|
|
||||||
bun run test:e2e # run Agent SDK E2E tests only (~$3.85/run)
|
|
||||||
bun run test:all # free tests + all evals
|
|
||||||
bun run dev <cmd> # run CLI in dev mode, e.g. bun run dev goto https://example.com
|
bun run dev <cmd> # run CLI in dev mode, e.g. bun run dev goto https://example.com
|
||||||
bun run build # gen docs + compile binaries
|
bun run build # gen docs + compile binaries
|
||||||
bun run gen:skill-docs # regenerate SKILL.md files from templates
|
bun run gen:skill-docs # regenerate SKILL.md files from templates
|
||||||
|
|
@@ -16,8 +13,8 @@ bun run skill:check # health dashboard for all skills
|
||||||
bun run dev:skill # watch mode: auto-regen + validate on change
|
bun run dev:skill # watch mode: auto-regen + validate on change
|
||||||
```
|
```
|
||||||
|
|
||||||
All eval commands require `ANTHROPIC_API_KEY` in your environment. E2E tests must
|
`test:evals` requires `ANTHROPIC_API_KEY` and must be run from a plain terminal
|
||||||
be run from a plain terminal (not inside Claude Code — nested sessions hang).
|
(not inside Claude Code — nested Agent SDK sessions hang).
|
||||||
|
|
||||||
## Project structure
|
## Project structure
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@@ -14,9 +14,6 @@
|
||||||
"server": "bun run browse/src/server.ts",
|
"server": "bun run browse/src/server.ts",
|
||||||
"test": "bun test browse/test/ test/ --ignore test/skill-e2e.test.ts --ignore test/skill-llm-eval.test.ts",
|
"test": "bun test browse/test/ test/ --ignore test/skill-e2e.test.ts --ignore test/skill-llm-eval.test.ts",
|
||||||
"test:evals": "EVALS=1 bun test test/skill-llm-eval.test.ts test/skill-e2e.test.ts",
|
"test:evals": "EVALS=1 bun test test/skill-llm-eval.test.ts test/skill-e2e.test.ts",
|
||||||
"test:eval": "EVALS=1 bun test test/skill-llm-eval.test.ts",
|
|
||||||
"test:e2e": "EVALS=1 bun test test/skill-e2e.test.ts",
|
|
||||||
"test:all": "bun test browse/test/ test/ --ignore test/skill-e2e.test.ts --ignore test/skill-llm-eval.test.ts && EVALS=1 bun test test/skill-e2e.test.ts test/skill-llm-eval.test.ts",
|
|
||||||
"skill:check": "bun run scripts/skill-check.ts",
|
"skill:check": "bun run scripts/skill-check.ts",
|
||||||
"dev:skill": "bun run scripts/dev-skill.ts",
|
"dev:skill": "bun run scripts/dev-skill.ts",
|
||||||
"start": "bun run browse/src/server.ts"
|
"start": "bun run browse/src/server.ts"
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue