mirror of
https://github.com/browseros-ai/BrowserOS.git
synced 2026-05-18 11:06:19 +00:00
* feat(eval): add suite variant config bridge * feat(eval): add stable run artifacts * refactor(eval): add shared grader contract * feat(eval): persist grader artifacts * refactor(eval): rename runner layers * refactor(eval): add executor backend boundary * refactor(eval): split clado backend * feat(eval): add workflow compatible cli * feat(eval): add r2 publisher module * ci(eval): migrate weekly workflow to eval cli * docs(eval): document suite pipeline * chore(eval): verify pipeline refactor * fix: address review feedback for PR #875 * docs(eval): add env example * docs(eval): explain suites and variants * chore(eval): organize config layouts * chore(eval): colocate grader python evaluators
52 lines
1.2 KiB
Plaintext
Vendored
52 lines
1.2 KiB
Plaintext
Vendored
# Copy this file to .env.development and fill in the values needed for local eval runs.
|
|
|
|
# Provider keys used by existing config files.
|
|
OPENROUTER_API_KEY=
|
|
FIREWORKS_API_KEY=
|
|
ANTHROPIC_API_KEY=
|
|
OPENAI_API_KEY=
|
|
GOOGLE_GENERATIVE_AI_API_KEY=
|
|
|
|
# Claude Agent SDK token used by performance_grader.
|
|
CLAUDE_CODE_OAUTH_TOKEN=
|
|
|
|
# Suite-mode model selection.
|
|
EVAL_VARIANT=local
|
|
EVAL_AGENT_PROVIDER=openai-compatible
|
|
EVAL_AGENT_MODEL=
|
|
EVAL_AGENT_API_KEY=
|
|
EVAL_AGENT_BASE_URL=
|
|
EVAL_AGENT_SUPPORTS_IMAGES=true
|
|
|
|
# Optional suite-mode executor override for orchestrator suites.
|
|
EVAL_EXECUTOR_MODEL=
|
|
EVAL_EXECUTOR_API_KEY=
|
|
EVAL_EXECUTOR_BASE_URL=
|
|
|
|
# Clado visual action executor.
|
|
CLADO_ACTION_MODEL=
|
|
CLADO_ACTION_API_KEY=
|
|
CLADO_ACTION_BASE_URL=
|
|
# Backward-compatible alias (presumably for CLADO_ACTION_BASE_URL; confirm) used by older local scripts.
|
|
CLADO_ACTION_URL=
|
|
|
|
# BrowserOS runner. The BROWSEROS_BINARY value below is the macOS app-bundle path; adjust it on other platforms.
|
|
BROWSEROS_BINARY=/Applications/BrowserOS.app/Contents/MacOS/BrowserOS
|
|
BROWSEROS_SERVER_URL=http://127.0.0.1:9110
|
|
BROWSEROS_SERVER_LOG_DIR=/tmp/browseros-server-logs
|
|
BROWSEROS_CONFIG_URL=
|
|
|
|
# Captcha solver extension.
|
|
NOPECHA_API_KEY=
|
|
|
|
# WebArena-Infinity.
|
|
WEBARENA_INFINITY_DIR=
|
|
INFINITY_APP_URL=
|
|
|
|
# R2 publishing and weekly report.
|
|
EVAL_R2_ACCOUNT_ID=
|
|
EVAL_R2_ACCESS_KEY_ID=
|
|
EVAL_R2_SECRET_ACCESS_KEY=
|
|
EVAL_R2_BUCKET=browseros-eval
|
|
EVAL_R2_CDN_BASE_URL=https://eval.browseros.com
|