diff --git a/.github/workflows/run_agent_evals.yml b/.github/workflows/run_agent_evals.yml index 1a875aa2c463d264002f14264993b9c99ae1f49c..034a69c276d7b11325dcc4493b25d3c61d3f6455 100644 --- a/.github/workflows/run_agent_evals.yml +++ b/.github/workflows/run_agent_evals.yml @@ -6,6 +6,9 @@ env: CARGO_INCREMENTAL: '0' RUST_BACKTRACE: '1' ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }} + OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }} + GOOGLE_API_KEY: ${{ secrets.GOOGLE_API_KEY }} + GOOGLE_CLOUD_PROJECT: ${{ secrets.GOOGLE_CLOUD_PROJECT }} ZED_CLIENT_CHECKSUM_SEED: ${{ secrets.ZED_CLIENT_CHECKSUM_SEED }} ZED_EVAL_TELEMETRY: '1' MODEL_NAME: ${{ inputs.model_name }} diff --git a/crates/eval/src/eval.rs b/crates/eval/src/eval.rs index d04dad8e99961480ce5f08328fa97aeabf5eda10..3166a7321782069153deb74b90e6b5b71fc99e06 100644 --- a/crates/eval/src/eval.rs +++ b/crates/eval/src/eval.rs @@ -463,8 +463,8 @@ pub fn find_model( .ok_or_else(|| { anyhow::anyhow!( "No language model with ID {}/{} was available. Available models: {}", - selected.model.0, selected.provider.0, + selected.model.0, model_registry .available_models(cx) .map(|model| format!("{}/{}", model.provider_id().0, model.id().0)) diff --git a/tooling/xtask/src/tasks/workflows/run_agent_evals.rs b/tooling/xtask/src/tasks/workflows/run_agent_evals.rs index 4601d5a5bf6a60435a87edab9cd6d62b77ef52a8..341ca1d4a517489bc9248a0d52e39f75e8da7074 100644 --- a/tooling/xtask/src/tasks/workflows/run_agent_evals.rs +++ b/tooling/xtask/src/tasks/workflows/run_agent_evals.rs @@ -19,6 +19,9 @@ pub(crate) fn run_agent_evals() -> Workflow { .add_env(("CARGO_INCREMENTAL", 0)) .add_env(("RUST_BACKTRACE", 1)) .add_env(("ANTHROPIC_API_KEY", vars::ANTHROPIC_API_KEY)) + .add_env(("OPENAI_API_KEY", vars::OPENAI_API_KEY)) + .add_env(("GOOGLE_API_KEY", vars::GOOGLE_API_KEY)) + .add_env(("GOOGLE_CLOUD_PROJECT", vars::GOOGLE_CLOUD_PROJECT)) .add_env(("ZED_CLIENT_CHECKSUM_SEED", vars::ZED_CLIENT_CHECKSUM_SEED)) .add_env(("ZED_EVAL_TELEMETRY", 1)) .add_env(("MODEL_NAME", model_name.to_string())) diff --git a/tooling/xtask/src/tasks/workflows/vars.rs b/tooling/xtask/src/tasks/workflows/vars.rs index 51f6383b1eddafd2a723e31ea23247b90b3a955c..58f2ba7b63aabcff80fb2c1073da892da2e7b25f 100644 --- a/tooling/xtask/src/tasks/workflows/vars.rs +++ b/tooling/xtask/src/tasks/workflows/vars.rs @@ -17,6 +17,9 @@ macro_rules! var { } secret!(ANTHROPIC_API_KEY); +secret!(OPENAI_API_KEY); +secret!(GOOGLE_API_KEY); +secret!(GOOGLE_CLOUD_PROJECT); secret!(APPLE_NOTARIZATION_ISSUER_ID); secret!(APPLE_NOTARIZATION_KEY); secret!(APPLE_NOTARIZATION_KEY_ID);