# Run evals periodically #10226
# Workflow file for this run

# Copyright 2025 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Generated by dev/tasks/generate-github-actions
name: Run evals periodically

# Triggers: a recurring schedule plus an on-demand run from the GitHub UI.
on:
  schedule:
    # Run every 15 minutes
    - cron: "*/15 * * * *"
  # This allows you to manually trigger the workflow from the GitHub UI
  workflow_dispatch:
    inputs:
      # Optional free-text note recorded with a manual run.
      reason:
        description: "Reason for manual trigger"
        required: false
        default: "Manual run via UI"
jobs:
  run-eval:
    # Skip the job unless it runs in the upstream repository (e.g. not in forks).
    if: github.repository == 'GoogleCloudPlatform/kubectl-ai'
    runs-on: ubuntu-latest
    timeout-minutes: 15
    # Restrict the job token: read-only repository contents, plus
    # "id-token: write" so the job may request an OIDC token
    # (presumably for cloud authentication inside run-evals.sh -- confirm).
    permissions:
      contents: "read"
      id-token: "write"
    steps:
      - uses: actions/checkout@v4
      # Local composite action from this repository; creates the cluster the
      # eval runs against.
      - name: Kind Cluster Setup
        uses: ./.github/actions/kind-cluster-setup
        with:
          cluster_name: periodic-eval-cluster
      # TEST_ARGS is passed to the script through its environment.
      - name: Run an easy eval
        run: |
          TEST_ARGS="--llm-provider vertexai --models gemini-2.5-pro --concurrency=1 --task-pattern=scale-" ./dev/ci/periodics/run-evals.sh
      # Append the generated report to the run's summary page. Paths are
      # quoted and taken from runner-provided environment variables rather
      # than interpolated into the script text.
      - name: Analyse results
        run: |
          ./dev/ci/periodics/analyze-evals.sh
          cat "${GITHUB_WORKSPACE}/.build/k8s-bench.md" >> "${GITHUB_STEP_SUMMARY}"
# Allow only one active run per workflow and ref. A newer run waits for the
# one in progress instead of cancelling it.
concurrency:
  group: ${{ github.workflow }}-${{ github.head_ref || github.ref }}
  cancel-in-progress: false