Patch summary: both LLM benchmark workflows stop running inside the privileged
spacetimedb-ci container on `spacetimedb-new-runner` and run directly on
`spacetimedb-new-runner-2`. The curl-based `spacetime` CLI install step is
removed; instead, after the llm-benchmark tool is built, a new step runs
`cargo ci smoketests prepare` and symlinks target/release/spacetimedb-cli to
$HOME/.local/bin/spacetime, then appends that directory to GITHUB_PATH.

diff --git a/.github/workflows/llm-benchmark-periodic.yml b/.github/workflows/llm-benchmark-periodic.yml
index f8b4c1fb179..40ad2c75fe4 100644
--- a/.github/workflows/llm-benchmark-periodic.yml
+++ b/.github/workflows/llm-benchmark-periodic.yml
@@ -29,19 +29,10 @@ concurrency:
 
 jobs:
   run-benchmarks:
-    runs-on: spacetimedb-new-runner
-    container:
-      image: localhost:5000/spacetimedb-ci:latest
-      options: >-
-        --privileged
+    runs-on: spacetimedb-new-runner-2
     timeout-minutes: 180
 
     steps:
-      - name: Install spacetime CLI
-        run: |
-          curl -sSf https://install.spacetimedb.com | sh -s -- -y
-          echo "$HOME/.local/bin" >> $GITHUB_PATH
-
       - name: Checkout master
         uses: actions/checkout@v4
         with:
@@ -75,6 +66,13 @@ jobs:
       - name: Build llm-benchmark tool
         run: cargo install --path tools/xtask-llm-benchmark --locked
 
+      - name: Build SpacetimeDB server for benchmark harness
+        run: |
+          cargo ci smoketests prepare
+          mkdir -p "$HOME/.local/bin"
+          ln -sf "$GITHUB_WORKSPACE/target/release/spacetimedb-cli" "$HOME/.local/bin/spacetime"
+          echo "$HOME/.local/bin" >> "$GITHUB_PATH"
+
       - name: Run benchmarks
         env:
           OPENROUTER_API_KEY: ${{ secrets.OPENROUTER_API_KEY }}
diff --git a/.github/workflows/llm-benchmark-validate-goldens.yml b/.github/workflows/llm-benchmark-validate-goldens.yml
index f9d634c50ea..17384a654e3 100644
--- a/.github/workflows/llm-benchmark-validate-goldens.yml
+++ b/.github/workflows/llm-benchmark-validate-goldens.yml
@@ -15,11 +15,7 @@ concurrency:
 
 jobs:
   validate-goldens:
-    runs-on: spacetimedb-new-runner
-    container:
-      image: localhost:5000/spacetimedb-ci:latest
-      options: >-
-        --privileged
+    runs-on: spacetimedb-new-runner-2
     timeout-minutes: 60
 
     strategy:
@@ -28,11 +24,6 @@ jobs:
         lang: [rust, csharp, typescript]
 
     steps:
-      - name: Install spacetime CLI
-        run: |
-          curl -sSf https://install.spacetimedb.com | sh -s -- -y
-          echo "$HOME/.local/bin" >> $GITHUB_PATH
-
       - name: Checkout master
         uses: actions/checkout@v4
         with:
@@ -70,6 +61,13 @@ jobs:
       - name: Build llm-benchmark tool
         run: cargo install --path tools/xtask-llm-benchmark --locked
 
+      - name: Build SpacetimeDB server for benchmark harness
+        run: |
+          cargo ci smoketests prepare
+          mkdir -p "$HOME/.local/bin"
+          ln -sf "$GITHUB_WORKSPACE/target/release/spacetimedb-cli" "$HOME/.local/bin/spacetime"
+          echo "$HOME/.local/bin" >> "$GITHUB_PATH"
+
       - name: Validate golden answers (${{ matrix.lang }})
         env:
           MSBUILDDISABLENODEREUSE: "1"