Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
18 changes: 8 additions & 10 deletions .github/workflows/llm-benchmark-periodic.yml
Original file line number Diff line number Diff line change
Expand Up @@ -29,19 +29,10 @@ concurrency:

jobs:
run-benchmarks:
runs-on: spacetimedb-new-runner
container:
image: localhost:5000/spacetimedb-ci:latest
options: >-
--privileged
runs-on: spacetimedb-new-runner-2
timeout-minutes: 180

steps:
- name: Install spacetime CLI
run: |
curl -sSf https://install.spacetimedb.com | sh -s -- -y
echo "$HOME/.local/bin" >> $GITHUB_PATH

- name: Checkout master
uses: actions/checkout@v4
with:
Expand Down Expand Up @@ -75,6 +66,13 @@ jobs:
- name: Build llm-benchmark tool
run: cargo install --path tools/xtask-llm-benchmark --locked

- name: Build SpacetimeDB server for benchmark harness
run: |
cargo ci smoketests prepare
mkdir -p "$HOME/.local/bin"
ln -sf "$GITHUB_WORKSPACE/target/release/spacetimedb-cli" "$HOME/.local/bin/spacetime"
echo "$HOME/.local/bin" >> "$GITHUB_PATH"

- name: Run benchmarks
env:
OPENROUTER_API_KEY: ${{ secrets.OPENROUTER_API_KEY }}
Expand Down
18 changes: 8 additions & 10 deletions .github/workflows/llm-benchmark-validate-goldens.yml
Original file line number Diff line number Diff line change
Expand Up @@ -15,11 +15,7 @@ concurrency:

jobs:
validate-goldens:
runs-on: spacetimedb-new-runner
container:
image: localhost:5000/spacetimedb-ci:latest
options: >-
--privileged
runs-on: spacetimedb-new-runner-2
timeout-minutes: 60

strategy:
Expand All @@ -28,11 +24,6 @@ jobs:
lang: [rust, csharp, typescript]

steps:
- name: Install spacetime CLI
run: |
curl -sSf https://install.spacetimedb.com | sh -s -- -y
echo "$HOME/.local/bin" >> $GITHUB_PATH

- name: Checkout master
uses: actions/checkout@v4
with:
Expand Down Expand Up @@ -70,6 +61,13 @@ jobs:
- name: Build llm-benchmark tool
run: cargo install --path tools/xtask-llm-benchmark --locked

- name: Build SpacetimeDB server for benchmark harness
run: |
cargo ci smoketests prepare
mkdir -p "$HOME/.local/bin"
ln -sf "$GITHUB_WORKSPACE/target/release/spacetimedb-cli" "$HOME/.local/bin/spacetime"
echo "$HOME/.local/bin" >> "$GITHUB_PATH"

- name: Validate golden answers (${{ matrix.lang }})
env:
MSBUILDDISABLENODEREUSE: "1"
Expand Down
Loading