Skip to content

Continuous Benchmark Hnsw Indexing #242

Continuous Benchmark Hnsw Indexing

Continuous Benchmark Hnsw Indexing #242

name: Continuous Benchmark Hnsw Indexing
on:
workflow_dispatch:
inputs:
dataset_name:
description: 'First dataset name for transform benchmark'
required: false
type: choice
options:
- 'cohere-wiki-100k-no-filters'
- 'laion-small-clip-no-filters-1'
dataset_2_name:
description: 'Second dataset name for transform benchmark'
required: false
type: choice
options:
- 'cohere-wiki-100k-no-filters-2'
- 'laion-small-clip-no-filters-2'
schedule:
# Run every day at 3am
- cron: "0 3 * * *"
# Restrict to only running this workflow one at a time.
# Any new runs will be queued until the previous run is complete.
# Any existing pending runs will be cancelled and replaced with current run.
concurrency:
group: continuous-benchmark
jobs:
runUpdateHealingBenchmark:
runs-on: ubuntu-latest
container: alpine/ansible:2.18.1
steps:
- uses: actions/checkout@v3
- uses: webfactory/[email protected]
with:
ssh-private-key: ${{ secrets.SSH_PRIVATE_KEY }}
- name: Create inventory
uses: ./.github/workflows/actions/create-inventory
with:
hcloud_token: ${{ secrets.HCLOUD_TOKEN }}
db_host: ${{ secrets.POSTGRES_HOST }}
server_name: "benchmark-server-1"
- name: Run bench
id: hnsw-indexing-update
run: |
cd ansible/playbooks && ansible-playbook playbook-hnsw-index.yml --extra-vars "
bench=update
dataset_name=dbpedia-openai-100K-1536-angular
"
runTransformHealingBenchmark:
runs-on: ubuntu-latest
container: alpine/ansible:2.18.1
needs: runUpdateHealingBenchmark
steps:
- uses: actions/checkout@v3
- uses: webfactory/[email protected]
with:
ssh-private-key: ${{ secrets.SSH_PRIVATE_KEY }}
- name: Create inventory
uses: ./.github/workflows/actions/create-inventory
with:
hcloud_token: ${{ secrets.HCLOUD_TOKEN }}
db_host: ${{ secrets.POSTGRES_HOST }}
server_name: "benchmark-server-1"
- name: Run bench
id: hnsw-indexing-transform
run: |
cd ansible/playbooks && ansible-playbook playbook-hnsw-index.yml --extra-vars "
bench=transform
dataset_name=${{ inputs.dataset_name || 'laion-small-clip-no-filters-1' }}
dataset_2_name=${{ inputs.dataset_2_name || 'laion-small-clip-no-filters-2' }}
"