# Generate TPC-H files to S3 #20

# Generates the TPC-H benchmark files (Parquet and Vortex formats) and
# publishes them to S3. Runs on manual dispatch and on a daily schedule.
name: "Generate TPC-H files to S3"
on:
  workflow_dispatch: {}
  schedule:
    # 5AM UTC
    - cron: "0 5 * * *"
# All runs of this workflow share one concurrency group, so a scheduled run and
# a manual run never write to the bucket at the same time.
concurrency:
  group: ${{ github.workflow }}
permissions:
  actions: write
  # Declaring any permission sets every unlisted one to `none`, so the checkout
  # step needs an explicit read grant on repository contents.
  contents: read
  # Needed to request the OIDC token that configure-aws-credentials exchanges
  # for the assumed role's credentials.
  id-token: write
jobs:
  generate_files:
    name: Generate S3 TPCH files
    # Runner labels; presumably resolved by the RunsOn self-hosted runner
    # service (instance family, image, spot setting) - confirm with infra.
    runs-on:
      - runs-on=${{ github.run_id }}
      - family=m7i.2xlarge
      - image=ubuntu24-full-x64
      - spot=false
    steps:
      - uses: actions/checkout@v4
      - name: Setup AWS CLI
        uses: aws-actions/configure-aws-credentials@v4
        with:
          role-to-assume: arn:aws:iam::375504701696:role/GitHubBenchmarkRole
          # NOTE(review): the target bucket name ends in "-eu"; confirm that
          # us-east-1 is the intended region for these S3 calls.
          aws-region: us-east-1
      - name: Generate files locally
        shell: bash
        run: |
          # We run each query once to make sure we don't upload a file if there's a bug that causes a panic.
          cargo run --release --bin tpch -- --formats parquet,vortex -i1
          # Upload with a single sync instead of "rm" followed by "cp": the prefix is
          # never left empty while the upload is in flight or if the upload fails.
          # --delete still removes remote objects that no longer exist locally.
          aws s3 sync --delete bench-vortex/data/tpch/1 s3://vortex-bench-dev-eu/tpch-sf1/