Skip to content

Commit

Permalink
Merge pull request #106 from Tmonster/robust-data-generation
Browse files — browse the repository at this point in the history
Cleaner Data Generation
  • Loading branch information
samansmink authored Feb 20, 2025
2 parents 906e91e + 354a3ab commit 15a1e37
Show file tree
Hide file tree
Showing 225 changed files with 702 additions and 6,327 deletions.
16 changes: 12 additions & 4 deletions .github/workflows/Rest.yml
Original file line number Diff line number Diff line change
Expand Up @@ -39,6 +39,10 @@ jobs:
with:
vcpkgGitCommitId: 5e5d0e1cd7785623065e77eff011afdeec1a3574

- name: Setup Ccache
uses: hendrikmuhs/ccache-action@main
continue-on-error: true

- name: Build extension
env:
GEN: ninja
Expand All @@ -47,12 +51,16 @@ jobs:
make release
- name: Start Rest Catalog
working-directory: scripts/
run: |
./start-rest-catalog.sh
make start-rest-catalog
- name: Generate data
run: |
make data
- name: Test With rest catalog
- name: Test with rest catalog
env:
ICEBERG_SERVER_AVAILABLE: 1
DUCKDB_ICEBERG_HAVE_GENERATED_DATA: 1
run: |
make test_release
make test_release
4 changes: 4 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -12,3 +12,7 @@ data/iceberg/generated_*
scripts/metastore_db/
scripts/derby.log
scripts/test-script-with-path.sql
scripts/data_generators/__pycache__/
scripts/data_generators/*/__pycache__/
scripts/data_generators/*/*/*.parquet
data/generated/*
17 changes: 11 additions & 6 deletions Makefile
Original file line number Diff line number Diff line change
Expand Up @@ -5,18 +5,23 @@ EXT_NAME=iceberg
EXT_CONFIG=${PROJ_DIR}extension_config.cmake

# We need this for testing
CORE_EXTENSIONS='httpfs'
CORE_EXTENSIONS='parquet;httpfs'

# Include the Makefile from extension-ci-tools
include extension-ci-tools/makefiles/duckdb_extension.Makefile

start-rest-catalog: install_requirements
./scripts/start-rest-catalog.sh

install_requirements:
python3 -m pip install -r scripts/requirements.txt

# Custom makefile targets
data: data_clean
python3 scripts/test_data_generator/generate_iceberg.py 0.001 data/iceberg/generated_spec1_0_001 1
python3 scripts/test_data_generator/generate_iceberg.py 0.001 data/iceberg/generated_spec2_0_001 2
data: data_clean start-rest-catalog
python3 scripts/data_generators/generate_data.py

data_large: data data_clean
python3 scripts/test_data_generator/generate_iceberg.py 1 data/iceberg/generated_spec2_1 2
python3 scripts/data_generators/generate_data.py

data_clean:
rm -rf data/iceberg/generated_*
rm -rf data/generated

This file was deleted.

Binary file not shown.
Binary file not shown.
Binary file not shown.

This file was deleted.

Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.

This file was deleted.

Loading

0 comments on commit 15a1e37

Please sign in to comment.