Skip to content

Commit

Permalink
legate-dataframe initial commit
Browse files Browse the repository at this point in the history
Co-authored-by: Mads R. B. Kristensen <[email protected]>
Co-authored-by: Sebastian Berg <[email protected]>
Co-authored-by: Ben Jarmak <[email protected]>
Co-authored-by: James Lamb <[email protected]>
Co-authored-by: Divye Gala <[email protected]>
Co-authored-by: James Lamb <[email protected]>
Co-authored-by: Sebastian Berg <[email protected]>
Co-authored-by: jakirkham <[email protected]>
  • Loading branch information
9 people committed Nov 22, 2024
0 parents commit 6334781
Show file tree
Hide file tree
Showing 183 changed files with 15,605 additions and 0 deletions.
11 changes: 11 additions & 0 deletions .dockerignore
Original file line number Diff line number Diff line change
@@ -0,0 +1,11 @@
cpp/build/
ci/manual-ci-test.py
Docker
python/_skbuild
python/*.egg-info
.pytest_cache
.mypy_cache
.git
.cache
.vscode
.ruff_cache
5 changes: 5 additions & 0 deletions .github/copy-pr-bot.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
# Copyright 2024 NVIDIA Corporation
# Configuration file for `copy-pr-bot` GitHub App
# https://docs.gha-runners.nvidia.com/apps/copy-pr-bot/

enabled: true
10 changes: 10 additions & 0 deletions .github/pull_request_template.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,10 @@
## Description
<!-- Provide a standalone description of changes in this PR. -->
<!-- Reference any issues closed by this PR with "closes #1234". -->
<!-- Read DEVELOPER_GUIDE.md. -->

## Checklist
- [ ] New or existing tests cover these changes.
- [ ] The documentation is up to date with these changes.
- [ ] Run `./build.sh test` for local testing, see [CONTRIBUTING.md](https://github.com/rapidsai/legate-dataframe/blob/main/CONTRIBUTING.md#testing).
- [ ] Ensure `pre-commit` checks are passing see [CONTRIBUTING.md](https://github.com/rapidsai/legate-dataframe/blob/main/CONTRIBUTING.md#Pre-commit-hooks).
43 changes: 43 additions & 0 deletions .github/workflows/build.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,43 @@
name: build

concurrency:
group: ci-on-${{ github.event_name }}-from-${{ github.ref_name }}
cancel-in-progress: true

on:
# run on pushes to certain branches
push:
branches:
- "main"
- "release/v[0-9][0-9].[0-9][0-9].[0-9][0-9]"
# run on pushes of any tags
tags:
- "*"
# run by clicking buttons in the GitHub Actions UI
workflow_dispatch:
inputs:
deploy-docs:
description: 'Update the docs site?'
required: true
type: boolean

jobs:
conda-python-build:
uses: ./.github/workflows/conda-python-build.yaml
with:
script: "ci/build_all.sh"
secrets: inherit
upload-conda:
needs:
- conda-python-build
uses: ./.github/workflows/conda-upload-packages.yaml
secrets: inherit
docs-build:
needs:
- conda-python-build
uses: ./.github/workflows/docs-build.yaml
with:
script: "ci/build_docs.sh"
# only deploy docs on tag pushes or when someone manually runs the workflow with "update docs" selected
deploy: ${{ (github.event_name == 'push' && startsWith(github.ref, 'refs/tags')) || (github.event_name == 'workflow_dispatch' && inputs.deploy-docs == true) }}
secrets: inherit
59 changes: 59 additions & 0 deletions .github/workflows/conda-python-build.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,59 @@
name: conda-python-build

concurrency:
group: conda-python-build-on-${{ github.event_name }}-from-${{ github.ref_name }}
cancel-in-progress: true

on:
# run only when called by other workflows
workflow_call:
inputs:
script:
required: true
type: string
description: "relative path to a script that builds conda packages"

env:
# CUDA architectures to build for
CUDAARCHS: "all-major"
# where conda-python-build puts files it creates
RAPIDS_CONDA_BLD_OUTPUT_DIR: /tmp/conda-bld-output


jobs:

build:
strategy:
fail-fast: false
# available legate-core and cunumeric packages:
#
# * https://anaconda.org/legate/legate-core
# * https://anaconda.org/legate/cunumeric
#
# Valid set of RAPIDS ci-conda image tags:
#
# * https://hub.docker.com/r/rapidsai/ci-conda/tags
matrix:
ARCH:
- "amd64"
CUDA_VER:
- "12.5.1"
PY_VER:
- "3.10"
- "3.11"
# - "3.12" requires update to RAPIDS 24.10
runs-on: linux-${{ matrix.ARCH }}-cpu4
container:
image: "rapidsai/ci-conda:cuda${{ matrix.CUDA_VER }}-ubuntu22.04-py${{ matrix.PY_VER }}"
steps:
- uses: actions/checkout@v4
with:
fetch-depth: 0
- name: build
run: "${{ inputs.script }}"
- name: upload
uses: actions/upload-artifact@v4
with:
name: legate-dataframe-conda-cuda${{ matrix.CUDA_VER }}-${{ matrix.ARCH }}-py${{ matrix.PY_VER }}
path: ${{ env.RAPIDS_CONDA_BLD_OUTPUT_DIR }}
if-no-files-found: error
37 changes: 37 additions & 0 deletions .github/workflows/conda-upload-packages.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
# adopted from https://github.com/rapidsai/shared-workflows/blob/branch-24.12/.github/workflows/conda-upload-packages.yaml
# with some notable differences:
#
# * assumes packages were uploaded to GitHub artifact store, not Amazon S3
# * always publishes to the same channel, but uses different label for non-release packages
#

on:
# run only when called by other workflows
workflow_call:

env:
# where jobs that download conda packages store the local channel
RAPIDS_LOCAL_CONDA_CHANNEL: /tmp/local-conda-packages

jobs:
upload:
runs-on: linux-amd64-cpu4
container:
image: rapidsai/ci-conda:latest
steps:
- uses: actions/checkout@v4
with:
fetch-depth: 0
- name: download conda packages
uses: actions/download-artifact@v4
with:
# omitting 'name' here means "download all artifacts from this run"... useful to
# avoid having to list the matrix of CUDA / Python versions here
path: ${{ env.RAPIDS_LOCAL_CONDA_CHANNEL }}
github-token: ${{ secrets.GITHUB_TOKEN }}
repository: ${{ github.repository }}
run-id: ${{ github.run_id }}
- name: Upload packages
run: "ci/upload-to-anaconda.sh"
env:
CONDA_LEGATE_TOKEN: ${{ secrets.CONDA_LEGATE_TOKEN }}
76 changes: 76 additions & 0 deletions .github/workflows/docs-build.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,76 @@
name: docs-build

concurrency:
group: docs-build-on-${{ github.event_name }}-from-${{ github.ref_name }}
cancel-in-progress: true

on:
# run only when called by other workflows
workflow_call:
inputs:
deploy:
required: true
type: boolean
default: false
description: "set to true to publish docs"
script:
required: true
type: string
description: "relative path to a script that builds conda packages"

env:
# where jobs that download conda packages store the local channel
RAPIDS_LOCAL_CONDA_CHANNEL: /tmp/local-conda-packages

jobs:

build:
strategy:
matrix:
include:
- ARCH: amd64
CUDA_VER: "12.5.1"
PY_VER: "3.11"
runs-on: linux-${{ matrix.ARCH }}-gpu-v100-latest-1
container:
image: "rapidsai/ci-conda:cuda${{ matrix.CUDA_VER }}-ubuntu22.04-py${{ matrix.PY_VER }}"
env:
NVIDIA_VISIBLE_DEVICES: ${{ env.NVIDIA_VISIBLE_DEVICES }}
steps:
- uses: actions/checkout@v4
with:
fetch-depth: 0
- name: download conda packages
uses: actions/download-artifact@v4
with:
name: legate-dataframe-conda-cuda${{ matrix.CUDA_VER }}-${{ matrix.ARCH }}-py${{ matrix.PY_VER }}
path: ${{ env.RAPIDS_LOCAL_CONDA_CHANNEL }}
github-token: ${{ secrets.GITHUB_TOKEN }}
repository: ${{ github.repository }}
run-id: ${{ github.run_id }}
- name: build docs
run: "${{ inputs.script }}"
- uses: actions/upload-pages-artifact@v3
with:
path: docs/build/html

deploy:
needs:
- build
if: inputs.deploy

# Grant GITHUB_TOKEN the permissions required to make a Pages deployment
permissions:
pages: write # to deploy to Pages
id-token: write # to verify the deployment originates from an appropriate source

# Deploy to the github-pages environment
environment:
name: github-pages
url: ${{ steps.deployment.outputs.page_url }}

runs-on: ubuntu-latest
steps:
- name: Deploy to GitHub Pages
id: deployment
uses: actions/deploy-pages@v4
87 changes: 87 additions & 0 deletions .github/workflows/pr.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,87 @@
name: pr

concurrency:
group: ci-on-${{ github.event_name }}-from-${{ github.ref_name }}
cancel-in-progress: true

on:
push:
branches:
- "pull-request/[0-9]+"

env:
# where jobs that download conda packages store the local channel
RAPIDS_LOCAL_CONDA_CHANNEL: /tmp/local-conda-packages

jobs:

# group together all jobs that must pass for a PR to be merged
# (for use by branch protections)
pr-builder:
needs:
- pre-commit
- conda-python-build
- conda-python-tests
uses: rapidsai/shared-workflows/.github/workflows/[email protected]

pre-commit:
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v4
- uses: pre-commit/[email protected]

conda-python-build:
needs:
- pre-commit
uses: ./.github/workflows/conda-python-build.yaml
with:
script: "ci/build_all.sh"
secrets: inherit

conda-python-tests:
needs:
- pre-commit
- conda-python-build
strategy:
fail-fast: false
# As of the last time this was updated, legate-core / cunumeric packages were published for only:
#
# * architectures: amd64 only
# * CUDA: >=12.2
# * Python: 3.10, 3.11, 3.12
#
# Valid set of RAPIDS ci-conda image tags: https://hub.docker.com/r/rapidsai/ci-conda/tags
matrix:
include:
- ARCH: "amd64"
CUDA_VER: "12.5.1"
PY_VER: "3.10"
runs-on: linux-${{ matrix.ARCH }}-gpu-v100-latest-1
container:
image: "rapidsai/ci-conda:cuda${{ matrix.CUDA_VER }}-ubuntu22.04-py${{ matrix.PY_VER }}"
env:
NVIDIA_VISIBLE_DEVICES: ${{ env.NVIDIA_VISIBLE_DEVICES }}
steps:
- uses: actions/checkout@v4
with:
fetch-depth: 0
- name: download conda packages
uses: actions/download-artifact@v4
with:
name: legate-dataframe-conda-cuda${{ matrix.CUDA_VER }}-${{ matrix.ARCH }}-py${{ matrix.PY_VER }}
path: ${{ env.RAPIDS_LOCAL_CONDA_CHANNEL }}
github-token: ${{ secrets.GITHUB_TOKEN }}
repository: ${{ github.repository }}
run-id: ${{ github.run_id }}
- name: test python and C++ interface
run: |
ci/test_all.sh
docs-build:
needs:
- conda-python-build
uses: ./.github/workflows/docs-build.yaml
with:
script: "ci/build_docs.sh"
deploy: false
secrets: inherit
17 changes: 17 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
@@ -0,0 +1,17 @@
*.*~
build
_skbuild
record.txt
*.so
dask-worker-space
__pycache__
.cache
*.egg-info
.vscode
legate_dataframe/install_info.py
cufile.log
docs/build/
cpp/doxygen/html/
.mypy_cache
.hypothesis
.ruff_cache
Loading

0 comments on commit 6334781

Please sign in to comment.