# Add blocksize to DocumentDataset.read_* that uses dask_cudf.read_* (#1479)
# Workflow file for this run
# This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
# Learn more about bidirectional Unicode characters
# CI workflow: installs the package on a fresh runner and runs the pytest
# suite for every combination in the job matrix.
name: Test Python package

# Triggers: pushes to main, every pull request, and manual runs.
on:
  push:
    branches:
      - main
  pull_request:
  workflow_dispatch:

# When this workflow is queued, automatically cancel any previous running
# or pending jobs from the same branch
concurrency:
  group: test-${{ github.ref }}
  cancel-in-progress: true

jobs:
  build_and_test:
    runs-on: ${{ matrix.os }}
    strategy:
      # Let the remaining matrix entries finish even if one of them fails.
      fail-fast: false
      matrix:
        os: [ubuntu-latest]
        # Quoted so the version stays the string "3.10" rather than being
        # parsed as the float 3.1.
        python-version: ["3.10"]
    steps:
      - uses: actions/checkout@v4
      # Deletes large preinstalled toolchains from the runner before the
      # install step.
      - name: Optionally free up space on Ubuntu
        run: |
          sudo rm -rf /usr/share/dotnet
          sudo rm -rf /opt/ghc
          sudo rm -rf "/usr/local/share/boost"
          sudo rm -rf "$AGENT_TOOLSDIRECTORY"
      - name: Set up Python ${{ matrix.python-version }}
        uses: actions/setup-python@v5
        with:
          python-version: ${{ matrix.python-version }}
      - name: Install NeMo-Curator and pytest
        # TODO: Remove pytest when optional test dependencies are added to setup.py
        # Installing wheel beforehand due to fasttext issue:
        # https://github.com/facebookresearch/fastText/issues/512#issuecomment-1837367666
        run: |
          pip install wheel
          pip install --no-cache-dir .
          pip install pytest
      - name: Run tests
        # NOTE(review): `--cpu` is not a built-in pytest flag; presumably a
        # project-defined option selecting CPU-only tests. Confirm in conftest.
        run: |
          python -m pytest -v --cpu