Skip to content

Implement oneTBB-based parallelism for C lib #1224

Implement oneTBB-based parallelism for C lib

Implement oneTBB-based parallelism for C lib #1224

Workflow file for this run

name: tests
on:
push:
branches:
- "*"
# not on tags
pull_request:
env:
BLAKE3_CI: "1"
RUSTFLAGS: "-D warnings"
RUST_BACKTRACE: "1"
jobs:
library_tests:
name: ${{ matrix.target.name }} ${{ matrix.channel }}
runs-on: ${{ matrix.target.os }}
strategy:
fail-fast: false
matrix:
target: [
{ "os": "ubuntu-latest", "toolchain": "x86_64-unknown-linux-gnu", "name": "Linux GNU" },
{ "os": "macOS-latest", "toolchain": "x86_64-apple-darwin", "name": "macOS" },
{ "os": "windows-latest", "toolchain": "x86_64-pc-windows-msvc", "name": "Windows MSVC" },
{ "os": "windows-latest", "toolchain": "x86_64-pc-windows-gnu", "name": "Windows GNU" }
]
channel: [
"stable",
"beta",
"nightly",
# The current MSRV. This crate doesn't have an official MSRV policy,
# but in practice we'll probably do what libc does:
# https://github.com/rust-lang/libs-team/issues/72.
# This test target is here so that we notice if we accidentally bump
# the MSRV, but it's not a promise that we won't bump it.
"1.70.0",
]
steps:
- uses: actions/checkout@v4
- uses: dtolnay/rust-toolchain@master
with:
toolchain: ${{ format('{0}-{1}', matrix.channel, matrix.target.toolchain) }}
# Print the compiler version, for debugging.
- name: print compiler version
run: cargo run --quiet
working-directory: ./tools/compiler_version
# Print out instruction set support, for debugging.
- name: print instruction set support
run: cargo run --quiet
working-directory: ./tools/instruction_set_support
# Default tests plus Rayon and trait implementations.
- run: cargo test --features=rayon,traits-preview,serde,zeroize
# Same but with only one thread in the Rayon pool. This can find deadlocks.
- name: "again with RAYON_NUM_THREADS=1"
run: cargo test --features=rayon,traits-preview,serde,zeroize
env:
RAYON_NUM_THREADS: 1
# The mmap feature by itself (update_mmap_rayon is omitted).
- run: cargo test --features=mmap
# All public features put together.
- run: cargo test --features=mmap,rayon,traits-preview,serde,zeroize
# no_std tests.
- run: cargo test --no-default-features
# A matrix of different test settings:
# - debug vs release
# - assembly vs Rust+C intrinsics vs pure Rust intrinsics
# - different levels of SIMD support
#
# Full SIMD support.
- run: cargo test --features=
- run: cargo test --features=prefer_intrinsics
- run: cargo test --features=pure
- run: cargo test --features= --release
- run: cargo test --features=prefer_intrinsics --release
- run: cargo test --features=pure --release
# No AVX-512.
- run: cargo test --features=no_avx512
- run: cargo test --features=no_avx512,prefer_intrinsics
- run: cargo test --features=no_avx512,pure
- run: cargo test --features=no_avx512 --release
- run: cargo test --features=no_avx512,prefer_intrinsics --release
- run: cargo test --features=no_avx512,pure --release
# No AVX2.
- run: cargo test --features=no_avx512,no_avx2
- run: cargo test --features=no_avx512,no_avx2,prefer_intrinsics
- run: cargo test --features=no_avx512,no_avx2,pure
- run: cargo test --features=no_avx512,no_avx2 --release
- run: cargo test --features=no_avx512,no_avx2,prefer_intrinsics --release
- run: cargo test --features=no_avx512,no_avx2,pure --release
# No SSE4.1
- run: cargo test --features=no_avx512,no_avx2,no_sse41
- run: cargo test --features=no_avx512,no_avx2,no_sse41,prefer_intrinsics
- run: cargo test --features=no_avx512,no_avx2,no_sse41,pure
- run: cargo test --features=no_avx512,no_avx2,no_sse41 --release
- run: cargo test --features=no_avx512,no_avx2,no_sse41,prefer_intrinsics --release
- run: cargo test --features=no_avx512,no_avx2,no_sse41,pure --release
# No SSE2
- run: cargo test --features=no_avx512,no_avx2,no_sse41,no_sse2
- run: cargo test --features=no_avx512,no_avx2,no_sse41,no_sse2,prefer_intrinsics
- run: cargo test --features=no_avx512,no_avx2,no_sse41,no_sse2,pure
- run: cargo test --features=no_avx512,no_avx2,no_sse41,no_sse2 --release
- run: cargo test --features=no_avx512,no_avx2,no_sse41,no_sse2,prefer_intrinsics --release
- run: cargo test --features=no_avx512,no_avx2,no_sse41,no_sse2,pure --release
# Test benchmarks. RUSTC_BOOTSTRAP=1 lets this run on non-nightly toolchains.
- run: cargo test --benches --features=rayon
env:
RUSTC_BOOTSTRAP: 1
# Test vectors.
- name: test vectors
run: cargo test
working-directory: ./test_vectors
- name: test vectors intrinsics
run: cargo test --features=prefer_intrinsics
working-directory: ./test_vectors
- name: test vectors pure
run: cargo test --features=pure
working-directory: ./test_vectors
# Test C code.
- name: cargo test C bindings assembly
run: cargo test
working-directory: ./c/blake3_c_rust_bindings
- name: cargo test C bindings intrinsics
run: cargo test --features=prefer_intrinsics
working-directory: ./c/blake3_c_rust_bindings
- name: cargo test C bindings no AVX-512
run: cargo test
working-directory: ./c/blake3_c_rust_bindings
env:
CFLAGS: -DBLAKE3_NO_AVX512
- name: cargo test C bindings no AVX2
run: cargo test
working-directory: ./c/blake3_c_rust_bindings
env:
CFLAGS: -DBLAKE3_NO_AVX512 -DBLAKE3_NO_AVX2
- name: cargo test C bindings no SSE41
run: cargo test
working-directory: ./c/blake3_c_rust_bindings
env:
CFLAGS: -DBLAKE3_NO_AVX512 -DBLAKE3_NO_AVX2 -DBLAKE3_NO_SSE41
- name: cargo test C bindings no SSE2
run: cargo test
working-directory: ./c/blake3_c_rust_bindings
env:
CFLAGS: -DBLAKE3_NO_AVX512 -DBLAKE3_NO_AVX2 -DBLAKE3_NO_SSE41 -DBLAKE3_NO_SSE2
# Reference impl doc test.
- name: reference impl doc test
run: cargo test
working-directory: ./reference_impl
b3sum_tests:
name: b3sum ${{ matrix.target.name }} ${{ matrix.channel }}
runs-on: ${{ matrix.target.os }}
strategy:
fail-fast: false
matrix:
target: [
{ "os": "ubuntu-latest", "toolchain": "x86_64-unknown-linux-gnu", "name": "Linux GNU" },
{ "os": "macOS-latest", "toolchain": "x86_64-apple-darwin", "name": "macOS" },
{ "os": "windows-latest", "toolchain": "x86_64-pc-windows-msvc", "name": "Windows MSVC" },
{ "os": "windows-latest", "toolchain": "x86_64-pc-windows-gnu", "name": "Windows GNU" }
]
channel: [
"stable",
"beta",
"nightly",
# The b3sum MSRV is sometimes higher than the blake3 crate's, because
# b3sum depends on Clap. We check in the b3sum Cargo.lock, so Clap
# update shouldn't randomly break us here.
"1.74.1",
]
steps:
- uses: actions/checkout@v4
- uses: dtolnay/rust-toolchain@master
with:
toolchain: ${{ format('{0}-{1}', matrix.channel, matrix.target.toolchain) }}
# Test b3sum.
- name: test b3sum
run: cargo test
working-directory: ./b3sum
- name: test b3sum --no-default-features
run: cargo test --no-default-features
working-directory: ./b3sum
cross_tests:
name: cross ${{ matrix.arch }}
runs-on: ubuntu-latest
strategy:
fail-fast: false
matrix:
arch:
- i586-unknown-linux-musl
- i686-unknown-linux-musl
- armv7-unknown-linux-gnueabihf
- aarch64-unknown-linux-gnu
# Big-endian targets. See https://twitter.com/burntsushi5/status/1695483429997945092.
- powerpc64-unknown-linux-gnu
- s390x-unknown-linux-gnu
steps:
- uses: actions/checkout@v4
- uses: dtolnay/rust-toolchain@stable
- run: cargo install cross
# Test the portable implementation on everything.
- run: cross test --target ${{ matrix.arch }}
# Test building for ancient i386 processors without guaranteed SSE2 support.
- run: cross rustc --target ${{ matrix.arch }} -- -C target-cpu=i386
if: startsWith(matrix.arch, 'i586-') || startsWith(matrix.arch, 'i686-')
# Test the NEON implementation on ARM targets.
- run: cross test --target ${{ matrix.arch }} --features=neon
if: startsWith(matrix.arch, 'armv7-') || startsWith(matrix.arch, 'aarch64-')
# NEON is enabled by default on aarch64, disabling it through the no_neon feature.
- run: cross test --target ${{ matrix.arch }} --features=no_neon
if: startsWith(matrix.arch, 'aarch64-')
# Test vectors. Note that this uses a hacky script due to path dependency limitations.
- run: ./test_vectors/cross_test.sh --target ${{ matrix.arch }}
# C code. Same issue with the hacky script.
- run: ./c/blake3_c_rust_bindings/cross_test.sh --target ${{ matrix.arch }}
- run: ./c/blake3_c_rust_bindings/cross_test.sh --target ${{ matrix.arch }} --features=neon
if: startsWith(matrix.arch, 'armv7-') || startsWith(matrix.arch, 'aarch64-')
# Currently only on x86.
c_tests:
name: C tests tbb=${{ matrix.tbb }} simd=${{ matrix.simd }}
runs-on: ubuntu-latest
strategy:
fail-fast: false
matrix:
tbb: ["OFF", "ON"]
simd: ["x86-intrinsics", "amd64-asm"]
steps:
- uses: actions/checkout@v4
- run: |
sudo apt-get update
sudo apt-get install ninja-build libtbb-dev libtbb12
# Test the intrinsics-based and assembly-based implementations.
- run: |
cmake --fresh -S c -B c/build -G Ninja "-DBLAKE3_TBB_PARALLELISM=OFF" "-DBLAKE3_SIMD_TYPE=${{ matrix.simd }}"
cmake --build c/build --target test
cat c/build/Testing/Temporary/LastTest.log
- run: |
cmake --fresh -S c -B c/build -G Ninja "-DBLAKE3_TBB_PARALLELISM=OFF" "-DBLAKE3_SIMD_TYPE=${{ matrix.simd }}" "-DBLAKE3_NO_SSE2=1"
cmake --build c/build --target test
cat c/build/Testing/Temporary/LastTest.log
- run: |
cmake --fresh -S c -B c/build -G Ninja "-DBLAKE3_TBB_PARALLELISM=OFF" "-DBLAKE3_SIMD_TYPE=${{ matrix.simd }}" "-DBLAKE3_NO_SSE2=1" "-DBLAKE3_NO_SSE41=1"
cmake --build c/build --target test
cat c/build/Testing/Temporary/LastTest.log
- run: |
cmake --fresh -S c -B c/build -G Ninja "-DBLAKE3_TBB_PARALLELISM=OFF" "-DBLAKE3_SIMD_TYPE=${{ matrix.simd }}" "-DBLAKE3_NO_SSE2=1" "-DBLAKE3_NO_SSE41=1" "-DBLAKE3_NO_AVX2=1"
cmake --build c/build --target test
cat c/build/Testing/Temporary/LastTest.log
- run: |
cmake --fresh -S c -B c/build -G Ninja "-DBLAKE3_TBB_PARALLELISM=OFF" "-DBLAKE3_SIMD_TYPE=${{ matrix.simd }}" "-DBLAKE3_NO_SSE2=1" "-DBLAKE3_NO_SSE41=1" "-DBLAKE3_NO_AVX2=1" "-DBLAKE3_NO_AVX512=1"
cmake --build c/build --target test
cat c/build/Testing/Temporary/LastTest.log
# Test with TBB disabled/enabled.
- run: |
cmake --fresh -S c -B c/build -G Ninja "-DBLAKE3_TBB_PARALLELISM=${{ matrix.tbb }}"
cmake --build c/build --target test
cat c/build/Testing/Temporary/LastTest.log
# Build the example with TBB disabled/enabled.
- run: |
cmake --fresh -S c -B c/build -G Ninja
cmake --build c/build --target example
# Note that this jobs builds AArch64 binaries from an x86_64 host.
build_apple_silicon:
name: build for Apple Silicon
runs-on: macOS-latest
strategy:
fail-fast: false
steps:
- uses: actions/checkout@v4
- uses: dtolnay/rust-toolchain@stable
with:
targets: aarch64-apple-darwin
- name: build blake3
run: cargo build --target aarch64-apple-darwin
- name: build b3sum
run: cargo build --target aarch64-apple-darwin
working-directory: ./b3sum
build_tinycc:
name: build with the Tiny C Compiler
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v4
- name: install TCC
run: sudo apt-get install -y tcc
- name: compile
run: >
tcc -shared -O3 -o libblake3.so \
-DBLAKE3_NO_SSE2 -DBLAKE3_NO_SSE41 -DBLAKE3_NO_AVX2 -DBLAKE3_NO_AVX512 \
blake3.c blake3_dispatch.c blake3_portable.c
working-directory: ./c
# See https://github.com/BLAKE3-team/BLAKE3/issues/271 for why we test this.
# Note that this isn't guaranteed to execute on an AVX-512-supporting server,
# but hopefully at least some of the time it will.
gcc54:
name: "compile and test with GCC 5.4"
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v4
- uses: addnab/docker-run-action@v3
with:
image: gcc:5.4
options: -v ${{ github.workspace }}:/work
run: |
cat /proc/cpuinfo
curl https://sh.rustup.rs -sSf | sh -s -- -y --profile minimal
cd /work
~/.cargo/bin/cargo test --features prefer_intrinsics
# CMake build test (Library only).
cmake_build:
name: CMake ${{ matrix.os }} CC=${{ matrix.toolchain.cc }} CXX=${{ matrix.toolchain.cxx }} tbb=${{ matrix.tbb }}
runs-on: ${{ matrix.os }}
strategy:
fail-fast: false
matrix:
os: ["ubuntu-latest", "macOS-latest", "windows-latest"]
toolchain: [
{ cc: gcc, cxx: g++ },
{ cc: cl, cxx: cl },
{ cc: clang, cxx: clang++ }
]
tbb: ["OFF", "ON"]
exclude:
- os: macOS-latest
toolchain: { cc: cl, cxx: cl }
- os: macOS-latest
toolchain: { cc: gcc, cxx: g++ }
- os: ubuntu-latest
toolchain: { cc: cl, cxx: cl }
- os: windows-latest
toolchain: { cc: gcc, cxx: g++ }
tbb: "ON"
- os: windows-latest
toolchain: { cc: clang, cxx: clang++ }
tbb: "ON"
include:
- os: windows-latest
toolchain: { cc: clang-cl, cxx: clang-cl }
tbb: "OFF"
- os: windows-latest
toolchain: { cc: clang-cl, cxx: clang-cl }
tbb: "ON"
steps:
- uses: actions/checkout@v4
- run: |
sudo apt-get update
sudo apt-get install ninja-build libtbb-dev libtbb12
if: matrix.os == 'ubuntu-latest'
- run: |
brew update
brew install ninja tbb
if: matrix.os == 'macOS-latest'
- run: |
choco install ninja
if: matrix.os == 'windows-latest'
- run: |
cmake --fresh -S c -B c/build -G Ninja -DCMAKE_C_COMPILER=${{ matrix.toolchain.cc }} -DCMAKE_CXX_COMPILER=${{ matrix.toolchain.cxx }} -DCMAKE_INSTALL_PREFIX=${{github.workspace}}/target -DBLAKE3_TBB_PARALLELISM=${{ matrix.tbb }}
cmake --build c/build --target install
if: matrix.os != 'windows-latest'
- shell: cmd
run: |
call "C:/Program Files/Microsoft Visual Studio/2022/Enterprise/VC/Auxiliary/Build/vcvarsall.bat" x64
cmake --fresh -S c -B c/build -G Ninja -DCMAKE_C_COMPILER=${{ matrix.toolchain.cc }} -DCMAKE_CXX_COMPILER=${{ matrix.toolchain.cxx }} -DCMAKE_INSTALL_PREFIX=${{github.workspace}}/target -DBLAKE3_TBB_PARALLELISM=${{ matrix.tbb }} -DBLAKE3_TBB_ALLOW_FETCHING=YES
cmake --build c/build --target install
if: matrix.os == 'windows-latest'
miri_smoketest:
name: Miri smoketest
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v4
- uses: dtolnay/rust-toolchain@nightly
with:
components: miri
# Currently the test search "miri" only matches "test_miri_smoketest", but
# we might add more. If this accidentally picks up anything incompatible or
# slow, we can narrow it.
- run: cargo miri test miri