Skip to content

Commit

Permalink
Merge branch 'branch-22.04' into jni-mixed-semi-join
Browse files Browse the repository at this point in the history
  • Loading branch information
jlowe committed Jan 25, 2022
2 parents 5225a1c + a552afb commit 00eee6f
Show file tree
Hide file tree
Showing 245 changed files with 4,595 additions and 2,010 deletions.
27 changes: 27 additions & 0 deletions .clang-tidy
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
---
Checks:
'modernize-*,
-modernize-use-equals-default,
-modernize-concat-nested-namespaces,
-modernize-use-trailing-return-type'

# -modernize-use-equals-default # auto-fix is broken (doesn't insert =default correctly)
# -modernize-concat-nested-namespaces # auto-fix is broken (can delete code)
# -modernize-use-trailing-return-type # just a preference

WarningsAsErrors: ''
HeaderFilterRegex: ''
AnalyzeTemporaryDtors: false
FormatStyle: none
CheckOptions:
- key: modernize-loop-convert.MaxCopySize
value: '16'
- key: modernize-loop-convert.MinConfidence
value: reasonable
- key: modernize-pass-by-value.IncludeStyle
value: llvm
- key: modernize-replace-auto-ptr.IncludeStyle
value: llvm
- key: modernize-use-nullptr.NullMacros
value: 'NULL'
...
4 changes: 4 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
@@ -1,3 +1,7 @@
# cuDF 22.04.00 (Date TBD)

Please see https://github.com/rapidsai/cudf/releases/tag/v22.04.00a for the latest changes to this development branch.

# cuDF 22.02.00 (Date TBD)

Please see https://github.com/rapidsai/cudf/releases/tag/v22.02.00a for the latest changes to this development branch.
Expand Down
76 changes: 0 additions & 76 deletions Dockerfile

This file was deleted.

2 changes: 1 addition & 1 deletion ci/benchmark/build.sh
Original file line number Diff line number Diff line change
Expand Up @@ -37,7 +37,7 @@ export GBENCH_BENCHMARKS_DIR="$WORKSPACE/cpp/build/gbenchmarks/"
export LIBCUDF_KERNEL_CACHE_PATH="$HOME/.jitify-cache"

# Dask & Distributed git tag
export DASK_DISTRIBUTED_GIT_TAG='main'
export DASK_DISTRIBUTED_GIT_TAG='2022.01.0'

function remove_libcudf_kernel_cache_dir {
EXITCODE=$?
Expand Down
5 changes: 3 additions & 2 deletions ci/cpu/prebuild.sh
Original file line number Diff line number Diff line change
Expand Up @@ -4,12 +4,13 @@
set -e

DEFAULT_CUDA_VER="11.5"
DEFAULT_PYTHON_VER="3.8"

#Always upload cudf Python package
export UPLOAD_CUDF=1

#Upload libcudf once per CUDA
if [[ "$PYTHON" == "3.7" ]]; then
if [[ "$PYTHON" == "${DEFAULT_PYTHON_VER}" ]]; then
export UPLOAD_LIBCUDF=1
else
export UPLOAD_LIBCUDF=0
Expand All @@ -23,7 +24,7 @@ else
fi

#We only want to upload libcudf_kafka once per python/CUDA combo
if [[ "$PYTHON" == "3.7" ]] && [[ "$CUDA" == "${DEFAULT_CUDA_VER}" ]]; then
if [[ "$PYTHON" == "${DEFAULT_PYTHON_VER}" ]] && [[ "$CUDA" == "${DEFAULT_CUDA_VER}" ]]; then
export UPLOAD_LIBCUDF_KAFKA=1
else
export UPLOAD_LIBCUDF_KAFKA=0
Expand Down
4 changes: 2 additions & 2 deletions ci/gpu/build.sh
Original file line number Diff line number Diff line change
Expand Up @@ -31,10 +31,10 @@ export GIT_DESCRIBE_TAG=`git describe --tags`
export MINOR_VERSION=`echo $GIT_DESCRIBE_TAG | grep -o -E '([0-9]+\.[0-9]+)'`

# Dask & Distributed git tag
export DASK_DISTRIBUTED_GIT_TAG='main'
export DASK_DISTRIBUTED_GIT_TAG='2022.01.0'

# ucx-py version
export UCX_PY_VERSION='0.24.*'
export UCX_PY_VERSION='0.25.*'

################################################################################
# TRAP - Setup trap for removing jitify cache
Expand Down
2 changes: 1 addition & 1 deletion ci/gpu/java.sh
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@ export GIT_DESCRIBE_TAG=`git describe --tags`
export MINOR_VERSION=`echo $GIT_DESCRIBE_TAG | grep -o -E '([0-9]+\.[0-9]+)'`

# ucx-py version
export UCX_PY_VERSION='0.24.*'
export UCX_PY_VERSION='0.25.*'

################################################################################
# TRAP - Setup trap for removing jitify cache
Expand Down
7 changes: 4 additions & 3 deletions conda/environments/cudf_dev_cuda11.5.yml
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ dependencies:
- clang=11.1.0
- clang-tools=11.1.0
- cupy>=9.5.0,<11.0.0a0
- rmm=22.02.*
- rmm=22.04.*
- cmake>=3.20.1
- cmake_setuptools>=0.1.3
- python>=3.7,<3.9
Expand All @@ -33,6 +33,7 @@ dependencies:
- ipython
- pandoc=<2.0.0
- cudatoolkit=11.5
- cuda-python >=11.5,<12.0
- pip
- flake8=3.8.3
- black=19.10
Expand All @@ -41,8 +42,8 @@ dependencies:
- pydocstyle=6.1.1
- typing_extensions
- pre-commit
- dask>=2021.11.1
- distributed>=2021.11.1
- dask>=2021.11.1,<=2022.01.0
- distributed>=2021.11.1,<=2022.01.0
- streamz
- arrow-cpp=5.0.0
- dlpack>=0.5,<0.6.0a0
Expand Down
2 changes: 1 addition & 1 deletion conda/recipes/cudf/meta.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -52,7 +52,7 @@ requirements:
- packaging
- cachetools
- ptxcompiler # [linux64] # CUDA enhanced compatibility. See https://github.com/rapidsai/ptxcompiler

- cuda-python >=11.5,<12.0
test: # [linux64]
requires: # [linux64]
- cudatoolkit {{ cuda_version }}.* # [linux64]
Expand Down
2 changes: 1 addition & 1 deletion conda/recipes/cudf_kafka/meta.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -35,7 +35,7 @@ requirements:
run:
- python
- libcudf_kafka {{ version }}
- python-confluent-kafka >=1.7.0,<1.8.0a0=py{{ py_version_numeric }}*
- python-confluent-kafka >=1.7.0,<1.8.0a0
- cudf {{ version }}

test: # [linux64]
Expand Down
8 changes: 4 additions & 4 deletions conda/recipes/custreamz/meta.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -26,15 +26,15 @@ build:
requirements:
host:
- python
- python-confluent-kafka >=1.7.0,<1.8.0a0=py{{ py_version_numeric }}*
- python-confluent-kafka >=1.7.0,<1.8.0a0
- cudf_kafka {{ version }}
run:
- python
- streamz
- cudf {{ version }}
- dask>=2021.11.1,<=2021.11.2
- distributed>=2021.11.1,<=2021.11.2
- python-confluent-kafka >=1.7.0,<1.8.0a0=py{{ py_version_numeric }}*
- dask>=2021.11.1,<=2022.01.0
- distributed>=2021.11.1,<=2022.01.0
- python-confluent-kafka >=1.7.0,<1.8.0a0
- cudf_kafka {{ version }}

test: # [linux64]
Expand Down
8 changes: 4 additions & 4 deletions conda/recipes/dask-cudf/meta.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -27,14 +27,14 @@ requirements:
host:
- python
- cudf {{ version }}
- dask>=2021.11.1
- distributed>=2021.11.1
- dask>=2021.11.1,<=2022.01.0
- distributed>=2021.11.1,<=2022.01.0
- cudatoolkit {{ cuda_version }}
run:
- python
- cudf {{ version }}
- dask>=2021.11.1
- distributed>=2021.11.1
- dask>=2021.11.1,<=2022.01.0
- distributed>=2021.11.1,<=2022.01.0
- {{ pin_compatible('cudatoolkit', max_pin='x', min_pin='x') }}

test: # [linux64]
Expand Down
13 changes: 10 additions & 3 deletions cpp/CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
# =============================================================================
# Copyright (c) 2018-2021, NVIDIA CORPORATION.
# Copyright (c) 2018-2022, NVIDIA CORPORATION.
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except
# in compliance with the License. You may obtain a copy of the License at
Expand All @@ -25,7 +25,7 @@ rapids_cuda_init_architectures(CUDF)

project(
CUDF
VERSION 22.02.00
VERSION 22.04.00
LANGUAGES C CXX CUDA
)

Expand Down Expand Up @@ -186,6 +186,8 @@ add_library(
src/binaryop/compiled/Mod.cu
src/binaryop/compiled/Mul.cu
src/binaryop/compiled/NullEquals.cu
src/binaryop/compiled/NullLogicalOr.cu
src/binaryop/compiled/NullLogicalAnd.cu
src/binaryop/compiled/NullMax.cu
src/binaryop/compiled/NullMin.cu
src/binaryop/compiled/PMod.cu
Expand Down Expand Up @@ -322,11 +324,16 @@ add_library(
src/jit/parser.cpp
src/jit/type.cpp
src/join/conditional_join.cu
src/join/mixed_join.cu
src/join/cross_join.cu
src/join/hash_join.cu
src/join/join.cu
src/join/join_utils.cu
src/join/mixed_join.cu
src/join/mixed_join_kernels.cu
src/join/mixed_join_kernels_semi.cu
src/join/mixed_join_semi.cu
src/join/mixed_join_size_kernels.cu
src/join/mixed_join_size_kernels_semi.cu
src/join/semi_join.cu
src/lists/contains.cu
src/lists/combine/concatenate_list_elements.cu
Expand Down
3 changes: 2 additions & 1 deletion cpp/benchmarks/common/generate_benchmark_input.cpp
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
/*
* Copyright (c) 2020-2021, NVIDIA CORPORATION.
* Copyright (c) 2020-2022, NVIDIA CORPORATION.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
Expand Down Expand Up @@ -31,6 +31,7 @@

#include <future>
#include <memory>
#include <optional>
#include <random>
#include <thread>
#include <vector>
Expand Down
4 changes: 2 additions & 2 deletions cpp/benchmarks/common/generate_benchmark_input.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -300,8 +300,8 @@ class data_profile {

auto get_bool_probability() const { return bool_probability; }
auto get_null_frequency() const { return null_frequency; };
auto get_cardinality() const { return cardinality; };
auto get_avg_run_length() const { return avg_run_length; };
[[nodiscard]] auto get_cardinality() const { return cardinality; };
[[nodiscard]] auto get_avg_run_length() const { return avg_run_length; };

// Users should pass integral values for bounds when setting the parameters for types that have
// discrete distributions (integers, strings, lists). Otherwise the call will have no effect.
Expand Down
6 changes: 4 additions & 2 deletions cpp/benchmarks/copying/contiguous_split_benchmark.cu
Original file line number Diff line number Diff line change
Expand Up @@ -51,10 +51,12 @@ void BM_contiguous_split_common(benchmark::State& state,
std::vector<std::unique_ptr<cudf::column>> columns(src_cols.size());
std::transform(src_cols.begin(), src_cols.end(), columns.begin(), [](T& in) {
auto ret = in.release();
ret->null_count();
// computing the null count is not a part of the benchmark's target code path, and we want the
// property to be pre-computed so that we measure the performance of only the intended code path
[[maybe_unused]] auto const nulls = ret->null_count();
return ret;
});
cudf::table src_table(std::move(columns));
auto const src_table = cudf::table(std::move(columns));

for (auto _ : state) {
cuda_event_timer raii(state, true); // flush_l2_cache = true, stream = 0
Expand Down
2 changes: 1 addition & 1 deletion cpp/benchmarks/copying/gather_benchmark.cu
Original file line number Diff line number Diff line change
Expand Up @@ -39,7 +39,7 @@ template <class TypeParam, bool coalesce>
void BM_gather(benchmark::State& state)
{
const cudf::size_type source_size{(cudf::size_type)state.range(0)};
const cudf::size_type n_cols = (cudf::size_type)state.range(1);
const auto n_cols = (cudf::size_type)state.range(1);

// Every element is valid
auto data = cudf::detail::make_counting_transform_iterator(0, [](auto i) { return i; });
Expand Down
2 changes: 1 addition & 1 deletion cpp/benchmarks/copying/scatter_benchmark.cu
Original file line number Diff line number Diff line change
Expand Up @@ -40,7 +40,7 @@ template <class TypeParam, bool coalesce>
void BM_scatter(benchmark::State& state)
{
const cudf::size_type source_size{(cudf::size_type)state.range(0)};
const cudf::size_type n_cols = (cudf::size_type)state.range(1);
const auto n_cols = (cudf::size_type)state.range(1);

// Every element is valid
auto data = cudf::detail::make_counting_transform_iterator(0, [](auto i) { return i; });
Expand Down
Loading

0 comments on commit 00eee6f

Please sign in to comment.