Skip to content
This repository was archived by the owner on Mar 21, 2024. It is now read-only.
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
26 commits
Select commit Hold shift + click to select a range
4c579e2
Bump CUB for CDP update.
alliepiper Jun 29, 2022
4182f8e
Use seq algos for CDP launches on sm90+.
alliepiper Jun 29, 2022
3c9c838
Ensure kernels are instantiated for CDPv1 nvcc device passes.
alliepiper Aug 12, 2022
f27d762
Add changelog for 1.17.1.
alliepiper Aug 15, 2022
37a8d2b
Bump CUB.
alliepiper Aug 15, 2022
1fe97c6
Add Thrust 2.0.0 changelog.
alliepiper Aug 15, 2022
d6e9274
Bump CUB.
alliepiper Aug 15, 2022
92b3aaf
Merge branch 'ctk12_cdp_updates' into staging/ctk_12.0
alliepiper Aug 16, 2022
89a5fbd
Bump version to 2.0.1 for CTK12.
alliepiper Aug 16, 2022
8fe85d8
Add sm90 option to CMake builds.
alliepiper Aug 16, 2022
d31abae
Merge branch 'ctk12_sm90_cmake_option' into staging/ctk_12.0
alliepiper Aug 16, 2022
5372a29
Bump CUB.
alliepiper Aug 17, 2022
1e6fb36
Move sync from for_each to parallel_for to fix CDP usages.
alliepiper Aug 26, 2022
512272c
Merge pull request #1776 from allisonvacanti/cdp_for_each_fix_backport
alliepiper Aug 29, 2022
f32a788
Merge remote-tracking branch 'origin/2.0.X' into staging/ctk_12.0
alliepiper Aug 29, 2022
f58f28c
Only generate per-dialect targets when needed.
Aug 30, 2022
73a4616
Fix FindTBB.cmake for MSVC 2022.
Aug 30, 2022
786e5aa
Merge pull request #1781 from allisonvacanti/c++20_fix_backport
alliepiper Aug 30, 2022
af8317f
Merge remote-tracking branch 'origin/2.0.X' into staging/ctk_12.0
alliepiper Aug 30, 2022
d205a6f
Merge pull request #1799 from miscco/no_throw
miscco Sep 26, 2022
8a2c7e5
Merge branch 'staging/ctk_12.0' into gpgpu
wmaxey Sep 27, 2022
6c518b0
WAR bug on MSVC 2022.
Aug 31, 2022
0c28b7c
Actually really for real remove throw
miscco Oct 5, 2022
cb86111
Bump CUB.
alliepiper Dec 13, 2022
a31906a
Merge branch 'staging/ctk_12.0' into main
alliepiper Dec 13, 2022
bdd6880
Limit gpuCI configurations to CTK only.
Dec 15, 2022
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
43 changes: 0 additions & 43 deletions ci/axis/cpu.yml
Original file line number Diff line number Diff line change
Expand Up @@ -5,11 +5,9 @@

SDK_TYPE:
- cuda
- nvhpc

SDK_VER:
- 11.5.1-devel
- 22.1-devel-cuda11.5

OS_TYPE:
- ubuntu
Expand All @@ -18,7 +16,6 @@ OS_VER:
- 20.04

CXX_TYPE:
- nvcxx
- clang
- gcc
- icc
Expand All @@ -32,55 +29,18 @@ CXX_VER:
- 10
- 11
- 12
- 22.1
- latest

exclude:
# Excludes by `SDK_TYPE`.
- CXX_TYPE: gcc
SDK_TYPE: nvhpc
- CXX_TYPE: clang
SDK_TYPE: nvhpc
- CXX_TYPE: icc
SDK_TYPE: nvhpc
- CXX_TYPE: nvcxx
SDK_TYPE: cuda
# Excludes by `SDK_VER`.
- SDK_TYPE: cuda
SDK_VER: 22.1-devel-cuda11.5
- SDK_TYPE: nvhpc
SDK_VER: 11.5.1-devel
# Excludes by `CXX_VER`.
- CXX_TYPE: nvcxx
CXX_VER: 5
- CXX_TYPE: nvcxx
CXX_VER: 6
- CXX_TYPE: nvcxx
CXX_VER: 7
- CXX_TYPE: nvcxx
CXX_VER: 8
- CXX_TYPE: nvcxx
CXX_VER: 9
- CXX_TYPE: nvcxx
CXX_VER: 10
- CXX_TYPE: nvcxx
CXX_VER: 11
- CXX_TYPE: nvcxx
CXX_VER: 12
- CXX_TYPE: nvcxx
CXX_VER: latest
- CXX_TYPE: gcc
CXX_VER: 12
- CXX_TYPE: gcc
CXX_VER: 22.1
- CXX_TYPE: gcc
CXX_VER: latest
- CXX_TYPE: clang
CXX_VER: 5
- CXX_TYPE: clang
CXX_VER: 6
- CXX_TYPE: clang
CXX_VER: 22.1
- CXX_TYPE: clang
CXX_VER: latest
- CXX_TYPE: icc
Expand All @@ -99,6 +59,3 @@ exclude:
CXX_VER: 11
- CXX_TYPE: icc
CXX_VER: 12
- CXX_TYPE: icc
CXX_VER: 22.1

2 changes: 1 addition & 1 deletion cmake/ThrustCudaConfig.cmake
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
enable_language(CUDA)

set(THRUST_KNOWN_COMPUTE_ARCHS 35 37 50 52 53 60 61 62 70 72 75 80 86)
set(THRUST_KNOWN_COMPUTE_ARCHS 35 37 50 52 53 60 61 62 70 72 75 80 86 90)

# Split CUDA_FLAGS into 3 parts:
#
Expand Down
1 change: 1 addition & 0 deletions docs/github_pages/releases.md
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@ nav_order: 3

| Version | Included In |
|-----------------|-------------------------------------------|
| 2.0.1 | CUDA Toolkit 12.0 |
| 2.0.0 | TBD |
| 1.17.2 | TBD |
| 1.17.1 | TBD |
Expand Down
28 changes: 22 additions & 6 deletions thrust/system/cuda/detail/cdp_dispatch.h
Original file line number Diff line number Diff line change
Expand Up @@ -42,13 +42,29 @@
* \endcode
*/

#ifdef THRUST_RDC_ENABLED
#if defined(CUB_DETAIL_CDPv1)

// seq_impl unused.
// Special case for NVCC -- need to inform the device path about the kernels
// that are launched from the host path.
#if defined(__CUDACC__) && defined(__CUDA_ARCH__)

// seq_impl only used on platforms that do not support device synchronization.
#define THRUST_CDP_DISPATCH(par_impl, seq_impl) \
NV_IF_TARGET(NV_ANY_TARGET, par_impl, par_impl)
if (false) \
{ /* Without this, the device pass won't compile any kernels. */ \
NV_IF_TARGET(NV_ANY_TARGET, par_impl); \
} \
NV_DISPATCH_TARGET(NV_PROVIDES_SM_90, seq_impl, NV_ANY_TARGET, par_impl)

#else // THRUST_RDC_ENABLED
#else // NVCC device pass

// seq_impl only used on platforms that do not support device synchronization.
#define THRUST_CDP_DISPATCH(par_impl, seq_impl) \
NV_DISPATCH_TARGET(NV_PROVIDES_SM_90, seq_impl, NV_ANY_TARGET, par_impl)

#endif // NVCC device pass

#else // CDPv1 unavailable. Always fallback to serial on device:

// Special case for NVCC -- need to inform the device path about the kernels
// that are launched from the host path.
Expand All @@ -62,11 +78,11 @@
} \
NV_IF_TARGET(NV_IS_HOST, par_impl, seq_impl)

#else // NVCC device pass
#else // !(NVCC device pass):

#define THRUST_CDP_DISPATCH(par_impl, seq_impl) \
NV_IF_TARGET(NV_IS_HOST, par_impl, seq_impl)

#endif // NVCC device pass

#endif // THRUST_RDC_ENABLED
#endif // CDP version