-
Notifications
You must be signed in to change notification settings - Fork 188
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Overwrites all generated PTX source, test and documentation files and runs `pre-commit run --all-files`
- Loading branch information
1 parent
83d180f
commit 2d1d9db
Showing
58 changed files
with
4,646 additions
and
4,484 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
27 changes: 17 additions & 10 deletions
27
libcudacxx/include/cuda/__ptx/instructions/generated/cp_async_bulk_commit_group.inc
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,21 +1,28 @@ | ||
#ifndef _CUDA_PTX_GENERATED_CP_ASYNC_BULK_COMMIT_GROUP_H_ | ||
#define _CUDA_PTX_GENERATED_CP_ASYNC_BULK_COMMIT_GROUP_H_ | ||
|
||
/* | ||
// cp.async.bulk.commit_group; // PTX ISA 80, SM_90 | ||
template <typename=void> | ||
__device__ static inline void cp_async_bulk_commit_group(); | ||
*/ | ||
#if __cccl_ptx_isa >= 800 | ||
extern "C" _CCCL_DEVICE void __cuda_ptx_cp_async_bulk_commit_group_is_not_supported_before_SM_90__(); | ||
template <typename = void> | ||
template <typename=void> | ||
_CCCL_DEVICE static inline void cp_async_bulk_commit_group() | ||
{ | ||
NV_IF_ELSE_TARGET( | ||
NV_PROVIDES_SM_90, | ||
(asm volatile("cp.async.bulk.commit_group;" | ||
: | ||
: | ||
:);), | ||
( | ||
// Unsupported architectures will have a linker error with a semi-decent error message | ||
__cuda_ptx_cp_async_bulk_commit_group_is_not_supported_before_SM_90__();)); | ||
NV_IF_ELSE_TARGET(NV_PROVIDES_SM_90,( | ||
asm volatile ( | ||
"cp.async.bulk.commit_group;" | ||
: | ||
: | ||
: | ||
); | ||
),( | ||
// Unsupported architectures will have a linker error with a semi-decent error message | ||
__cuda_ptx_cp_async_bulk_commit_group_is_not_supported_before_SM_90__(); | ||
)); | ||
} | ||
#endif // __cccl_ptx_isa >= 800 | ||
|
||
#endif // _CUDA_PTX_GENERATED_CP_ASYNC_BULK_COMMIT_GROUP_H_ |
Oops, something went wrong.