Skip to content

Commit

Permalink
Regenerate PTX test
Browse files Browse the repository at this point in the history
Overwrites all generated PTX tests and runs `pre-commit run --all-files`
  • Loading branch information
bernhardmgruber committed Nov 25, 2024
1 parent 0b36a7d commit 59a6584
Show file tree
Hide file tree
Showing 49 changed files with 42 additions and 42 deletions.
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
__global__ void test_cp_reduce_async_bulk_bf16(void** fn_ptr)
{
# if __cccl_ptx_isa >= 800
#if __cccl_ptx_isa >= 800
NV_IF_TARGET(
NV_PROVIDES_SM_90,
(
Expand All @@ -12,9 +12,9 @@ __global__ void test_cp_reduce_async_bulk_bf16(void** fn_ptr)
__nv_bfloat16*,
const __nv_bfloat16*,
uint32_t)>(cuda::ptx::cp_reduce_async_bulk));));
# endif // __cccl_ptx_isa >= 800
#endif // __cccl_ptx_isa >= 800

# if __cccl_ptx_isa >= 800
#if __cccl_ptx_isa >= 800
NV_IF_TARGET(
NV_PROVIDES_SM_90,
(
Expand All @@ -26,9 +26,9 @@ __global__ void test_cp_reduce_async_bulk_bf16(void** fn_ptr)
__nv_bfloat16*,
const __nv_bfloat16*,
uint32_t)>(cuda::ptx::cp_reduce_async_bulk));));
# endif // __cccl_ptx_isa >= 800
#endif // __cccl_ptx_isa >= 800

# if __cccl_ptx_isa >= 800
#if __cccl_ptx_isa >= 800
NV_IF_TARGET(
NV_PROVIDES_SM_90,
(
Expand All @@ -40,5 +40,5 @@ __global__ void test_cp_reduce_async_bulk_bf16(void** fn_ptr)
__nv_bfloat16*,
const __nv_bfloat16*,
uint32_t)>(cuda::ptx::cp_reduce_async_bulk));));
# endif // __cccl_ptx_isa >= 800
#endif // __cccl_ptx_isa >= 800
}
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
__global__ void test_cp_reduce_async_bulk_f16(void** fn_ptr)
{
# if __cccl_ptx_isa >= 800
#if __cccl_ptx_isa >= 800
NV_IF_TARGET(
NV_PROVIDES_SM_90,
(
Expand All @@ -9,9 +9,9 @@ __global__ void test_cp_reduce_async_bulk_f16(void** fn_ptr)
static_cast<void (*)(
cuda::ptx::space_global_t, cuda::ptx::space_shared_t, cuda::ptx::op_min_t, __half*, const __half*, uint32_t)>(
cuda::ptx::cp_reduce_async_bulk));));
# endif // __cccl_ptx_isa >= 800
#endif // __cccl_ptx_isa >= 800

# if __cccl_ptx_isa >= 800
#if __cccl_ptx_isa >= 800
NV_IF_TARGET(
NV_PROVIDES_SM_90,
(
Expand All @@ -20,9 +20,9 @@ __global__ void test_cp_reduce_async_bulk_f16(void** fn_ptr)
static_cast<void (*)(
cuda::ptx::space_global_t, cuda::ptx::space_shared_t, cuda::ptx::op_max_t, __half*, const __half*, uint32_t)>(
cuda::ptx::cp_reduce_async_bulk));));
# endif // __cccl_ptx_isa >= 800
#endif // __cccl_ptx_isa >= 800

# if __cccl_ptx_isa >= 800
#if __cccl_ptx_isa >= 800
NV_IF_TARGET(
NV_PROVIDES_SM_90,
(
Expand All @@ -31,5 +31,5 @@ __global__ void test_cp_reduce_async_bulk_f16(void** fn_ptr)
static_cast<void (*)(
cuda::ptx::space_global_t, cuda::ptx::space_shared_t, cuda::ptx::op_add_t, __half*, const __half*, uint32_t)>(
cuda::ptx::cp_reduce_async_bulk));));
# endif // __cccl_ptx_isa >= 800
#endif // __cccl_ptx_isa >= 800
}
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/barrier_cluster.inc"
#include "generated/barrier_cluster.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/cp_async_bulk_commit_group.inc"
#include "generated/cp_async_bulk_commit_group.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/cp_async_bulk.inc"
#include "generated/cp_async_bulk.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -33,7 +33,7 @@
*
*/

#include "generated/cp_async_bulk_multicast.inc"
#include "generated/cp_async_bulk_multicast.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/cp_async_bulk_tensor.inc"
#include "generated/cp_async_bulk_tensor.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -33,7 +33,7 @@
*
*/

#include "generated/cp_async_bulk_tensor_multicast.inc"
#include "generated/cp_async_bulk_tensor_multicast.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/cp_async_bulk_wait_group.inc"
#include "generated/cp_async_bulk_wait_group.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,14 +31,14 @@
*
*/

#include "generated/cp_reduce_async_bulk.inc"
#include "generated/cp_reduce_async_bulk.h"

#ifdef _LIBCUDACXX_HAS_NVF16
# include "generated/cp_reduce_async_bulk_f16.inc"
# include "generated/cp_reduce_async_bulk_f16.h"
#endif // _LIBCUDACXX_HAS_NVF16

#ifdef _LIBCUDACXX_HAS_NVBF16
# include "generated/cp_reduce_async_bulk_bf16.inc"
# include "generated/cp_reduce_async_bulk_bf16.h"
#endif // _LIBCUDACXX_HAS_NVBF16

int main(int, char**)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/cp_reduce_async_bulk_tensor.inc"
#include "generated/cp_reduce_async_bulk_tensor.h"

int main(int, char**)
{
Expand Down
10 changes: 5 additions & 5 deletions libcudacxx/test/libcudacxx/cuda/ptx/ptx.fence.compile.pass.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -31,11 +31,11 @@
*
*/

#include "generated/fence.inc"
#include "generated/fence_mbarrier_init.inc"
#include "generated/fence_proxy_alias.inc"
#include "generated/fence_proxy_async.inc"
#include "generated/fence_proxy_tensormap_generic.inc"
#include "generated/fence.h"
#include "generated/fence_mbarrier_init.h"
#include "generated/fence_proxy_alias.h"
#include "generated/fence_proxy_async.h"
#include "generated/fence_proxy_tensormap_generic.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -32,7 +32,7 @@
*
*/

#include "generated/get_sreg.inc"
#include "generated/get_sreg.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/getctarank.inc"
#include "generated/getctarank.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,9 +31,9 @@
*
*/

#include "generated/mbarrier_arrive.inc"
#include "generated/mbarrier_arrive_expect_tx.inc"
#include "generated/mbarrier_arrive_no_complete.inc"
#include "generated/mbarrier_arrive.h"
#include "generated/mbarrier_arrive_expect_tx.h"
#include "generated/mbarrier_arrive_no_complete.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/mbarrier_init.inc"
#include "generated/mbarrier_init.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,10 +31,10 @@
*
*/

#include "generated/mbarrier_try_wait.inc"
#include "generated/mbarrier_try_wait_parity.inc"
#include "generated/mbarrier_wait.inc"
#include "generated/mbarrier_wait_parity.inc"
#include "generated/mbarrier_try_wait.h"
#include "generated/mbarrier_try_wait_parity.h"
#include "generated/mbarrier_wait.h"
#include "generated/mbarrier_wait_parity.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/red_async.inc"
#include "generated/red_async.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/st_async.inc"
#include "generated/st_async.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/tensormap_cp_fenceproxy.inc"
#include "generated/tensormap_cp_fenceproxy.h"

int main(int, char**)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@
*
*/

#include "generated/tensormap_replace.inc"
#include "generated/tensormap_replace.h"

int main(int, char**)
{
Expand Down

0 comments on commit 59a6584

Please sign in to comment.