@@ -314,7 +314,7 @@ def __call__(
314
314
self ,
315
315
queue : Queue | MultiQueue ,
316
316
* args : MultiArray | Array | Buffer | numpy .generic ,
317
- local_mem : int = 0 ,
317
+ cu_dynamic_local_mem : int = 0 ,
318
318
) -> Any :
319
319
"""
320
320
Enqueues the kernel on the devices in the given queue.
@@ -332,8 +332,10 @@ def __call__(
332
332
If an argument is an integer-keyed ``dict``, its values corresponding to the
333
333
device indices the kernel is executed on will be passed as kernel arguments.
334
334
335
+ :param cu_dynamic_local_mem: **CUDA only.** The size of dynamically allocated local
336
+ (shared in CUDA terms) memory, in bytes. That is, the size of
337
+ ``extern __shared__`` arrays in CUDA kernels.
335
338
:param args: kernel arguments.
336
- :param kwds: backend-specific keyword parameters.
337
339
:returns: a list of ``Event`` objects for enqueued kernels in case of PyOpenCL.
338
340
"""
339
341
if isinstance (queue , Queue ):
@@ -357,7 +359,11 @@ def __call__(
357
359
single_queue = queue .queues [device ]
358
360
359
361
pkernel = self ._prepared_kernel_adapters [device ]
360
- ret_val = pkernel (single_queue ._queue_adapter , * kernel_args , local_mem = local_mem ) # noqa: SLF001
362
+ ret_val = pkernel (
363
+ single_queue ._queue_adapter , # noqa: SLF001
364
+ * kernel_args ,
365
+ cu_dynamic_local_mem = cu_dynamic_local_mem ,
366
+ )
361
367
ret_vals .append (ret_val )
362
368
363
369
return ret_vals
@@ -455,11 +461,11 @@ def __call__(
455
461
global_size : Sequence [int ] | Mapping [BoundDevice , Sequence [int ]],
456
462
local_size : Sequence [int ] | None | Mapping [BoundDevice , Sequence [int ] | None ] = None ,
457
463
* args : MultiArray | Array | Buffer | numpy .generic ,
458
- local_mem : int = 0 ,
464
+ cu_dynamic_local_mem : int = 0 ,
459
465
) -> Any :
460
466
"""
461
467
A shortcut for :py:meth:`Kernel.prepare` and subsequent :py:meth:`PreparedKernel.__call__`.
462
468
See their doc entries for details.
463
469
"""
464
470
pkernel = self .prepare (global_size , local_size )
465
- return pkernel (queue , * args , local_mem = local_mem )
471
+ return pkernel (queue , * args , cu_dynamic_local_mem = cu_dynamic_local_mem )
0 commit comments