def execute(self, repeat=1, unbind=True):
    """Launch the prepared kernel ``repeat`` times, then optionally unbind.

    The kernel is looked up through ``kernel_specs.get_kernel`` using this
    object's ``kernel_name`` and ``kernel_opts``. Before each launch, when
    ``self.zero`` is truthy, the memset described by ``self.zero_args`` is
    issued first.

    Args:
        repeat: Number of times to launch the kernel.
        unbind: When true, unbind the output transform and clear
            ``zero_args`` and ``kernel_args[2:6]`` once all launches have
            been issued.
    """
    compiled = kernel_specs.get_kernel(self.kernel_name, self.kernel_opts)

    for _ in range(repeat):
        if self.zero:
            drv.memset_d32_async(*self.zero_args)
        compiled.prepared_async_call(*self.kernel_args)
        # NOTE(review): assumed to run once per launch (inside the loop);
        # confirm against the original nesting.
        self.output_trans.execute()

    if not unbind:
        return

    self.output_trans.unbind()
    self.zero_args = None
    # Presumably slots 2..5 hold the per-call buffers bound earlier;
    # verify against the matching bind step.
    self.kernel_args[2:6] = (None, None, None, None)
# Magic numbers and shift amounts for integer division
# Suitable for when nmax*magic fits in 32 bits
# Shamelessly pulled directly from:
# http://www.hackersdelight.org/hdcodetxt/magicgu.py.txt
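# (web-page residue, not part of the source: "comment list")
# (web-page residue, not part of the source: "article table of contents")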