Source code for pyfr.backends.cuda.provider

# -*- coding: utf-8 -*-

from pyfr.backends.base import (BaseKernelProvider,
                                BasePointwiseKernelProvider, Kernel)
from pyfr.backends.cuda.generator import CUDAKernelGenerator
from pyfr.backends.cuda.compiler import SourceModule
from pyfr.util import memoize


def get_grid_for_block(block, nrow, ncol=1):
    return (-(-nrow // block[0]), -(-ncol // block[1]), 1)


class CUDAKernelProvider(BaseKernelProvider):
    @memoize
    def _build_kernel(self, name, src, argtypes):
        # Compile the source code and retrieve the function
        mod = SourceModule(self.backend, src)
        return mod.get_function(name, argtypes)


[docs]class CUDAPointwiseKernelProvider(CUDAKernelProvider, BasePointwiseKernelProvider): kernel_generator_cls = CUDAKernelGenerator
[docs] def _instantiate_kernel(self, dims, fun, arglst, argmv): # Determine the block size if len(dims) == 1: block = (64, 1, 1) else: block = (64, 4, 1) # Use this to compute the grid size grid = get_grid_for_block(block, dims[-1]) class PointwiseKernel(Kernel): if any(isinstance(arg, str) for arg in arglst): def run(self, queue, **kwargs): fun.exec_async(grid, block, queue.stream, *[kwargs.get(ka, ka) for ka in arglst]) else: def run(self, queue, **kwargs): fun.exec_async(grid, block, queue.stream, *arglst) return PointwiseKernel(*argmv)