# nabu.processing.padding_opencl
#
# Source of module nabu.processing.padding_opencl
import numpy as np
from ..utils import get_opencl_srcfile
from ..opencl.processing import OpenCLProcessing
from .padding_base import PaddingBase
from ..opencl.utils import __has_pyopencl__

if __has_pyopencl__:
    from ..opencl.memcpy import OpenCLMemcpy2D


class OpenCLPadding(PaddingBase):
    """
    A class for performing padding on GPU using OpenCL
    """

    backend = "opencl"

    # TODO docstring from base class
    def __init__(self, shape, pad_width, mode="constant", opencl_options=None, **kwargs):
        """
        Set up the padding description and the OpenCL resources it needs.

        Parameters
        ----------
        shape:
            Forwarded as-is to ``PaddingBase.__init__``.
        pad_width:
            Forwarded as-is to ``PaddingBase.__init__``.
        mode: str, optional
            Padding mode, forwarded to ``PaddingBase.__init__``.
            Default is "constant".
        opencl_options: dict, optional
            Keyword arguments passed to ``OpenCLProcessing``.
            ``None`` (default) is treated as an empty dict.
        **kwargs:
            Extra keyword arguments forwarded to ``PaddingBase.__init__``.
        """
        super().__init__(shape, pad_width, mode=mode, **kwargs)
        # The same processing object is exposed under two attribute names.
        self.opencl_processing = self.processing = OpenCLProcessing(**(opencl_options or {}))
        self.queue = self.opencl_processing.queue
        self._init_opencl_coordinate_transform()

    def _init_opencl_coordinate_transform(self):
        """
        Create the device-side resources used by ``pad()``.

        In "constant" mode, the pre-filled padded array is uploaded to the
        device and a 2D memcpy helper is created; nothing else is set up.
        In any other mode, the "coordinate_transform" kernel is built from
        "padding.cl" and the row/column coordinate arrays are uploaded.
        """
        if self.mode == "constant":
            self.d_padded_array_constant = self.processing.to_device(
                "d_padded_array_constant", self.padded_array_constant
            )
            # OpenCLMemcpy2D is only imported when pyopencl is available,
            # hence the "possibly used before assignment" lint suppression.
            self.memcpy2D = OpenCLMemcpy2D(ctx=self.processing.ctx, queue=self.queue)  # pylint: disable=E0606
            return
        self._coords_transform_kernel = self.processing.kernel(
            "coordinate_transform",
            filename=get_opencl_srcfile("padding.cl"),
        )
        # Global work size is the padded shape in reversed order.
        self._coords_transform_global_size = self.padded_shape[::-1]
        self.d_coords_rows = self.processing.to_device("d_coords_rows", self.coords_rows)
        self.d_coords_cols = self.processing.to_device("d_coords_cols", self.coords_cols)

    def _pad_constant(self, image, output):
        """
        Pad ``image`` in "constant" mode and write the result into ``output``.

        The image is copied into the interior of the device-side pre-filled
        padded array, which is then copied into ``output``.

        Returns
        -------
        output:
            The ``output`` array that was passed in.
        """
        pad_y, pad_x = self.pad_width
        # Direct slice assignment into the padded device array, i.e.
        #   d_padded_array_constant[pad_y[0]:pad_y[0] + shape[0],
        #                           pad_x[0]:pad_x[0] + shape[1]] = image[:]
        # is not implemented in pyopencl, and cl.enqueue_copy is too
        # cumbersome to use for Buffer <-> Buffer. Use a dedicated kernel instead.
        # This is not optimal (two copies) - TODO write a constant padding kernel
        self.memcpy2D(
            self.d_padded_array_constant,
            image,
            image.shape[::-1],
            dst_offset_xy=(pad_x[0], pad_y[0]),
        )
        output[:] = self.d_padded_array_constant[:]
        return output

    def pad(self, image, output=None):
        """
        Pad an array.

        Parameters
        ----------
        image: pyopencl array
            Image to pad
        output: pyopencl array
            Output image. If provided, must be in the expected shape.
            If not provided, an array of shape ``self.padded_shape`` is
            obtained from ``self.processing.allocate_array("d_output", ...)``.

        Returns
        -------
        output: pyopencl array
            The padded image (the ``output`` argument when it was provided).
        """
        if output is None:
            output = self.processing.allocate_array("d_output", self.padded_shape)
        if self.mode == "constant":
            return self._pad_constant(image, output)
        self._coords_transform_kernel(
            image,
            output,
            self.d_coords_cols,
            self.d_coords_rows,
            np.int32(self.shape[1]),
            np.int32(self.padded_shape[1]),
            np.int32(self.padded_shape[0]),
            global_size=self._coords_transform_global_size,
        )
        return output