1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88
|
/*
* Copyright (C) 2018-2025 Intel Corporation
*
* SPDX-License-Identifier: MIT
*
*/
R"===(
/*
 * Copies one char per work-item between two pitched 2D regions.
 *
 * Work-item (x, y) reads
 *     src[ x + SrcOrigin.x + ( y + SrcOrigin.y ) * SrcPitch ]
 * and writes the value to
 *     dst[ x + DstOrigin.x + ( y + DstOrigin.y ) * DstPitch ].
 *
 * The kernel performs no bounds checking on either offset.
 */
__kernel void CopyBufferRectBytes2d(
    __global const char* src,
    __global char* dst,
    coord2_t SrcOrigin,
    coord2_t DstOrigin,
    idx_t SrcPitch,
    idx_t DstPitch )
{
    const idx_t col = get_global_id(0);
    const idx_t row = get_global_id(1);

    // Pitch-scaled row contribution to each linear offset.
    const idx_t srcRowTerm = ( row + SrcOrigin.y ) * SrcPitch;
    const idx_t dstRowTerm = ( row + DstOrigin.y ) * DstPitch;

    const idx_t srcIndex = col + SrcOrigin.x + srcRowTerm;
    const idx_t dstIndex = col + DstOrigin.x + dstRowTerm;

    dst[dstIndex] = src[srcIndex];
}
/*
 * Copies four consecutive uint values per work-item between two pitched
 * 2D regions.
 *
 * For row y = get_global_id(1) the base offset of each buffer is
 *     Origin.x + ( y + Origin.y ) * Pitch
 * which is shifted right by two (divided by four, low two bits discarded)
 * before being added to the uint pointer -- presumably the origins and
 * pitches are expressed in bytes; confirm against the host-side dispatch.
 *
 * Along dimension 0, work-item x moves the uint4 that starts x * 4 uints
 * past that base (the addressing rule of vload4 / vstore4).
 */
__kernel void CopyBufferRectBytesMiddle2d(
    const __global uint* src,
    __global uint* dst,
    coord2_t SrcOrigin,
    coord2_t DstOrigin,
    idx_t SrcPitch,
    idx_t DstPitch )
{
    const idx_t chunk = get_global_id(0);
    const idx_t row = get_global_id(1);

    const idx_t srcBase = SrcOrigin.x + ( ( row + SrcOrigin.y ) * SrcPitch );
    const idx_t dstBase = DstOrigin.x + ( ( row + DstOrigin.y ) * DstPitch );

    // Convert the base offsets to uint units and move one uint4 per work-item.
    const uint4 quad = vload4( chunk, src + ( srcBase >> 2 ) );
    vstore4( quad, chunk, dst + ( dstBase >> 2 ) );
}
/*
 * Copies one char per work-item between two pitched 3D regions.
 *
 * Work-item (x, y, z) reads
 *     src[ x + SrcOrigin.x
 *            + ( y + SrcOrigin.y ) * SrcPitch.x
 *            + ( z + SrcOrigin.z ) * SrcPitch.y ]
 * and writes the value to the position in dst computed the same way from
 * DstOrigin and DstPitch. Pitch.x scales the y term and Pitch.y scales the
 * z term.
 *
 * The kernel performs no bounds checking on either offset.
 */
__kernel void CopyBufferRectBytes3d(
    __global const char* src,
    __global char* dst,
    coord4_t SrcOrigin,
    coord4_t DstOrigin,
    coord2_t SrcPitch,
    coord2_t DstPitch )
{
    const idx_t col = get_global_id(0);
    const idx_t row = get_global_id(1);
    const idx_t slice = get_global_id(2);

    // Source offset: x term, then pitch-scaled y and z terms.
    const idx_t srcRowTerm = ( row + SrcOrigin.y ) * SrcPitch.x;
    const idx_t srcSliceTerm = ( slice + SrcOrigin.z ) * SrcPitch.y;
    const idx_t srcIndex = col + SrcOrigin.x + srcRowTerm + srcSliceTerm;

    // Destination offset, built the same way.
    const idx_t dstRowTerm = ( row + DstOrigin.y ) * DstPitch.x;
    const idx_t dstSliceTerm = ( slice + DstOrigin.z ) * DstPitch.y;
    const idx_t dstIndex = col + DstOrigin.x + dstRowTerm + dstSliceTerm;

    dst[dstIndex] = src[srcIndex];
}
/*
 * Copies four consecutive uint values per work-item between two pitched
 * 3D regions.
 *
 * For y = get_global_id(1) and z = get_global_id(2) the base offset of each
 * buffer is
 *     Origin.x + ( y + Origin.y ) * Pitch.x + ( z + Origin.z ) * Pitch.y
 * which is shifted right by two (divided by four, low two bits discarded)
 * before being added to the uint pointer -- presumably the origins and
 * pitches are expressed in bytes; confirm against the host-side dispatch.
 *
 * Along dimension 0, work-item x moves the uint4 that starts x * 4 uints
 * past that base (the addressing rule of vload4 / vstore4).
 */
__kernel void CopyBufferRectBytesMiddle3d(
    const __global uint* src,
    __global uint* dst,
    coord4_t SrcOrigin,
    coord4_t DstOrigin,
    coord2_t SrcPitch,
    coord2_t DstPitch )
{
    const idx_t chunk = get_global_id(0);
    const idx_t row = get_global_id(1);
    const idx_t slice = get_global_id(2);

    // Source base: x origin plus pitch-scaled y and z terms.
    const idx_t srcRowTerm = ( row + SrcOrigin.y ) * SrcPitch.x;
    const idx_t srcSliceTerm = ( slice + SrcOrigin.z ) * SrcPitch.y;
    const idx_t srcBase = SrcOrigin.x + srcRowTerm + srcSliceTerm;

    // Destination base, built the same way.
    const idx_t dstRowTerm = ( row + DstOrigin.y ) * DstPitch.x;
    const idx_t dstSliceTerm = ( slice + DstOrigin.z ) * DstPitch.y;
    const idx_t dstBase = DstOrigin.x + dstRowTerm + dstSliceTerm;

    // Convert the base offsets to uint units and move one uint4 per work-item.
    const uint4 quad = vload4( chunk, src + ( srcBase >> 2 ) );
    vstore4( quad, chunk, dst + ( dstBase >> 2 ) );
}
)==="
|