File: GPUShrinkImageFilter.cl

package info (click to toggle)
elastix 5.2.0-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 42,480 kB
  • sloc: cpp: 68,403; lisp: 4,118; python: 1,013; xml: 182; sh: 177; makefile: 33
file content (107 lines) | stat: -rw-r--r-- 3,843 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
/*=========================================================================
 *
 *  Copyright UMC Utrecht and contributors
 *
 *  Licensed under the Apache License, Version 2.0 (the "License");
 *  you may not use this file except in compliance with the License.
 *  You may obtain a copy of the License at
 *
 *        http://www.apache.org/licenses/LICENSE-2.0.txt
 *
 *  Unless required by applicable law or agreed to in writing, software
 *  distributed under the License is distributed on an "AS IS" BASIS,
 *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *  See the License for the specific language governing permissions and
 *  limitations under the License.
 *
 *=========================================================================*/
//
// \author Denis P. Shamonin and Marius Staring. Division of Image Processing,
// Department of Radiology, Leiden, The Netherlands
//
// \note This work was funded by the Netherlands Organisation for
// Scientific Research (NWO NRG-2010.02 and NWO 639.021.124).
//
// OpenCL implementation of itk::ShrinkImageFilter

//------------------------------------------------------------------------------
// Apple OpenCL 1.0 support function
bool is_valid_3d( const uint3 index, const uint3 size )
{
  /* NOTE: More than three-level nested conditional statements (e.g.,
  if A && B && C..) invalidates command queue during kernel
  execution on Apple OpenCL 1.0 (such Macbook Pro with NVIDIA 9600M
  GT). Therefore, we flattened conditional statements. */
  if ( index.x >= size.x ) { return false; }
  if ( index.y >= size.y ) { return false; }
  if ( index.z >= size.z ) { return false; }
  return true;
}

//------------------------------------------------------------------------------
OUTPIXELTYPE Functor( const INPIXELTYPE in )
{
  OUTPIXELTYPE out = (OUTPIXELTYPE)in;

  return out;
}

//------------------------------------------------------------------------------
#ifdef DIM_1
__kernel void ShrinkImageFilter( __global const INPIXELTYPE *in,
  __global OUTPIXELTYPE *out,
  uint in_image_size, uint out_image_size,
  uint offset, uint shrinkfactors )
{
  uint index = get_global_id( 0 );

  if ( index < out_image_size )
  {
    uint input_index = mad24( index, shrinkfactors, offset );
    uint out_gidx = index;
    uint in_gidx = input_index;
    out[out_gidx] = Functor( in[in_gidx] );
  }
}

#endif

//------------------------------------------------------------------------------
#ifdef DIM_2
__kernel void ShrinkImageFilter( __global const INPIXELTYPE *in,
  __global OUTPIXELTYPE *out,
  uint2 image_size_in, uint2 image_size_out,
  uint2 offset, uint2 shrinkfactors )
{
  uint2 index_out = (uint2)( get_global_id( 0 ), get_global_id( 1 ) );

  if ( index_out.x < image_size_out.x && index_out.y < image_size_out.y )
  {
    uint2 index_in = mad24( index_out, shrinkfactors, offset );
    uint  gidx_in = mad24( image_size_in.x, index_in.y, index_in.x );
    uint  gidx_out = mad24( image_size_out.x, index_out.y, index_out.x );
    out[gidx_out] = Functor( in[gidx_in] );
  }
}

#endif

//------------------------------------------------------------------------------
#ifdef DIM_3
__kernel void ShrinkImageFilter( __global const INPIXELTYPE *in,
  __global OUTPIXELTYPE *out,
  uint3 image_size_in, uint3 image_size_out,
  uint3 offset, uint3 shrinkfactors )
{
  uint3 index_out = (uint3)( get_global_id( 0 ), get_global_id( 1 ), get_global_id( 2 ) );

  if ( is_valid_3d( index_out, image_size_out ) )
  {
    uint3 index_in = mad24( index_out, shrinkfactors, offset );
    uint  gidx_in = mad24( image_size_in.x, mad24( index_in.z, image_size_in.y, index_in.y ), index_in.x );
    uint  gidx_out = mad24( image_size_out.x, mad24( index_out.z, image_size_out.y, index_out.y ), index_out.x );
    out[gidx_out] = Functor( in[gidx_in] );
  }
}

#endif