File: hlsl.wavereduction.comp

package info (click to toggle)
glslang 16.2.0-1
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 51,720 kB
  • sloc: cpp: 92,305; yacc: 4,320; sh: 603; python: 305; ansic: 94; javascript: 74; makefile: 17
file content (125 lines) | stat: -rw-r--r-- 5,036 bytes parent folder | download | duplicates (16)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
// Element type of the `data` buffer: one 4-component vector for each of the
// four scalar types (uint, int, float, double) that CSMain passes through
// the wave intrinsics.
struct Types
{
	uint4 u;    // unsigned integer operand
	int4 i;     // signed integer operand
	float4 f;   // single-precision floating-point operand
	double4 d;  // double-precision floating-point operand
};

// Read/write structured buffer of Types elements. CSMain uses it as both the
// source and the destination of every wave operation. No explicit register
// binding is given here.
RWStructuredBuffer<Types> data;

// Compute entry point that feeds the fields of data[dti.x] through the HLSL
// wave reduction intrinsics and stores each result back into the field (or
// swizzle) it was read from.
//
// For every intrinsic/type pair the same four operand widths are used, in
// this order: the full 4-component vector, .x, .xy, .xyz.
//   - WaveActiveSum / Product / Min / Max : uint, int, float, double
//   - WaveActiveBitAnd / BitOr / BitXor   : uint, int only
//   - WaveActiveCountBits                 : a single boolean expression
//
// Statements are order-dependent: each one reads the value written by the
// previous statements on the same field.
//
// Parameters:
//   dti - SV_DispatchThreadID of the invocation; only dti.x is used, as the
//         index into `data`.
//
// NOTE(review): the thread group is 32x16x1 but only dti.x selects the
// element, so invocations that differ only in dti.y address the same
// data[] entry. Presumably acceptable because this looks like a
// compile-only test input for glslang - confirm before reusing the shader
// for anything that is actually dispatched.
[numthreads(32, 16, 1)]
void CSMain(uint3 dti : SV_DispatchThreadID)
{
	// ---- WaveActiveSum: uint, int, float, double ----
	data[dti.x].u = WaveActiveSum(data[dti.x].u);
	data[dti.x].u.x = WaveActiveSum(data[dti.x].u.x);
	data[dti.x].u.xy = WaveActiveSum(data[dti.x].u.xy);
	data[dti.x].u.xyz = WaveActiveSum(data[dti.x].u.xyz);

	data[dti.x].i = WaveActiveSum(data[dti.x].i);
	data[dti.x].i.x = WaveActiveSum(data[dti.x].i.x);
	data[dti.x].i.xy = WaveActiveSum(data[dti.x].i.xy);
	data[dti.x].i.xyz = WaveActiveSum(data[dti.x].i.xyz);

	data[dti.x].f = WaveActiveSum(data[dti.x].f);
	data[dti.x].f.x = WaveActiveSum(data[dti.x].f.x);
	data[dti.x].f.xy = WaveActiveSum(data[dti.x].f.xy);
	data[dti.x].f.xyz = WaveActiveSum(data[dti.x].f.xyz);

	data[dti.x].d = WaveActiveSum(data[dti.x].d);
	data[dti.x].d.x = WaveActiveSum(data[dti.x].d.x);
	data[dti.x].d.xy = WaveActiveSum(data[dti.x].d.xy);
	data[dti.x].d.xyz = WaveActiveSum(data[dti.x].d.xyz);

	// ---- WaveActiveProduct: uint, int, float, double ----
	data[dti.x].u = WaveActiveProduct(data[dti.x].u);
	data[dti.x].u.x = WaveActiveProduct(data[dti.x].u.x);
	data[dti.x].u.xy = WaveActiveProduct(data[dti.x].u.xy);
	data[dti.x].u.xyz = WaveActiveProduct(data[dti.x].u.xyz);

	data[dti.x].i = WaveActiveProduct(data[dti.x].i);
	data[dti.x].i.x = WaveActiveProduct(data[dti.x].i.x);
	data[dti.x].i.xy = WaveActiveProduct(data[dti.x].i.xy);
	data[dti.x].i.xyz = WaveActiveProduct(data[dti.x].i.xyz);

	data[dti.x].f = WaveActiveProduct(data[dti.x].f);
	data[dti.x].f.x = WaveActiveProduct(data[dti.x].f.x);
	data[dti.x].f.xy = WaveActiveProduct(data[dti.x].f.xy);
	data[dti.x].f.xyz = WaveActiveProduct(data[dti.x].f.xyz);

	data[dti.x].d = WaveActiveProduct(data[dti.x].d);
	data[dti.x].d.x = WaveActiveProduct(data[dti.x].d.x);
	data[dti.x].d.xy = WaveActiveProduct(data[dti.x].d.xy);
	data[dti.x].d.xyz = WaveActiveProduct(data[dti.x].d.xyz);

	// ---- WaveActiveMin: uint, int, float, double ----
	data[dti.x].u = WaveActiveMin(data[dti.x].u);
	data[dti.x].u.x = WaveActiveMin(data[dti.x].u.x);
	data[dti.x].u.xy = WaveActiveMin(data[dti.x].u.xy);
	data[dti.x].u.xyz = WaveActiveMin(data[dti.x].u.xyz);

	data[dti.x].i = WaveActiveMin(data[dti.x].i);
	data[dti.x].i.x = WaveActiveMin(data[dti.x].i.x);
	data[dti.x].i.xy = WaveActiveMin(data[dti.x].i.xy);
	data[dti.x].i.xyz = WaveActiveMin(data[dti.x].i.xyz);

	data[dti.x].f = WaveActiveMin(data[dti.x].f);
	data[dti.x].f.x = WaveActiveMin(data[dti.x].f.x);
	data[dti.x].f.xy = WaveActiveMin(data[dti.x].f.xy);
	data[dti.x].f.xyz = WaveActiveMin(data[dti.x].f.xyz);

	data[dti.x].d = WaveActiveMin(data[dti.x].d);
	data[dti.x].d.x = WaveActiveMin(data[dti.x].d.x);
	data[dti.x].d.xy = WaveActiveMin(data[dti.x].d.xy);
	data[dti.x].d.xyz = WaveActiveMin(data[dti.x].d.xyz);

	// ---- WaveActiveMax: uint, int, float, double ----
	data[dti.x].u = WaveActiveMax(data[dti.x].u);
	data[dti.x].u.x = WaveActiveMax(data[dti.x].u.x);
	data[dti.x].u.xy = WaveActiveMax(data[dti.x].u.xy);
	data[dti.x].u.xyz = WaveActiveMax(data[dti.x].u.xyz);

	data[dti.x].i = WaveActiveMax(data[dti.x].i);
	data[dti.x].i.x = WaveActiveMax(data[dti.x].i.x);
	data[dti.x].i.xy = WaveActiveMax(data[dti.x].i.xy);
	data[dti.x].i.xyz = WaveActiveMax(data[dti.x].i.xyz);

	data[dti.x].f = WaveActiveMax(data[dti.x].f);
	data[dti.x].f.x = WaveActiveMax(data[dti.x].f.x);
	data[dti.x].f.xy = WaveActiveMax(data[dti.x].f.xy);
	data[dti.x].f.xyz = WaveActiveMax(data[dti.x].f.xyz);

	data[dti.x].d = WaveActiveMax(data[dti.x].d);
	data[dti.x].d.x = WaveActiveMax(data[dti.x].d.x);
	data[dti.x].d.xy = WaveActiveMax(data[dti.x].d.xy);
	data[dti.x].d.xyz = WaveActiveMax(data[dti.x].d.xyz);

	// ---- WaveActiveBitAnd: integer operands only (uint, int) ----
	data[dti.x].u = WaveActiveBitAnd(data[dti.x].u);
	data[dti.x].u.x = WaveActiveBitAnd(data[dti.x].u.x);
	data[dti.x].u.xy = WaveActiveBitAnd(data[dti.x].u.xy);
	data[dti.x].u.xyz = WaveActiveBitAnd(data[dti.x].u.xyz);

	data[dti.x].i = WaveActiveBitAnd(data[dti.x].i);
	data[dti.x].i.x = WaveActiveBitAnd(data[dti.x].i.x);
	data[dti.x].i.xy = WaveActiveBitAnd(data[dti.x].i.xy);
	data[dti.x].i.xyz = WaveActiveBitAnd(data[dti.x].i.xyz);

	// ---- WaveActiveBitOr: integer operands only (uint, int) ----
	data[dti.x].u = WaveActiveBitOr(data[dti.x].u);
	data[dti.x].u.x = WaveActiveBitOr(data[dti.x].u.x);
	data[dti.x].u.xy = WaveActiveBitOr(data[dti.x].u.xy);
	data[dti.x].u.xyz = WaveActiveBitOr(data[dti.x].u.xyz);

	data[dti.x].i = WaveActiveBitOr(data[dti.x].i);
	data[dti.x].i.x = WaveActiveBitOr(data[dti.x].i.x);
	data[dti.x].i.xy = WaveActiveBitOr(data[dti.x].i.xy);
	data[dti.x].i.xyz = WaveActiveBitOr(data[dti.x].i.xyz);

	// ---- WaveActiveBitXor: integer operands only (uint, int) ----
	data[dti.x].u = WaveActiveBitXor(data[dti.x].u);
	data[dti.x].u.x = WaveActiveBitXor(data[dti.x].u.x);
	data[dti.x].u.xy = WaveActiveBitXor(data[dti.x].u.xy);
	data[dti.x].u.xyz = WaveActiveBitXor(data[dti.x].u.xyz);

	data[dti.x].i = WaveActiveBitXor(data[dti.x].i);
	data[dti.x].i.x = WaveActiveBitXor(data[dti.x].i.x);
	data[dti.x].i.xy = WaveActiveBitXor(data[dti.x].i.xy);
	data[dti.x].i.xyz = WaveActiveBitXor(data[dti.x].i.xyz);

	// ---- WaveActiveCountBits: the argument is the boolean comparison
	// (u.x == 0), and the resulting count is written back into u.x ----
	data[dti.x].u.x = WaveActiveCountBits(data[dti.x].u.x == 0);
}