• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // Copyright 2016 The SwiftShader Authors. All Rights Reserved.
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 //    http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 
15 #include "Constants.hpp"
16 
17 #include "System/Half.hpp"
18 #include "System/Math.hpp"
19 
20 #include <cstring>
21 
22 namespace sw {
23 
// Out-of-class definitions of the constexpr static data members of Constants.
// Before C++17 a namespace-scope definition like this is required whenever
// such a member is odr-used; since C++17 constexpr static data members are
// implicitly inline, which makes these redeclarations redundant but still valid.
// NOTE(review): the initializers presumably live with the in-class
// declarations in Constants.hpp — confirm there.
constexpr float Constants::VkSampleLocations4[][2];
constexpr float Constants::SampleLocationsX[4];
constexpr float Constants::SampleLocationsY[4];
27 
Constants()28 Constants::Constants()
29 {
30 	static const unsigned int transposeBit0[16] = {
31 		0x00000000,
32 		0x00000001,
33 		0x00000010,
34 		0x00000011,
35 		0x00000100,
36 		0x00000101,
37 		0x00000110,
38 		0x00000111,
39 		0x00001000,
40 		0x00001001,
41 		0x00001010,
42 		0x00001011,
43 		0x00001100,
44 		0x00001101,
45 		0x00001110,
46 		0x00001111
47 	};
48 
49 	static const unsigned int transposeBit1[16] = {
50 		0x00000000,
51 		0x00000002,
52 		0x00000020,
53 		0x00000022,
54 		0x00000200,
55 		0x00000202,
56 		0x00000220,
57 		0x00000222,
58 		0x00002000,
59 		0x00002002,
60 		0x00002020,
61 		0x00002022,
62 		0x00002200,
63 		0x00002202,
64 		0x00002220,
65 		0x00002222
66 	};
67 
68 	static const unsigned int transposeBit2[16] = {
69 		0x00000000,
70 		0x00000004,
71 		0x00000040,
72 		0x00000044,
73 		0x00000400,
74 		0x00000404,
75 		0x00000440,
76 		0x00000444,
77 		0x00004000,
78 		0x00004004,
79 		0x00004040,
80 		0x00004044,
81 		0x00004400,
82 		0x00004404,
83 		0x00004440,
84 		0x00004444
85 	};
86 
87 	memcpy(&this->transposeBit0, transposeBit0, sizeof(transposeBit0));
88 	memcpy(&this->transposeBit1, transposeBit1, sizeof(transposeBit1));
89 	memcpy(&this->transposeBit2, transposeBit2, sizeof(transposeBit2));
90 
91 	static const ushort4 cWeight[17] = {
92 		{ 0xFFFF, 0xFFFF, 0xFFFF, 0xFFFF },  // 0xFFFF / 1  = 0xFFFF
93 		{ 0xFFFF, 0xFFFF, 0xFFFF, 0xFFFF },  // 0xFFFF / 1  = 0xFFFF
94 		{ 0x8000, 0x8000, 0x8000, 0x8000 },  // 0xFFFF / 2  = 0x8000
95 		{ 0x5555, 0x5555, 0x5555, 0x5555 },  // 0xFFFF / 3  = 0x5555
96 		{ 0x4000, 0x4000, 0x4000, 0x4000 },  // 0xFFFF / 4  = 0x4000
97 		{ 0x3333, 0x3333, 0x3333, 0x3333 },  // 0xFFFF / 5  = 0x3333
98 		{ 0x2AAA, 0x2AAA, 0x2AAA, 0x2AAA },  // 0xFFFF / 6  = 0x2AAA
99 		{ 0x2492, 0x2492, 0x2492, 0x2492 },  // 0xFFFF / 7  = 0x2492
100 		{ 0x2000, 0x2000, 0x2000, 0x2000 },  // 0xFFFF / 8  = 0x2000
101 		{ 0x1C71, 0x1C71, 0x1C71, 0x1C71 },  // 0xFFFF / 9  = 0x1C71
102 		{ 0x1999, 0x1999, 0x1999, 0x1999 },  // 0xFFFF / 10 = 0x1999
103 		{ 0x1745, 0x1745, 0x1745, 0x1745 },  // 0xFFFF / 11 = 0x1745
104 		{ 0x1555, 0x1555, 0x1555, 0x1555 },  // 0xFFFF / 12 = 0x1555
105 		{ 0x13B1, 0x13B1, 0x13B1, 0x13B1 },  // 0xFFFF / 13 = 0x13B1
106 		{ 0x1249, 0x1249, 0x1249, 0x1249 },  // 0xFFFF / 14 = 0x1249
107 		{ 0x1111, 0x1111, 0x1111, 0x1111 },  // 0xFFFF / 15 = 0x1111
108 		{ 0x1000, 0x1000, 0x1000, 0x1000 },  // 0xFFFF / 16 = 0x1000
109 	};
110 
111 	static const float4 uvWeight[17] = {
112 		{ 1.0f / 1.0f, 1.0f / 1.0f, 1.0f / 1.0f, 1.0f / 1.0f },
113 		{ 1.0f / 1.0f, 1.0f / 1.0f, 1.0f / 1.0f, 1.0f / 1.0f },
114 		{ 1.0f / 2.0f, 1.0f / 2.0f, 1.0f / 2.0f, 1.0f / 2.0f },
115 		{ 1.0f / 3.0f, 1.0f / 3.0f, 1.0f / 3.0f, 1.0f / 3.0f },
116 		{ 1.0f / 4.0f, 1.0f / 4.0f, 1.0f / 4.0f, 1.0f / 4.0f },
117 		{ 1.0f / 5.0f, 1.0f / 5.0f, 1.0f / 5.0f, 1.0f / 5.0f },
118 		{ 1.0f / 6.0f, 1.0f / 6.0f, 1.0f / 6.0f, 1.0f / 6.0f },
119 		{ 1.0f / 7.0f, 1.0f / 7.0f, 1.0f / 7.0f, 1.0f / 7.0f },
120 		{ 1.0f / 8.0f, 1.0f / 8.0f, 1.0f / 8.0f, 1.0f / 8.0f },
121 		{ 1.0f / 9.0f, 1.0f / 9.0f, 1.0f / 9.0f, 1.0f / 9.0f },
122 		{ 1.0f / 10.0f, 1.0f / 10.0f, 1.0f / 10.0f, 1.0f / 10.0f },
123 		{ 1.0f / 11.0f, 1.0f / 11.0f, 1.0f / 11.0f, 1.0f / 11.0f },
124 		{ 1.0f / 12.0f, 1.0f / 12.0f, 1.0f / 12.0f, 1.0f / 12.0f },
125 		{ 1.0f / 13.0f, 1.0f / 13.0f, 1.0f / 13.0f, 1.0f / 13.0f },
126 		{ 1.0f / 14.0f, 1.0f / 14.0f, 1.0f / 14.0f, 1.0f / 14.0f },
127 		{ 1.0f / 15.0f, 1.0f / 15.0f, 1.0f / 15.0f, 1.0f / 15.0f },
128 		{ 1.0f / 16.0f, 1.0f / 16.0f, 1.0f / 16.0f, 1.0f / 16.0f },
129 	};
130 
131 	static const float4 uvStart[17] = {
132 		{ -0.0f / 2.0f, -0.0f / 2.0f, -0.0f / 2.0f, -0.0f / 2.0f },
133 		{ -0.0f / 2.0f, -0.0f / 2.0f, -0.0f / 2.0f, -0.0f / 2.0f },
134 		{ -1.0f / 4.0f, -1.0f / 4.0f, -1.0f / 4.0f, -1.0f / 4.0f },
135 		{ -2.0f / 6.0f, -2.0f / 6.0f, -2.0f / 6.0f, -2.0f / 6.0f },
136 		{ -3.0f / 8.0f, -3.0f / 8.0f, -3.0f / 8.0f, -3.0f / 8.0f },
137 		{ -4.0f / 10.0f, -4.0f / 10.0f, -4.0f / 10.0f, -4.0f / 10.0f },
138 		{ -5.0f / 12.0f, -5.0f / 12.0f, -5.0f / 12.0f, -5.0f / 12.0f },
139 		{ -6.0f / 14.0f, -6.0f / 14.0f, -6.0f / 14.0f, -6.0f / 14.0f },
140 		{ -7.0f / 16.0f, -7.0f / 16.0f, -7.0f / 16.0f, -7.0f / 16.0f },
141 		{ -8.0f / 18.0f, -8.0f / 18.0f, -8.0f / 18.0f, -8.0f / 18.0f },
142 		{ -9.0f / 20.0f, -9.0f / 20.0f, -9.0f / 20.0f, -9.0f / 20.0f },
143 		{ -10.0f / 22.0f, -10.0f / 22.0f, -10.0f / 22.0f, -10.0f / 22.0f },
144 		{ -11.0f / 24.0f, -11.0f / 24.0f, -11.0f / 24.0f, -11.0f / 24.0f },
145 		{ -12.0f / 26.0f, -12.0f / 26.0f, -12.0f / 26.0f, -12.0f / 26.0f },
146 		{ -13.0f / 28.0f, -13.0f / 28.0f, -13.0f / 28.0f, -13.0f / 28.0f },
147 		{ -14.0f / 30.0f, -14.0f / 30.0f, -14.0f / 30.0f, -14.0f / 30.0f },
148 		{ -15.0f / 32.0f, -15.0f / 32.0f, -15.0f / 32.0f, -15.0f / 32.0f },
149 	};
150 
151 	memcpy(&this->cWeight, cWeight, sizeof(cWeight));
152 	memcpy(&this->uvWeight, uvWeight, sizeof(uvWeight));
153 	memcpy(&this->uvStart, uvStart, sizeof(uvStart));
154 
155 	static const unsigned int occlusionCount[16] = { 0, 1, 1, 2, 1, 2, 2, 3, 1, 2, 2, 3, 2, 3, 3, 4 };
156 
157 	memcpy(&this->occlusionCount, &occlusionCount, sizeof(occlusionCount));
158 
159 	for(int i = 0; i < 16; i++)
160 	{
161 		maskB4Q[i][0] = -(i >> 0 & 1);
162 		maskB4Q[i][1] = -(i >> 1 & 1);
163 		maskB4Q[i][2] = -(i >> 2 & 1);
164 		maskB4Q[i][3] = -(i >> 3 & 1);
165 		maskB4Q[i][4] = -(i >> 0 & 1);
166 		maskB4Q[i][5] = -(i >> 1 & 1);
167 		maskB4Q[i][6] = -(i >> 2 & 1);
168 		maskB4Q[i][7] = -(i >> 3 & 1);
169 
170 		invMaskB4Q[i][0] = ~maskB4Q[i][0];
171 		invMaskB4Q[i][1] = ~maskB4Q[i][1];
172 		invMaskB4Q[i][2] = ~maskB4Q[i][2];
173 		invMaskB4Q[i][3] = ~maskB4Q[i][3];
174 		invMaskB4Q[i][4] = ~maskB4Q[i][4];
175 		invMaskB4Q[i][5] = ~maskB4Q[i][5];
176 		invMaskB4Q[i][6] = ~maskB4Q[i][6];
177 		invMaskB4Q[i][7] = ~maskB4Q[i][7];
178 
179 		maskW4Q[i][0] = -(i >> 0 & 1);
180 		maskW4Q[i][1] = -(i >> 1 & 1);
181 		maskW4Q[i][2] = -(i >> 2 & 1);
182 		maskW4Q[i][3] = -(i >> 3 & 1);
183 
184 		invMaskW4Q[i][0] = ~maskW4Q[i][0];
185 		invMaskW4Q[i][1] = ~maskW4Q[i][1];
186 		invMaskW4Q[i][2] = ~maskW4Q[i][2];
187 		invMaskW4Q[i][3] = ~maskW4Q[i][3];
188 
189 		maskD4X[i][0] = -(i >> 0 & 1);
190 		maskD4X[i][1] = -(i >> 1 & 1);
191 		maskD4X[i][2] = -(i >> 2 & 1);
192 		maskD4X[i][3] = -(i >> 3 & 1);
193 
194 		invMaskD4X[i][0] = ~maskD4X[i][0];
195 		invMaskD4X[i][1] = ~maskD4X[i][1];
196 		invMaskD4X[i][2] = ~maskD4X[i][2];
197 		invMaskD4X[i][3] = ~maskD4X[i][3];
198 
199 		maskQ0Q[i] = -(i >> 0 & 1);
200 		maskQ1Q[i] = -(i >> 1 & 1);
201 		maskQ2Q[i] = -(i >> 2 & 1);
202 		maskQ3Q[i] = -(i >> 3 & 1);
203 
204 		invMaskQ0Q[i] = ~maskQ0Q[i];
205 		invMaskQ1Q[i] = ~maskQ1Q[i];
206 		invMaskQ2Q[i] = ~maskQ2Q[i];
207 		invMaskQ3Q[i] = ~maskQ3Q[i];
208 
209 		maskX0X[i][0] = maskX0X[i][1] = maskX0X[i][2] = maskX0X[i][3] = -(i >> 0 & 1);
210 		maskX1X[i][0] = maskX1X[i][1] = maskX1X[i][2] = maskX1X[i][3] = -(i >> 1 & 1);
211 		maskX2X[i][0] = maskX2X[i][1] = maskX2X[i][2] = maskX2X[i][3] = -(i >> 2 & 1);
212 		maskX3X[i][0] = maskX3X[i][1] = maskX3X[i][2] = maskX3X[i][3] = -(i >> 3 & 1);
213 
214 		invMaskX0X[i][0] = invMaskX0X[i][1] = invMaskX0X[i][2] = invMaskX0X[i][3] = ~maskX0X[i][0];
215 		invMaskX1X[i][0] = invMaskX1X[i][1] = invMaskX1X[i][2] = invMaskX1X[i][3] = ~maskX1X[i][0];
216 		invMaskX2X[i][0] = invMaskX2X[i][1] = invMaskX2X[i][2] = invMaskX2X[i][3] = ~maskX2X[i][0];
217 		invMaskX3X[i][0] = invMaskX3X[i][1] = invMaskX3X[i][2] = invMaskX3X[i][3] = ~maskX3X[i][0];
218 
219 		maskD01Q[i][0] = -(i >> 0 & 1);
220 		maskD01Q[i][1] = -(i >> 1 & 1);
221 		maskD23Q[i][0] = -(i >> 2 & 1);
222 		maskD23Q[i][1] = -(i >> 3 & 1);
223 
224 		invMaskD01Q[i][0] = ~maskD01Q[i][0];
225 		invMaskD01Q[i][1] = ~maskD01Q[i][1];
226 		invMaskD23Q[i][0] = ~maskD23Q[i][0];
227 		invMaskD23Q[i][1] = ~maskD23Q[i][1];
228 
229 		maskQ01X[i][0] = -(i >> 0 & 1);
230 		maskQ01X[i][1] = -(i >> 1 & 1);
231 		maskQ23X[i][0] = -(i >> 2 & 1);
232 		maskQ23X[i][1] = -(i >> 3 & 1);
233 
234 		invMaskQ01X[i][0] = ~maskQ01X[i][0];
235 		invMaskQ01X[i][1] = ~maskQ01X[i][1];
236 		invMaskQ23X[i][0] = ~maskQ23X[i][0];
237 		invMaskQ23X[i][1] = ~maskQ23X[i][1];
238 	}
239 
240 	for(int i = 0; i < 8; i++)
241 	{
242 		mask565Q[i] = word4((i & 0x1 ? 0x001F : 0) | (i & 0x2 ? 0x07E0 : 0) | (i & 0x4 ? 0xF800 : 0));
243 		mask11X[i] = dword4((i & 0x1 ? 0x000007FFu : 0) | (i & 0x2 ? 0x003FF800u : 0) | (i & 0x4 ? 0xFFC00000u : 0));
244 	}
245 
246 	for(int i = 0; i < 16; i++)
247 	{
248 		mask5551Q[i] = word4((i & 0x1 ? 0x001F : 0) | (i & 0x2 ? 0x03E0 : 0) | (i & 0x4 ? 0x7C00 : 0) | (i & 8 ? 0x8000 : 0));
249 		maskr5g5b5a1Q[i] = word4((i & 0x1 ? 0x003E : 0) | (i & 0x2 ? 0x07C0 : 0) | (i & 0x4 ? 0xF800 : 0) | (i & 8 ? 0x0001 : 0));
250 		maskb5g5r5a1Q[i] = word4((i & 0x1 ? 0xF800 : 0) | (i & 0x2 ? 0x07C0 : 0) | (i & 0x4 ? 0x003E : 0) | (i & 8 ? 0x0001 : 0));
251 		mask4rgbaQ[i] = word4((i & 0x1 ? 0x00F0 : 0) | (i & 0x2 ? 0x0F00 : 0) | (i & 0x4 ? 0xF000 : 0) | (i & 8 ? 0x000F : 0));
252 		mask4bgraQ[i] = word4((i & 0x1 ? 0xF000 : 0) | (i & 0x2 ? 0x0F00 : 0) | (i & 0x4 ? 0x00F0 : 0) | (i & 8 ? 0x000F : 0));
253 		mask4abgrQ[i] = word4((i & 0x1 ? 0x0F00 : 0) | (i & 0x2 ? 0x00F0 : 0) | (i & 0x4 ? 0x000F : 0) | (i & 8 ? 0xF000 : 0));
254 		mask4argbQ[i] = word4((i & 0x1 ? 0x000F : 0) | (i & 0x2 ? 0x00F0 : 0) | (i & 0x4 ? 0x0F00 : 0) | (i & 8 ? 0xF000 : 0));
255 	}
256 
257 	for(int i = 0; i < 4; i++)
258 	{
259 		maskW01Q[i][0] = -(i >> 0 & 1);
260 		maskW01Q[i][1] = -(i >> 1 & 1);
261 		maskW01Q[i][2] = -(i >> 0 & 1);
262 		maskW01Q[i][3] = -(i >> 1 & 1);
263 
264 		maskD01X[i][0] = -(i >> 0 & 1);
265 		maskD01X[i][1] = -(i >> 1 & 1);
266 		maskD01X[i][2] = -(i >> 0 & 1);
267 		maskD01X[i][3] = -(i >> 1 & 1);
268 	}
269 
270 	for(int i = 0; i < 16; i++)
271 	{
272 		mask10Q[i][0] = mask10Q[i][1] =
273 		    (i & 0x1 ? 0x3FF : 0) |
274 		    (i & 0x2 ? 0xFFC00 : 0) |
275 		    (i & 0x4 ? 0x3FF00000 : 0) |
276 		    (i & 0x8 ? 0xC0000000 : 0);
277 	}
278 
279 	for(int i = 0; i < 256; i++)
280 	{
281 		sRGBtoLinearFF_FF00[i] = (unsigned short)(sRGBtoLinear((float)i / 0xFF) * 0xFF00 + 0.5f);
282 	}
283 
284 	for(int i = 0; i < 0x1000; i++)
285 	{
286 		linearToSRGB12_16[i] = (unsigned short)(clamp(linearToSRGB((float)i / 0x0FFF) * 0xFFFF + 0.5f, 0.0f, (float)0xFFFF));
287 		sRGBtoLinear12_16[i] = (unsigned short)(clamp(sRGBtoLinear((float)i / 0x0FFF) * 0xFFFF + 0.5f, 0.0f, (float)0xFFFF));
288 	}
289 
290 	const float4 X[4] = {
291 		float4(SampleLocationsX[0]),
292 		float4(SampleLocationsX[1]),
293 		float4(SampleLocationsX[2]),
294 		float4(SampleLocationsX[3]),
295 	};
296 
297 	const float4 Y[4] = {
298 		float4(SampleLocationsY[0]),
299 		float4(SampleLocationsY[1]),
300 		float4(SampleLocationsY[2]),
301 		float4(SampleLocationsY[3]),
302 	};
303 
304 	for(int q = 0; q < 4; q++)
305 	{
306 		for(int c = 0; c < 16; c++)
307 		{
308 			for(int i = 0; i < 4; i++)
309 			{
310 				sampleX[q][c][i] = c & (1 << i) ? X[q][0] : 0.0f;
311 				sampleY[q][c][i] = c & (1 << i) ? Y[q][0] : 0.0f;
312 				weight[c][i] = c & (1 << i) ? 1.0f : 0.0f;
313 			}
314 		}
315 	}
316 
317 	constexpr auto subPixB = vk::SUBPIXEL_PRECISION_BITS;
318 
319 	const int Xf[4] = { toFixedPoint(X[0][0], subPixB), toFixedPoint(X[1][0], subPixB), toFixedPoint(X[2][0], subPixB), toFixedPoint(X[3][0], subPixB) };
320 	const int Yf[4] = { toFixedPoint(Y[0][0], subPixB), toFixedPoint(Y[1][0], subPixB), toFixedPoint(Y[2][0], subPixB), toFixedPoint(Y[3][0], subPixB) };
321 
322 	memcpy(&this->Xf, &Xf, sizeof(Xf));
323 	memcpy(&this->Yf, &Yf, sizeof(Yf));
324 
325 	memcpy(&this->X, &X, sizeof(X));
326 	memcpy(&this->Y, &Y, sizeof(Y));
327 
328 	const dword maxX[16] = { 0x00000000, 0x00000001, 0x00000100, 0x00000101, 0x00010000, 0x00010001, 0x00010100, 0x00010101, 0x01000000, 0x01000001, 0x01000100, 0x01000101, 0x01010000, 0x01010001, 0x01010100, 0x01010101 };
329 	const dword maxY[16] = { 0x00000000, 0x00000002, 0x00000200, 0x00000202, 0x00020000, 0x00020002, 0x00020200, 0x00020202, 0x02000000, 0x02000002, 0x02000200, 0x02000202, 0x02020000, 0x02020002, 0x02020200, 0x02020202 };
330 	const dword maxZ[16] = { 0x00000000, 0x00000004, 0x00000400, 0x00000404, 0x00040000, 0x00040004, 0x00040400, 0x00040404, 0x04000000, 0x04000004, 0x04000400, 0x04000404, 0x04040000, 0x04040004, 0x04040400, 0x04040404 };
331 	const dword minX[16] = { 0x00000000, 0x00000008, 0x00000800, 0x00000808, 0x00080000, 0x00080008, 0x00080800, 0x00080808, 0x08000000, 0x08000008, 0x08000800, 0x08000808, 0x08080000, 0x08080008, 0x08080800, 0x08080808 };
332 	const dword minY[16] = { 0x00000000, 0x00000010, 0x00001000, 0x00001010, 0x00100000, 0x00100010, 0x00101000, 0x00101010, 0x10000000, 0x10000010, 0x10001000, 0x10001010, 0x10100000, 0x10100010, 0x10101000, 0x10101010 };
333 	const dword minZ[16] = { 0x00000000, 0x00000020, 0x00002000, 0x00002020, 0x00200000, 0x00200020, 0x00202000, 0x00202020, 0x20000000, 0x20000020, 0x20002000, 0x20002020, 0x20200000, 0x20200020, 0x20202000, 0x20202020 };
334 	const dword fini[16] = { 0x00000000, 0x00000080, 0x00008000, 0x00008080, 0x00800000, 0x00800080, 0x00808000, 0x00808080, 0x80000000, 0x80000080, 0x80008000, 0x80008080, 0x80800000, 0x80800080, 0x80808000, 0x80808080 };
335 
336 	memcpy(&this->maxX, &maxX, sizeof(maxX));
337 	memcpy(&this->maxY, &maxY, sizeof(maxY));
338 	memcpy(&this->maxZ, &maxZ, sizeof(maxZ));
339 	memcpy(&this->minX, &minX, sizeof(minX));
340 	memcpy(&this->minY, &minY, sizeof(minY));
341 	memcpy(&this->minZ, &minZ, sizeof(minZ));
342 	memcpy(&this->fini, &fini, sizeof(fini));
343 
344 	static const float4 unscaleByte = { 1.0f / 0xFF, 1.0f / 0xFF, 1.0f / 0xFF, 1.0f / 0xFF };
345 	static const float4 unscaleSByte = { 1.0f / 0x7F, 1.0f / 0x7F, 1.0f / 0x7F, 1.0f / 0x7F };
346 	static const float4 unscaleShort = { 1.0f / 0x7FFF, 1.0f / 0x7FFF, 1.0f / 0x7FFF, 1.0f / 0x7FFF };
347 	static const float4 unscaleUShort = { 1.0f / 0xFFFF, 1.0f / 0xFFFF, 1.0f / 0xFFFF, 1.0f / 0xFFFF };
348 
349 	// NOTE: Using "1.0f / 0x7FFFFFF" below results in a compiler error, e.g.:
350 	// error: implicit conversion from 'int' to 'float' changes value from 2147483646 to 2147483648
351 	static const float4 unscaleInt = { (float)(1.0 / 0x7FFFFFFF), (float)(1.0 / 0x7FFFFFFF), (float)(1.0 / 0x7FFFFFFF), (float)(1.0 / 0x7FFFFFFF) };
352 	static const float4 unscaleUInt = { (float)(1.0 / 0xFFFFFFFF), (float)(1.0 / 0xFFFFFFFF), (float)(1.0 / 0xFFFFFFFF), (float)(1.0 / 0xFFFFFFFF) };
353 
354 	static const float4 unscaleFixed = { 1.0f / 0x00010000, 1.0f / 0x00010000, 1.0f / 0x00010000, 1.0f / 0x00010000 };
355 
356 	memcpy(&this->unscaleByte, &unscaleByte, sizeof(unscaleByte));
357 	memcpy(&this->unscaleSByte, &unscaleSByte, sizeof(unscaleSByte));
358 	memcpy(&this->unscaleShort, &unscaleShort, sizeof(unscaleShort));
359 	memcpy(&this->unscaleUShort, &unscaleUShort, sizeof(unscaleUShort));
360 	memcpy(&this->unscaleInt, &unscaleInt, sizeof(unscaleInt));
361 	memcpy(&this->unscaleUInt, &unscaleUInt, sizeof(unscaleUInt));
362 	memcpy(&this->unscaleFixed, &unscaleFixed, sizeof(unscaleFixed));
363 
364 	for(int i = 0; i <= 0xFFFF; i++)
365 	{
366 		half2float[i] = (float)reinterpret_cast<half &>(i);
367 	}
368 }
369 
370 }  // namespace sw
371