1 /*-------------------------------------------------------------------------
2 * drawElements Quality Program OpenGL ES 3.0 Module
3 * -------------------------------------------------
4 *
5 * Copyright 2014 The Android Open Source Project
6 *
7 * Licensed under the Apache License, Version 2.0 (the "License");
8 * you may not use this file except in compliance with the License.
9 * You may obtain a copy of the License at
10 *
11 * http://www.apache.org/licenses/LICENSE-2.0
12 *
13 * Unless required by applicable law or agreed to in writing, software
14 * distributed under the License is distributed on an "AS IS" BASIS,
15 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
16 * See the License for the specific language governing permissions and
17 * limitations under the License.
18 *
19 *//*!
20 * \file
21 * \brief Depth buffer performance tests.
22 *//*--------------------------------------------------------------------*/
23
24 #include "es3pDepthTests.hpp"
25
26 #include "glsCalibration.hpp"
27
28 #include "gluShaderProgram.hpp"
29 #include "gluObjectWrapper.hpp"
30 #include "gluPixelTransfer.hpp"
31
32 #include "glwFunctions.hpp"
33 #include "glwEnums.hpp"
34
35 #include "tcuTestLog.hpp"
36 #include "tcuStringTemplate.hpp"
37 #include "tcuCPUWarmup.hpp"
38 #include "tcuCommandLine.hpp"
39 #include "tcuResultCollector.hpp"
40
41 #include "deClock.h"
42 #include "deString.h"
43 #include "deMath.h"
44 #include "deStringUtil.hpp"
45 #include "deRandom.hpp"
46 #include "deUniquePtr.hpp"
47
48 #include <vector>
49 #include <algorithm>
50
51 namespace deqp
52 {
53 namespace gles3
54 {
55 namespace Performance
56 {
57 namespace
58 {
59 using namespace glw;
60 using de::MovePtr;
61 using tcu::TestContext;
62 using tcu::TestLog;
63 using tcu::Vec4;
64 using tcu::Vec3;
65 using tcu::Vec2;
66 using glu::RenderContext;
67 using glu::ProgramSources;
68 using glu::ShaderSource;
69 using std::vector;
70 using std::string;
71 using std::map;
72
73 struct Sample
74 {
75 deInt64 nullTime;
76 deInt64 baseTime;
77 deInt64 testTime;
78 int order;
79 int workload;
80 };
81
82 struct SampleParams
83 {
84 int step;
85 int measurement;
86
SampleParamsdeqp::gles3::Performance::__anon48f87f350111::SampleParams87 SampleParams(int step_, int measurement_) : step(step_), measurement(measurement_) {}
88 };
89
90 typedef vector<float> Geometry;
91
92 struct ObjectData
93 {
94 ProgramSources shader;
95 Geometry geometry;
96
ObjectDatadeqp::gles3::Performance::__anon48f87f350111::ObjectData97 ObjectData (const ProgramSources& shader_, const Geometry& geometry_) : shader(shader_), geometry(geometry_) {}
98 };
99
100 class RenderData
101 {
102 public:
103 RenderData (const ObjectData& object, const glu::RenderContext& renderCtx, TestLog& log);
~RenderData(void)104 ~RenderData (void) {}
105
106 const glu::ShaderProgram m_program;
107 const glu::VertexArray m_vao;
108 const glu::Buffer m_vbo;
109
110 const int m_numVertices;
111 };
112
RenderData(const ObjectData & object,const glu::RenderContext & renderCtx,TestLog & log)113 RenderData::RenderData (const ObjectData& object, const glu::RenderContext& renderCtx, TestLog& log)
114 : m_program (renderCtx, object.shader)
115 , m_vao (renderCtx.getFunctions())
116 , m_vbo (renderCtx.getFunctions())
117 , m_numVertices (int(object.geometry.size())/4)
118 {
119 const glw::Functions& gl = renderCtx.getFunctions();
120
121 if (!m_program.isOk())
122 log << m_program;
123
124 gl.bindBuffer(GL_ARRAY_BUFFER, *m_vbo);
125 gl.bufferData(GL_ARRAY_BUFFER, object.geometry.size() * sizeof(float), &object.geometry[0], GL_STATIC_DRAW);
126 gl.bindAttribLocation(m_program.getProgram(), 0, "a_position");
127
128 gl.bindVertexArray(*m_vao);
129 gl.vertexAttribPointer(0, 4, GL_FLOAT, GL_FALSE, 0, DE_NULL);
130 gl.enableVertexAttribArray(0);
131 gl.bindVertexArray(0);
132 }
133
134 namespace Utils
135 {
getFullscreenQuad(float depth)136 vector<float> getFullscreenQuad (float depth)
137 {
138 const float data[] =
139 {
140 +1.0f, +1.0f, depth, 0.0f, // .w is gl_VertexId%3 since Nexus 4&5 can't handle that on their own
141 +1.0f, -1.0f, depth, 1.0f,
142 -1.0f, -1.0f, depth, 2.0f,
143 -1.0f, -1.0f, depth, 0.0f,
144 -1.0f, +1.0f, depth, 1.0f,
145 +1.0f, +1.0f, depth, 2.0f,
146 };
147
148 return vector<float>(DE_ARRAY_BEGIN(data), DE_ARRAY_END(data));
149 }
150
getFullscreenQuadWithGradient(float depth0,float depth1)151 vector<float> getFullscreenQuadWithGradient (float depth0, float depth1)
152 {
153 const float data[] =
154 {
155 +1.0f, +1.0f, depth0, 0.0f,
156 +1.0f, -1.0f, depth0, 1.0f,
157 -1.0f, -1.0f, depth1, 2.0f,
158 -1.0f, -1.0f, depth1, 0.0f,
159 -1.0f, +1.0f, depth1, 1.0f,
160 +1.0f, +1.0f, depth0, 2.0f,
161 };
162
163 return vector<float>(DE_ARRAY_BEGIN(data), DE_ARRAY_END(data));
164 }
165
getPartScreenQuad(float coverage,float depth)166 vector<float> getPartScreenQuad (float coverage, float depth)
167 {
168 const float xMax = -1.0f + 2.0f*coverage;
169 const float data[] =
170 {
171 xMax, +1.0f, depth, 0.0f,
172 xMax, -1.0f, depth, 1.0f,
173 -1.0f, -1.0f, depth, 2.0f,
174 -1.0f, -1.0f, depth, 0.0f,
175 -1.0f, +1.0f, depth, 1.0f,
176 xMax, +1.0f, depth, 2.0f,
177 };
178
179 return vector<float>(DE_ARRAY_BEGIN(data), DE_ARRAY_END(data));
180 }
181
182 // Axis aligned grid. Depth of vertices is baseDepth +/- depthNoise
getFullScreenGrid(int resolution,deUint32 seed,float baseDepth,float depthNoise,float xyNoise)183 vector<float> getFullScreenGrid (int resolution, deUint32 seed, float baseDepth, float depthNoise, float xyNoise)
184 {
185 const int gridsize = resolution+1;
186 vector<Vec3> vertices (gridsize*gridsize);
187 vector<float> retval;
188 de::Random rng (seed);
189
190 for (int y = 0; y < gridsize; y++)
191 for (int x = 0; x < gridsize; x++)
192 {
193 const bool isEdge = x == 0 || y == 0 || x == resolution || y == resolution;
194 const float x_ = float(x)/float(resolution)*2.0f - 1.0f + (isEdge ? 0.0f : rng.getFloat(-xyNoise, +xyNoise));
195 const float y_ = float(y)/float(resolution)*2.0f - 1.0f + (isEdge ? 0.0f : rng.getFloat(-xyNoise, +xyNoise));
196 const float z_ = baseDepth + rng.getFloat(-depthNoise, +depthNoise);
197
198 vertices[y*gridsize + x] = Vec3(x_, y_, z_);
199 }
200
201 retval.reserve(resolution*resolution*6);
202
203 for (int y = 0; y < resolution; y++)
204 for (int x = 0; x < resolution; x++)
205 {
206 const Vec3& p0 = vertices[(y+0)*gridsize + (x+0)];
207 const Vec3& p1 = vertices[(y+0)*gridsize + (x+1)];
208 const Vec3& p2 = vertices[(y+1)*gridsize + (x+0)];
209 const Vec3& p3 = vertices[(y+1)*gridsize + (x+1)];
210
211 const float temp[6*4] =
212 {
213 p0.x(), p0.y(), p0.z(), 0.0f,
214 p2.x(), p2.y(), p2.z(), 1.0f,
215 p1.x(), p1.y(), p1.z(), 2.0f,
216
217 p3.x(), p3.y(), p3.z(), 0.0f,
218 p1.x(), p1.y(), p1.z(), 1.0f,
219 p2.x(), p2.y(), p2.z(), 2.0f,
220 };
221
222 retval.insert(retval.end(), DE_ARRAY_BEGIN(temp), DE_ARRAY_END(temp));
223 }
224
225 return retval;
226 }
227
228 // Outputs barycentric coordinates as v_bcoords. Otherwise a passthrough shader
getBaseVertexShader(void)229 string getBaseVertexShader (void)
230 {
231 return "#version 300 es\n"
232 "in highp vec4 a_position;\n"
233 "out mediump vec3 v_bcoords;\n"
234 "void main()\n"
235 "{\n"
236 " v_bcoords = vec3(0, 0, 0);\n"
237 " v_bcoords[int(a_position.w)] = 1.0;\n"
238 " gl_Position = vec4(a_position.xyz, 1.0);\n"
239 "}\n";
240 }
241
242 // Adds noise to coordinates based on InstanceID Outputs barycentric coordinates as v_bcoords
getInstanceNoiseVertexShader(void)243 string getInstanceNoiseVertexShader (void)
244 {
245 return "#version 300 es\n"
246 "in highp vec4 a_position;\n"
247 "out mediump vec3 v_bcoords;\n"
248 "void main()\n"
249 "{\n"
250 " v_bcoords = vec3(0, 0, 0);\n"
251 " v_bcoords[int(a_position.w)] = 1.0;\n"
252 " vec3 noise = vec3(sin(float(gl_InstanceID)*1.05), sin(float(gl_InstanceID)*1.23), sin(float(gl_InstanceID)*1.71));\n"
253 " gl_Position = vec4(a_position.xyz + noise * 0.005, 1.0);\n"
254 "}\n";
255 }
256
257 // Renders green triangles with edges highlighted. Exact shade depends on depth.
getDepthAsGreenFragmentShader(void)258 string getDepthAsGreenFragmentShader (void)
259 {
260 return "#version 300 es\n"
261 "in mediump vec3 v_bcoords;\n"
262 "out mediump vec4 fragColor;\n"
263 "void main()\n"
264 "{\n"
265 " mediump float d = gl_FragCoord.z;\n"
266 " if (v_bcoords.x < 0.02 || v_bcoords.y < 0.02 || v_bcoords.z < 0.02)\n"
267 " fragColor = vec4(d,1,d,1);\n"
268 " else\n"
269 " fragColor = vec4(0,d,0,1);\n"
270 "}\n";
271 }
272
273 // Renders green triangles with edges highlighted. Exact shade depends on depth.
getDepthAsRedFragmentShader(void)274 string getDepthAsRedFragmentShader (void)
275 {
276 return "#version 300 es\n"
277 "in mediump vec3 v_bcoords;\n"
278 "out mediump vec4 fragColor;\n"
279 "void main()\n"
280 "{\n"
281 " mediump float d = gl_FragCoord.z;\n"
282 " if (v_bcoords.x < 0.02 || v_bcoords.y < 0.02 || v_bcoords.z < 0.02)\n"
283 " fragColor = vec4(1,d,d,1);\n"
284 " else\n"
285 " fragColor = vec4(d,0,0,1);\n"
286 "}\n";
287 }
288
289 // Basic time waster. Renders red triangles with edges highlighted. Exact shade depends on depth.
getArithmeticWorkloadFragmentShader(void)290 string getArithmeticWorkloadFragmentShader (void)
291 {
292
293 return "#version 300 es\n"
294 "in mediump vec3 v_bcoords;\n"
295 "out mediump vec4 fragColor;\n"
296 "uniform mediump int u_iterations;\n"
297 "void main()\n"
298 "{\n"
299 " mediump float d = gl_FragCoord.z;\n"
300 " for (int i = 0; i<u_iterations; i++)\n"
301 // cos(a)^2 + sin(a)^2 == 1. since d is in range [0,1] this will lose a few ULP's of precision per iteration but should not significantly change the value of d without extreme iteration counts
302 " d = d*sin(d)*sin(d) + d*cos(d)*cos(d);\n"
303 " if (v_bcoords.x < 0.02 || v_bcoords.y < 0.02 || v_bcoords.z < 0.02)\n"
304 " fragColor = vec4(1,d,d,1);\n"
305 " else\n"
306 " fragColor = vec4(d,0,0,1);\n"
307 "}\n";
308 }
309
310 // Arithmetic workload shader but contains discard
getArithmeticWorkloadDiscardFragmentShader(void)311 string getArithmeticWorkloadDiscardFragmentShader (void)
312 {
313 return "#version 300 es\n"
314 "in mediump vec3 v_bcoords;\n"
315 "out mediump vec4 fragColor;\n"
316 "uniform mediump int u_iterations;\n"
317 "void main()\n"
318 "{\n"
319 " mediump float d = gl_FragCoord.z;\n"
320 " for (int i = 0; i<u_iterations; i++)\n"
321 " d = d*sin(d)*sin(d) + d*cos(d)*cos(d);\n"
322 " if (d < 0.5) discard;\n"
323 " if (v_bcoords.x < 0.02 || v_bcoords.y < 0.02 || v_bcoords.z < 0.02)\n"
324 " fragColor = vec4(1,d,d,1);\n"
325 " else\n"
326 " fragColor = vec4(d,0,0,1);\n"
327 "}\n";
328 }
329
330 // Texture fetch based time waster. Renders red triangles with edges highlighted. Exact shade depends on depth.
getTextureWorkloadFragmentShader(void)331 string getTextureWorkloadFragmentShader (void)
332 {
333 return "#version 300 es\n"
334 "in mediump vec3 v_bcoords;\n"
335 "out mediump vec4 fragColor;\n"
336 "uniform mediump int u_iterations;\n"
337 "uniform sampler2D u_texture;\n"
338 "void main()\n"
339 "{\n"
340 " mediump float d = gl_FragCoord.z;\n"
341 " for (int i = 0; i<u_iterations; i++)\n"
342 " d *= texture(u_texture, (gl_FragCoord.xy+vec2(i))/512.0).r;\n" // Texture is expected to be fully white
343 " if (v_bcoords.x < 0.02 || v_bcoords.y < 0.02 || v_bcoords.z < 0.02)\n"
344 " fragColor = vec4(1,1,1,1);\n"
345 " else\n"
346 " fragColor = vec4(d,0,0,1);\n"
347 "}\n";
348 }
349
350 // Discard fragments in a grid pattern
getGridDiscardFragmentShader(int gridsize)351 string getGridDiscardFragmentShader (int gridsize)
352 {
353 const string fragSrc = "#version 300 es\n"
354 "in mediump vec3 v_bcoords;\n"
355 "out mediump vec4 fragColor;\n"
356 "void main()\n"
357 "{\n"
358 " mediump float d = gl_FragCoord.z;\n"
359 " if ((int(gl_FragCoord.x)/${GRIDRENDER_SIZE} + int(gl_FragCoord.y)/${GRIDRENDER_SIZE})%2 == 0)\n"
360 " discard;\n"
361 " if (v_bcoords.x < 0.02 || v_bcoords.y < 0.02 || v_bcoords.z < 0.02)\n"
362 " fragColor = vec4(d,1,d,1);\n"
363 " else\n"
364 " fragColor = vec4(0,d,0,1);\n"
365 "}\n";
366 map<string, string> params;
367
368 params["GRIDRENDER_SIZE"] = de::toString(gridsize);
369
370 return tcu::StringTemplate(fragSrc).specialize(params);
371 }
372
373 // A static increment to frag depth
getStaticFragDepthFragmentShader(void)374 string getStaticFragDepthFragmentShader (void)
375 {
376 return "#version 300 es\n"
377 "in mediump vec3 v_bcoords;\n"
378 "out mediump vec4 fragColor;\n"
379 "void main()\n"
380 "{\n"
381 " mediump float d = gl_FragCoord.z;\n"
382 " gl_FragDepth = gl_FragCoord.z + 0.1;\n"
383 " if (v_bcoords.x < 0.02 || v_bcoords.y < 0.02 || v_bcoords.z < 0.02)\n"
384 " fragColor = vec4(d,1,d,1);\n"
385 " else\n"
386 " fragColor = vec4(0,d,0,1);\n"
387 "}\n";
388 }
389
390 // A trivial dynamic change to frag depth
getDynamicFragDepthFragmentShader(void)391 string getDynamicFragDepthFragmentShader (void)
392 {
393 return "#version 300 es\n"
394 "in mediump vec3 v_bcoords;\n"
395 "out mediump vec4 fragColor;\n"
396 "void main()\n"
397 "{\n"
398 " mediump float d = gl_FragCoord.z;\n"
399 " gl_FragDepth = gl_FragCoord.z + (v_bcoords.x + v_bcoords.y + v_bcoords.z)*0.05;\n" // Sum of v_bcoords components is allways 1
400 " if (v_bcoords.x < 0.02 || v_bcoords.y < 0.02 || v_bcoords.z < 0.02)\n"
401 " fragColor = vec4(d,1,d,1);\n"
402 " else\n"
403 " fragColor = vec4(0,d,0,1);\n"
404 "}\n";
405 }
406
407 // A static increment to frag depth
getStaticFragDepthArithmeticWorkloadFragmentShader(void)408 string getStaticFragDepthArithmeticWorkloadFragmentShader (void)
409 {
410 return "#version 300 es\n"
411 "in mediump vec3 v_bcoords;\n"
412 "out mediump vec4 fragColor;\n"
413 "uniform mediump int u_iterations;\n"
414 "void main()\n"
415 "{\n"
416 " mediump float d = gl_FragCoord.z;\n"
417 " gl_FragDepth = gl_FragCoord.z + 0.1;\n"
418 " for (int i = 0; i<u_iterations; i++)\n"
419 " d = d*sin(d)*sin(d) + d*cos(d)*cos(d);\n"
420 " if (v_bcoords.x < 0.02 || v_bcoords.y < 0.02 || v_bcoords.z < 0.02)\n"
421 " fragColor = vec4(1,d,d,1);\n"
422 " else\n"
423 " fragColor = vec4(d,0,0,1);\n"
424 "}\n";
425 }
426
427 // A trivial dynamic change to frag depth
getDynamicFragDepthArithmeticWorkloadFragmentShader(void)428 string getDynamicFragDepthArithmeticWorkloadFragmentShader (void)
429 {
430 return "#version 300 es\n"
431 "in mediump vec3 v_bcoords;\n"
432 "out mediump vec4 fragColor;\n"
433 "uniform mediump int u_iterations;\n"
434 "void main()\n"
435 "{\n"
436 " mediump float d = gl_FragCoord.z;\n"
437 " gl_FragDepth = gl_FragCoord.z + (v_bcoords.x + v_bcoords.y + v_bcoords.z)*0.05;\n" // Sum of v_bcoords components is allways 1
438 " for (int i = 0; i<u_iterations; i++)\n"
439 " d = d*sin(d)*sin(d) + d*cos(d)*cos(d);\n"
440 " if (v_bcoords.x < 0.02 || v_bcoords.y < 0.02 || v_bcoords.z < 0.02)\n"
441 " fragColor = vec4(1,d,d,1);\n"
442 " else\n"
443 " fragColor = vec4(d,0,0,1);\n"
444 "}\n";
445 }
446
getBaseShader(void)447 glu::ProgramSources getBaseShader (void)
448 {
449 return glu::makeVtxFragSources(getBaseVertexShader(), getDepthAsGreenFragmentShader());
450 }
451
getArithmeticWorkloadShader(void)452 glu::ProgramSources getArithmeticWorkloadShader (void)
453 {
454 return glu::makeVtxFragSources(getBaseVertexShader(), getArithmeticWorkloadFragmentShader());
455 }
456
getArithmeticWorkloadDiscardShader(void)457 glu::ProgramSources getArithmeticWorkloadDiscardShader (void)
458 {
459 return glu::makeVtxFragSources(getBaseVertexShader(), getArithmeticWorkloadDiscardFragmentShader());
460 }
461
getTextureWorkloadShader(void)462 glu::ProgramSources getTextureWorkloadShader (void)
463 {
464 return glu::makeVtxFragSources(getBaseVertexShader(), getTextureWorkloadFragmentShader());
465 }
466
getGridDiscardShader(int gridsize)467 glu::ProgramSources getGridDiscardShader (int gridsize)
468 {
469 return glu::makeVtxFragSources(getBaseVertexShader(), getGridDiscardFragmentShader(gridsize));
470 }
471
quadWith(const glu::ProgramSources & shader,float depth)472 inline ObjectData quadWith (const glu::ProgramSources& shader, float depth)
473 {
474 return ObjectData(shader, getFullscreenQuad(depth));
475 }
476
quadWith(const string & fragShader,float depth)477 inline ObjectData quadWith (const string& fragShader, float depth)
478 {
479 return ObjectData(glu::makeVtxFragSources(getBaseVertexShader(), fragShader), getFullscreenQuad(depth));
480 }
481
variableQuad(float depth)482 inline ObjectData variableQuad (float depth)
483 {
484 return ObjectData(glu::makeVtxFragSources(getInstanceNoiseVertexShader(), getDepthAsRedFragmentShader()), getFullscreenQuad(depth));
485 }
486
fastQuad(float depth)487 inline ObjectData fastQuad (float depth)
488 {
489 return ObjectData(getBaseShader(), getFullscreenQuad(depth));
490 }
491
slowQuad(float depth)492 inline ObjectData slowQuad (float depth)
493 {
494 return ObjectData(getArithmeticWorkloadShader(), getFullscreenQuad(depth));
495 }
496
fastQuadWithGradient(float depth0,float depth1)497 inline ObjectData fastQuadWithGradient (float depth0, float depth1)
498 {
499 return ObjectData(getBaseShader(), getFullscreenQuadWithGradient(depth0, depth1));
500 }
501 } // Utils
502
503 // Shared base
504 class BaseCase : public tcu::TestCase
505 {
506 public:
507 enum {RENDER_SIZE = 512};
508
509 BaseCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc);
~BaseCase(void)510 virtual ~BaseCase (void) {}
511
512 virtual IterateResult iterate (void);
513
514 protected:
515 void logSamples (const vector<Sample>& samples, const string& name, const string& desc);
516 void logGeometry (const tcu::ConstPixelBufferAccess& sample, const glu::ShaderProgram& occluderProg, const glu::ShaderProgram& occludedProg);
517 virtual void logAnalysis (const vector<Sample>& samples) = 0;
518 virtual void logDescription (void) = 0;
519
520 virtual ObjectData genOccluderGeometry (void) const = 0;
521 virtual ObjectData genOccludedGeometry (void) const = 0;
522
523 virtual int calibrate (void) const = 0;
524 virtual Sample renderSample (const RenderData& occluder, const RenderData& occluded, int workload) const = 0;
525
526 void render (const RenderData& data) const;
527 void render (const RenderData& data, int instances) const;
528
529 const RenderContext& m_renderCtx;
530 tcu::ResultCollector m_results;
531
532 enum {ITERATION_STEPS = 10, ITERATION_SAMPLES = 16};
533 };
534
BaseCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)535 BaseCase::BaseCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
536 : TestCase (testCtx, tcu::NODETYPE_PERFORMANCE, name, desc)
537 , m_renderCtx (renderCtx)
538 {
539 }
540
iterate(void)541 BaseCase::IterateResult BaseCase::iterate (void)
542 {
543 typedef de::MovePtr<RenderData> RenderDataP;
544
545 const glw::Functions& gl = m_renderCtx.getFunctions();
546 TestLog& log = m_testCtx.getLog();
547
548 const glu::Framebuffer framebuffer (gl);
549 const glu::Renderbuffer renderbuffer (gl);
550 const glu::Renderbuffer depthbuffer (gl);
551
552 vector<Sample> results;
553 vector<int> params;
554 RenderDataP occluderData;
555 RenderDataP occludedData;
556 tcu::TextureLevel resultTex (tcu::TextureFormat(tcu::TextureFormat::RGBA, tcu::TextureFormat::UNORM_INT8), RENDER_SIZE, RENDER_SIZE);
557 int maxWorkload = 0;
558 de::Random rng (deInt32Hash(deStringHash(getName())) ^ m_testCtx.getCommandLine().getBaseSeed());
559
560 logDescription();
561
562 gl.bindRenderbuffer(GL_RENDERBUFFER, *renderbuffer);
563 gl.renderbufferStorage(GL_RENDERBUFFER, GL_RGBA8, RENDER_SIZE, RENDER_SIZE);
564 gl.bindRenderbuffer(GL_RENDERBUFFER, *depthbuffer);
565 gl.renderbufferStorage(GL_RENDERBUFFER, GL_DEPTH24_STENCIL8, RENDER_SIZE, RENDER_SIZE);
566
567 gl.bindFramebuffer(GL_FRAMEBUFFER, *framebuffer);
568 gl.framebufferRenderbuffer(GL_FRAMEBUFFER, GL_COLOR_ATTACHMENT0, GL_RENDERBUFFER, *renderbuffer);
569 gl.framebufferRenderbuffer(GL_FRAMEBUFFER, GL_DEPTH_ATTACHMENT, GL_RENDERBUFFER, *depthbuffer);
570 gl.viewport(0, 0, RENDER_SIZE, RENDER_SIZE);
571 gl.clearColor(0.125f, 0.25f, 0.5f, 1.0f);
572
573 maxWorkload = calibrate();
574
575 // Setup data
576 occluderData = RenderDataP(new RenderData (genOccluderGeometry(), m_renderCtx, log));
577 occludedData = RenderDataP(new RenderData (genOccludedGeometry(), m_renderCtx, log));
578
579 TCU_CHECK(occluderData->m_program.isOk());
580 TCU_CHECK(occludedData->m_program.isOk());
581
582 // Force initialization of GPU resources
583 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
584 gl.enable(GL_DEPTH_TEST);
585
586 render(*occluderData);
587 render(*occludedData);
588 glu::readPixels(m_renderCtx, 0, 0, resultTex.getAccess());
589
590 logGeometry(resultTex.getAccess(), occluderData->m_program, occludedData->m_program);
591
592 params.reserve(ITERATION_STEPS*ITERATION_SAMPLES);
593
594 // Setup parameters
595 for (int step = 0; step < ITERATION_STEPS; step++)
596 {
597 const int workload = maxWorkload*step/ITERATION_STEPS;
598
599 for (int count = 0; count < ITERATION_SAMPLES; count++)
600 params.push_back(workload);
601 }
602
603 rng.shuffle(params.begin(), params.end());
604
605 // Render samples
606 for (size_t ndx = 0; ndx < params.size(); ndx++)
607 {
608 const int workload = params[ndx];
609 Sample sample = renderSample(*occluderData, *occludedData, workload);
610
611 sample.workload = workload;
612 sample.order = int(ndx);
613
614 results.push_back(sample);
615 }
616
617 logSamples(results, "Samples", "Samples");
618 logAnalysis(results);
619
620 m_results.setTestContextResult(m_testCtx);
621
622 return STOP;
623 }
624
logSamples(const vector<Sample> & samples,const string & name,const string & desc)625 void BaseCase::logSamples (const vector<Sample>& samples, const string& name, const string& desc)
626 {
627 TestLog& log = m_testCtx.getLog();
628
629 bool testOnly = true;
630
631 for (size_t ndx = 0; ndx < samples.size(); ndx++)
632 {
633 if (samples[ndx].baseTime != 0 || samples[ndx].nullTime != 0)
634 {
635 testOnly = false;
636 break;
637 }
638 }
639
640 log << TestLog::SampleList(name, desc);
641
642 if (testOnly)
643 {
644 log << TestLog::SampleInfo
645 << TestLog::ValueInfo("Workload", "Workload", "", QP_SAMPLE_VALUE_TAG_PREDICTOR)
646 << TestLog::ValueInfo("Order", "Order of sample", "", QP_SAMPLE_VALUE_TAG_PREDICTOR)
647 << TestLog::ValueInfo("TestTime", "Test render time", "us", QP_SAMPLE_VALUE_TAG_RESPONSE)
648 << TestLog::EndSampleInfo;
649
650 for (size_t sampleNdx = 0; sampleNdx < samples.size(); sampleNdx++)
651 {
652 const Sample& sample = samples[sampleNdx];
653
654 log << TestLog::Sample << sample.workload << sample.order << sample.testTime << TestLog::EndSample;
655 }
656 }
657 else
658 {
659 log << TestLog::SampleInfo
660 << TestLog::ValueInfo("Workload", "Workload", "", QP_SAMPLE_VALUE_TAG_PREDICTOR)
661 << TestLog::ValueInfo("Order", "Order of sample", "", QP_SAMPLE_VALUE_TAG_PREDICTOR)
662 << TestLog::ValueInfo("TestTime", "Test render time", "us", QP_SAMPLE_VALUE_TAG_RESPONSE)
663 << TestLog::ValueInfo("NullTime", "Read pixels time", "us", QP_SAMPLE_VALUE_TAG_RESPONSE)
664 << TestLog::ValueInfo("BaseTime", "Base render time", "us", QP_SAMPLE_VALUE_TAG_RESPONSE)
665 << TestLog::EndSampleInfo;
666
667 for (size_t sampleNdx = 0; sampleNdx < samples.size(); sampleNdx++)
668 {
669 const Sample& sample = samples[sampleNdx];
670
671 log << TestLog::Sample << sample.workload << sample.order << sample.testTime << sample.nullTime << sample.baseTime << TestLog::EndSample;
672 }
673 }
674
675 log << TestLog::EndSampleList;
676 }
677
logGeometry(const tcu::ConstPixelBufferAccess & sample,const glu::ShaderProgram & occluderProg,const glu::ShaderProgram & occludedProg)678 void BaseCase::logGeometry (const tcu::ConstPixelBufferAccess& sample, const glu::ShaderProgram& occluderProg, const glu::ShaderProgram& occludedProg)
679 {
680 TestLog& log = m_testCtx.getLog();
681
682 log << TestLog::Section("Geometry", "Geometry");
683 log << TestLog::Message << "Occluding geometry is green with shade dependent on depth (rgb == 0, depth, 0)" << TestLog::EndMessage;
684 log << TestLog::Message << "Occluded geometry is red with shade dependent on depth (rgb == depth, 0, 0)" << TestLog::EndMessage;
685 log << TestLog::Message << "Primitive edges are a lighter shade of red/green" << TestLog::EndMessage;
686
687 log << TestLog::Image("Test Geometry", "Test Geometry", sample);
688 log << TestLog::EndSection;
689
690 log << TestLog::Section("Occluder", "Occluder");
691 log << occluderProg;
692 log << TestLog::EndSection;
693
694 log << TestLog::Section("Occluded", "Occluded");
695 log << occludedProg;
696 log << TestLog::EndSection;
697 }
698
render(const RenderData & data) const699 void BaseCase::render (const RenderData& data) const
700 {
701 const glw::Functions& gl = m_renderCtx.getFunctions();
702
703 gl.useProgram(data.m_program.getProgram());
704
705 gl.bindVertexArray(*data.m_vao);
706 gl.drawArrays(GL_TRIANGLES, 0, data.m_numVertices);
707 gl.bindVertexArray(0);
708 }
709
render(const RenderData & data,int instances) const710 void BaseCase::render (const RenderData& data, int instances) const
711 {
712 const glw::Functions& gl = m_renderCtx.getFunctions();
713
714 gl.useProgram(data.m_program.getProgram());
715
716 gl.bindVertexArray(*data.m_vao);
717 gl.drawArraysInstanced(GL_TRIANGLES, 0, data.m_numVertices, instances);
718 gl.bindVertexArray(0);
719 }
720
721 // Render occluder once, then repeatedly render occluded geometry. Sample with multiple repetition counts & establish time per call with linear regression
722 class RenderCountCase : public BaseCase
723 {
724 public:
725 RenderCountCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc);
~RenderCountCase(void)726 ~RenderCountCase (void) {}
727
728 protected:
729 virtual void logAnalysis (const vector<Sample>& samples);
730
731 private:
732 virtual int calibrate (void) const;
733 virtual Sample renderSample (const RenderData& occluder, const RenderData& occluded, int callcount) const;
734 };
735
RenderCountCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)736 RenderCountCase::RenderCountCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
737 : BaseCase (testCtx, renderCtx, name, desc)
738 {
739 }
740
logAnalysis(const vector<Sample> & samples)741 void RenderCountCase::logAnalysis (const vector<Sample>& samples)
742 {
743 using namespace gls;
744
745 TestLog& log = m_testCtx.getLog();
746 int maxWorkload = 0;
747 vector<Vec2> testSamples (samples.size());
748
749 for (size_t ndx = 0; ndx < samples.size(); ndx++)
750 {
751 const Sample& sample = samples[ndx];
752
753 testSamples[ndx] = Vec2((float)sample.workload, (float)sample.testTime);
754
755 maxWorkload = de::max(maxWorkload, sample.workload);
756 }
757
758 {
759 const float confidence = 0.60f;
760 const LineParametersWithConfidence testParam = theilSenSiegelLinearRegression(testSamples, confidence);
761 const float usPerCall = testParam.coefficient;
762 const float pxPerCall = RENDER_SIZE*RENDER_SIZE;
763 const float pxPerUs = pxPerCall/usPerCall;
764 const float mpxPerS = pxPerUs;
765
766 log << TestLog::Section("Linear Regression", "Linear Regression");
767 log << TestLog::Message << "Offset & coefficient presented as [confidence interval min, estimate, confidence interval max]. Reported confidence interval for this test is " << confidence << TestLog::EndMessage;
768 log << TestLog::Message << "Render time for scene with depth test was\n\t"
769 << "[" << testParam.offsetConfidenceLower << ", " << testParam.offset << ", " << testParam.offsetConfidenceUpper << "]us +"
770 << "[" << testParam.coefficientConfidenceLower << ", " << testParam.coefficient << ", " << testParam.coefficientConfidenceUpper << "]"
771 << "us/workload" << TestLog::EndMessage;
772 log << TestLog::EndSection;
773
774 log << TestLog::Section("Result", "Result");
775
776 if (testParam.coefficientConfidenceLower < 0.0f)
777 {
778 log << TestLog::Message << "Coefficient confidence bounds include values below 0.0, the operation likely has neglible per-pixel cost" << TestLog::EndMessage;
779 m_results.addResult(QP_TEST_RESULT_PASS, "Pass");
780 }
781 else if (testParam.coefficientConfidenceLower < testParam.coefficientConfidenceUpper*0.25)
782 {
783 log << TestLog::Message << "Coefficient confidence range is extremely large, cannot give reliable result" << TestLog::EndMessage;
784 m_results.addResult(QP_TEST_RESULT_PASS, "Result confidence extremely low");
785 }
786 else
787 {
788 log << TestLog::Message << "Culled hidden pixels @ " << mpxPerS << "Mpx/s" << TestLog::EndMessage;
789 m_results.addResult(QP_TEST_RESULT_PASS, de::floatToString(mpxPerS, 2));
790 }
791
792 log << TestLog::EndSection;
793 }
794 }
795
renderSample(const RenderData & occluder,const RenderData & occluded,int callcount) const796 Sample RenderCountCase::renderSample (const RenderData& occluder, const RenderData& occluded, int callcount) const
797 {
798 const glw::Functions& gl = m_renderCtx.getFunctions();
799 Sample sample;
800 deUint64 now = 0;
801 deUint64 prev = 0;
802 deUint8 buffer[4];
803
804 // Stabilize
805 {
806 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
807 gl.enable(GL_DEPTH_TEST);
808 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
809 }
810
811 prev = deGetMicroseconds();
812
813 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
814 gl.enable(GL_DEPTH_TEST);
815
816 render(occluder);
817 render(occluded, callcount);
818
819 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
820
821 now = deGetMicroseconds();
822
823 sample.testTime = now - prev;
824 sample.baseTime = 0;
825 sample.nullTime = 0;
826 sample.workload = callcount;
827
828 return sample;
829 }
830
calibrate(void) const831 int RenderCountCase::calibrate (void) const
832 {
833 using namespace gls;
834
835 const glw::Functions& gl = m_renderCtx.getFunctions();
836 TestLog& log = m_testCtx.getLog();
837
838 const RenderData occluderGeometry (genOccluderGeometry(), m_renderCtx, log);
839 const RenderData occludedGeometry (genOccludedGeometry(), m_renderCtx, log);
840
841 TheilSenCalibrator calibrator (CalibratorParameters(20, // Initial workload
842 10, // Max iteration frames
843 20.0f, // Iteration shortcut threshold ms
844 20, // Max iterations
845 33.0f, // Target frame time
846 40.0f, // Frame time cap
847 1000.0f // Target measurement duration
848 ));
849
850 while (true)
851 {
852 switch(calibrator.getState())
853 {
854 case TheilSenCalibrator::STATE_FINISHED:
855 logCalibrationInfo(m_testCtx.getLog(), calibrator);
856 return calibrator.getCallCount();
857
858 case TheilSenCalibrator::STATE_MEASURE:
859 {
860 deUint8 buffer[4];
861 deInt64 now;
862 deInt64 prev;
863
864 prev = deGetMicroseconds();
865
866 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
867 gl.disable(GL_DEPTH_TEST);
868
869 render(occluderGeometry);
870 render(occludedGeometry, calibrator.getCallCount());
871
872 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
873
874 now = deGetMicroseconds();
875
876 calibrator.recordIteration(now - prev);
877 break;
878 }
879
880 case TheilSenCalibrator::STATE_RECOMPUTE_PARAMS:
881 calibrator.recomputeParameters();
882 break;
883 default:
884 DE_ASSERT(false);
885 return 1;
886 }
887 }
888 }
889
890 // Compares time/workload gradients of same geometry with and without depth testing
891 class RelativeChangeCase : public BaseCase
892 {
893 public:
894 RelativeChangeCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc);
~RelativeChangeCase(void)895 virtual ~RelativeChangeCase (void) {}
896
897 protected:
898 Sample renderSample (const RenderData& occluder, const RenderData& occluded, int workload) const;
899
900 virtual void logAnalysis (const vector<Sample>& samples);
901
902 private:
903 int calibrate (void) const;
904 };
905
RelativeChangeCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)906 RelativeChangeCase::RelativeChangeCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
907 : BaseCase (testCtx, renderCtx, name, desc)
908 {
909 }
910
calibrate(void) const911 int RelativeChangeCase::calibrate (void) const
912 {
913 using namespace gls;
914
915 const glw::Functions& gl = m_renderCtx.getFunctions();
916 TestLog& log = m_testCtx.getLog();
917
918 const RenderData geom (genOccludedGeometry(), m_renderCtx, log);
919
920 TheilSenCalibrator calibrator(CalibratorParameters( 20, // Initial workload
921 10, // Max iteration frames
922 20.0f, // Iteration shortcut threshold ms
923 20, // Max iterations
924 33.0f, // Target frame time
925 40.0f, // Frame time cap
926 1000.0f // Target measurement duration
927 ));
928
929 while (true)
930 {
931 switch(calibrator.getState())
932 {
933 case TheilSenCalibrator::STATE_FINISHED:
934 logCalibrationInfo(m_testCtx.getLog(), calibrator);
935 return calibrator.getCallCount();
936
937 case TheilSenCalibrator::STATE_MEASURE:
938 {
939 deUint8 buffer[4];
940 const GLuint program = geom.m_program.getProgram();
941
942 gl.useProgram(program);
943 gl.uniform1i(gl.getUniformLocation(program, "u_iterations"), calibrator.getCallCount());
944
945 const deInt64 prev = deGetMicroseconds();
946
947 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
948 gl.disable(GL_DEPTH_TEST);
949
950 render(geom);
951
952 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
953
954 const deInt64 now = deGetMicroseconds();
955
956 calibrator.recordIteration(now - prev);
957 break;
958 }
959
960 case TheilSenCalibrator::STATE_RECOMPUTE_PARAMS:
961 calibrator.recomputeParameters();
962 break;
963 default:
964 DE_ASSERT(false);
965 return 1;
966 }
967 }
968 }
969
renderSample(const RenderData & occluder,const RenderData & occluded,int workload) const970 Sample RelativeChangeCase::renderSample (const RenderData& occluder, const RenderData& occluded, int workload) const
971 {
972 const glw::Functions& gl = m_renderCtx.getFunctions();
973 const GLuint program = occluded.m_program.getProgram();
974 Sample sample;
975 deUint64 now = 0;
976 deUint64 prev = 0;
977 deUint8 buffer[4];
978
979 gl.useProgram(program);
980 gl.uniform1i(gl.getUniformLocation(program, "u_iterations"), workload);
981
982 // Warmup (this workload seems to reduce variation in following workloads)
983 {
984 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
985 gl.disable(GL_DEPTH_TEST);
986
987 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
988 }
989
990 // Null time
991 {
992 prev = deGetMicroseconds();
993
994 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
995 gl.disable(GL_DEPTH_TEST);
996
997 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
998
999 now = deGetMicroseconds();
1000
1001 sample.nullTime = now - prev;
1002 }
1003
1004 // Test time
1005 {
1006 prev = deGetMicroseconds();
1007
1008 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
1009 gl.enable(GL_DEPTH_TEST);
1010
1011 render(occluder);
1012 render(occluded);
1013
1014 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
1015
1016 now = deGetMicroseconds();
1017
1018 sample.testTime = now - prev;
1019 }
1020
1021 // Base time
1022 {
1023 prev = deGetMicroseconds();
1024
1025 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
1026 gl.disable(GL_DEPTH_TEST);
1027
1028 render(occluder);
1029 render(occluded);
1030
1031 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
1032
1033 now = deGetMicroseconds();
1034
1035 sample.baseTime = now - prev;
1036 }
1037
1038 sample.workload = 0;
1039
1040 return sample;
1041 }
1042
logAnalysis(const vector<Sample> & samples)1043 void RelativeChangeCase::logAnalysis (const vector<Sample>& samples)
1044 {
1045 using namespace gls;
1046
1047 TestLog& log = m_testCtx.getLog();
1048
1049 int maxWorkload = 0;
1050
1051 vector<Vec2> nullSamples (samples.size());
1052 vector<Vec2> baseSamples (samples.size());
1053 vector<Vec2> testSamples (samples.size());
1054
1055 for (size_t ndx = 0; ndx < samples.size(); ndx++)
1056 {
1057 const Sample& sample = samples[ndx];
1058
1059 nullSamples[ndx] = Vec2((float)sample.workload, (float)sample.nullTime);
1060 baseSamples[ndx] = Vec2((float)sample.workload, (float)sample.baseTime);
1061 testSamples[ndx] = Vec2((float)sample.workload, (float)sample.testTime);
1062
1063 maxWorkload = de::max(maxWorkload, sample.workload);
1064 }
1065
1066 {
1067 const float confidence = 0.60f;
1068
1069 const LineParametersWithConfidence nullParam = theilSenSiegelLinearRegression(nullSamples, confidence);
1070 const LineParametersWithConfidence baseParam = theilSenSiegelLinearRegression(baseSamples, confidence);
1071 const LineParametersWithConfidence testParam = theilSenSiegelLinearRegression(testSamples, confidence);
1072
1073 if (!de::inRange(0.0f, nullParam.coefficientConfidenceLower, nullParam.coefficientConfidenceUpper))
1074 {
1075 m_results.addResult(QP_TEST_RESULT_FAIL, "Constant operation sequence duration not constant");
1076 log << TestLog::Message << "Constant operation sequence timing may vary as a function of workload. Result quality extremely low" << TestLog::EndMessage;
1077 }
1078
1079 if (de::inRange(0.0f, baseParam.coefficientConfidenceLower, baseParam.coefficientConfidenceUpper))
1080 {
1081 m_results.addResult(QP_TEST_RESULT_FAIL, "Workload has no effect on duration");
1082 log << TestLog::Message << "Workload factor has no effect on duration of sample (smart optimizer?)" << TestLog::EndMessage;
1083 }
1084
1085 log << TestLog::Section("Linear Regression", "Linear Regression");
1086 log << TestLog::Message << "Offset & coefficient presented as [confidence interval min, estimate, confidence interval max]. Reported confidence interval for this test is " << confidence << TestLog::EndMessage;
1087
1088 log << TestLog::Message << "Render time for empty scene was\n\t"
1089 << "[" << nullParam.offsetConfidenceLower << ", " << nullParam.offset << ", " << nullParam.offsetConfidenceUpper << "]us +"
1090 << "[" << nullParam.coefficientConfidenceLower << ", " << nullParam.coefficient << ", " << nullParam.coefficientConfidenceUpper << "]"
1091 << "us/workload" << TestLog::EndMessage;
1092
1093 log << TestLog::Message << "Render time for scene without depth test was\n\t"
1094 << "[" << baseParam.offsetConfidenceLower << ", " << baseParam.offset << ", " << baseParam.offsetConfidenceUpper << "]us +"
1095 << "[" << baseParam.coefficientConfidenceLower << ", " << baseParam.coefficient << ", " << baseParam.coefficientConfidenceUpper << "]"
1096 << "us/workload" << TestLog::EndMessage;
1097
1098 log << TestLog::Message << "Render time for scene with depth test was\n\t"
1099 << "[" << testParam.offsetConfidenceLower << ", " << testParam.offset << ", " << testParam.offsetConfidenceUpper << "]us +"
1100 << "[" << testParam.coefficientConfidenceLower << ", " << testParam.coefficient << ", " << testParam.coefficientConfidenceUpper << "]"
1101 << "us/workload" << TestLog::EndMessage;
1102
1103 log << TestLog::EndSection;
1104
1105 if (de::inRange(0.0f, testParam.coefficientConfidenceLower, testParam.coefficientConfidenceUpper))
1106 {
1107 log << TestLog::Message << "Test duration not dependent on culled workload" << TestLog::EndMessage;
1108 m_results.addResult(QP_TEST_RESULT_PASS, "0.0");
1109 }
1110 else if (testParam.coefficientConfidenceLower < testParam.coefficientConfidenceUpper*0.25)
1111 {
1112 log << TestLog::Message << "Coefficient confidence range is extremely large, cannot give reliable result" << TestLog::EndMessage;
1113 m_results.addResult(QP_TEST_RESULT_PASS, "Result confidence extremely low");
1114 }
1115 else if (baseParam.coefficientConfidenceLower < baseParam.coefficientConfidenceUpper*0.25)
1116 {
1117 log << TestLog::Message << "Coefficient confidence range for base render time is extremely large, cannot give reliable result" << TestLog::EndMessage;
1118 m_results.addResult(QP_TEST_RESULT_PASS, "Result confidence extremely low");
1119 }
1120 else
1121 {
1122 log << TestLog::Message << "Test duration is dependent on culled workload" << TestLog::EndMessage;
1123 m_results.addResult(QP_TEST_RESULT_PASS, de::floatToString(de::abs(testParam.coefficient)/de::abs(baseParam.coefficient), 2));
1124 }
1125 }
1126 }
1127
1128 // Speed of trivial culling
1129 class BaseCostCase : public RenderCountCase
1130 {
1131 public:
BaseCostCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1132 BaseCostCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1133 : RenderCountCase (testCtx, renderCtx, name, desc) {}
1134
~BaseCostCase(void)1135 ~BaseCostCase (void) {}
1136
1137 private:
genOccluderGeometry(void) const1138 virtual ObjectData genOccluderGeometry (void) const { return Utils::fastQuad(0.2f); }
genOccludedGeometry(void) const1139 virtual ObjectData genOccludedGeometry (void) const { return Utils::variableQuad(0.8f); }
1140
logDescription(void)1141 virtual void logDescription (void)
1142 {
1143 TestLog& log = m_testCtx.getLog();
1144
1145 log << TestLog::Section("Description", "Test description");
1146 log << TestLog::Message << "Testing hidden fragment culling speed" << TestLog::EndMessage;
1147 log << TestLog::Message << "Geometry consists of two fullsceen quads. The first (occluding) is rendered once, the second (occluded) is rendered repeatedly" << TestLog::EndMessage;
1148 log << TestLog::Message << "Workload indicates the number of times the occluded quad is rendered" << TestLog::EndMessage;
1149 log << TestLog::Message << "The time per culled pixel is estimated from the rate of change of rendering time as a function of workload" << TestLog::EndMessage;
1150 log << TestLog::EndSection;
1151 }
1152 };
1153
1154 // Gradient
1155 class GradientCostCase : public RenderCountCase
1156 {
1157 public:
GradientCostCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc,float gradientDistance)1158 GradientCostCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc, float gradientDistance)
1159 : RenderCountCase (testCtx, renderCtx, name, desc)
1160 , m_gradientDistance (gradientDistance)
1161 {
1162 }
1163
~GradientCostCase(void)1164 ~GradientCostCase (void) {}
1165
1166 private:
genOccluderGeometry(void) const1167 virtual ObjectData genOccluderGeometry (void) const { return Utils::fastQuadWithGradient(0.0f, 1.0f - m_gradientDistance); }
genOccludedGeometry(void) const1168 virtual ObjectData genOccludedGeometry (void) const
1169 {
1170 return ObjectData(glu::makeVtxFragSources(Utils::getInstanceNoiseVertexShader(), Utils::getDepthAsRedFragmentShader()), Utils::getFullscreenQuadWithGradient(m_gradientDistance, 1.0f));
1171 }
1172
logDescription(void)1173 virtual void logDescription (void)
1174 {
1175 TestLog& log = m_testCtx.getLog();
1176
1177 log << TestLog::Section("Description", "Test description");
1178 log << TestLog::Message << "Testing hidden fragment culling speed" << TestLog::EndMessage;
1179 log << TestLog::Message << "Geometry consists of two fullsceen quads. The first (occluding) is rendered once, the second (occluded) is rendered repeatedly" << TestLog::EndMessage;
1180 log << TestLog::Message << "Workload indicates the number of times the occluded quad is rendered" << TestLog::EndMessage;
1181 log << TestLog::Message << "The quads are tilted so that the left edge of the occluded quad has a depth of 1.0 and the right edge of the occluding quad has a depth of 0.0." << TestLog::EndMessage;
1182 log << TestLog::Message << "The quads are spaced to have a depth difference of " << m_gradientDistance << " at all points." << TestLog::EndMessage;
1183 log << TestLog::Message << "The time per culled pixel is estimated from the rate of change of rendering time as a function of workload" << TestLog::EndMessage;
1184 log << TestLog::EndSection;
1185 }
1186
1187 const float m_gradientDistance;
1188 };
1189
1190 // Constant offset to frag depth in occluder
1191 class OccluderStaticFragDepthCostCase : public RenderCountCase
1192 {
1193 public:
OccluderStaticFragDepthCostCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1194 OccluderStaticFragDepthCostCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1195 : RenderCountCase(testCtx, renderCtx, name, desc)
1196 {
1197 }
1198
~OccluderStaticFragDepthCostCase(void)1199 ~OccluderStaticFragDepthCostCase (void) {}
1200
1201 private:
genOccluderGeometry(void) const1202 virtual ObjectData genOccluderGeometry (void) const { return Utils::quadWith(Utils::getStaticFragDepthFragmentShader(), 0.2f); }
genOccludedGeometry(void) const1203 virtual ObjectData genOccludedGeometry (void) const { return Utils::fastQuad(0.8f); }
1204
logDescription(void)1205 virtual void logDescription (void)
1206 {
1207 TestLog& log = m_testCtx.getLog();
1208
1209 log << TestLog::Section("Description", "Test description");
1210 log << TestLog::Message << "Testing hidden fragment culling speed" << TestLog::EndMessage;
1211 log << TestLog::Message << "Geometry consists of two fullsceen quads. The first (occluding) is rendered once, the second (occluded) is rendered repeatedly" << TestLog::EndMessage;
1212 log << TestLog::Message << "Workload indicates the number of times the occluded quad is rendered" << TestLog::EndMessage;
1213 log << TestLog::Message << "The occluder quad has a static offset applied to gl_FragDepth" << TestLog::EndMessage;
1214 log << TestLog::Message << "The time per culled pixel is estimated from the rate of change of rendering time as a function of workload" << TestLog::EndMessage;
1215 log << TestLog::EndSection;
1216 }
1217 };
1218
1219 // Dynamic offset to frag depth in occluder
1220 class OccluderDynamicFragDepthCostCase : public RenderCountCase
1221 {
1222 public:
OccluderDynamicFragDepthCostCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1223 OccluderDynamicFragDepthCostCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1224 : RenderCountCase(testCtx, renderCtx, name, desc)
1225 {
1226 }
1227
~OccluderDynamicFragDepthCostCase(void)1228 ~OccluderDynamicFragDepthCostCase (void) {}
1229
1230 private:
genOccluderGeometry(void) const1231 virtual ObjectData genOccluderGeometry (void) const { return Utils::quadWith(Utils::getDynamicFragDepthFragmentShader(), 0.2f); }
genOccludedGeometry(void) const1232 virtual ObjectData genOccludedGeometry (void) const { return Utils::fastQuad(0.8f); }
1233
logDescription(void)1234 virtual void logDescription (void)
1235 {
1236 TestLog& log = m_testCtx.getLog();
1237
1238 log << TestLog::Section("Description", "Test description");
1239 log << TestLog::Message << "Testing hidden fragment culling speed" << TestLog::EndMessage;
1240 log << TestLog::Message << "Geometry consists of two fullsceen quads. The first (occluding) is rendered once, the second (occluded) is rendered repeatedly" << TestLog::EndMessage;
1241 log << TestLog::Message << "Workload indicates the number of times the occluded quad is rendered" << TestLog::EndMessage;
1242 log << TestLog::Message << "The occluder quad has a dynamic offset applied to gl_FragDepth" << TestLog::EndMessage;
1243 log << TestLog::Message << "The time per culled pixel is estimated from the rate of change of rendering time as a function of workload" << TestLog::EndMessage;
1244 log << TestLog::EndSection;
1245 }
1246 };
1247
1248 // Constant offset to frag depth in occluder
1249 class OccludedStaticFragDepthCostCase : public RenderCountCase
1250 {
1251 public:
OccludedStaticFragDepthCostCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1252 OccludedStaticFragDepthCostCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1253 : RenderCountCase(testCtx, renderCtx, name, desc)
1254 {
1255 }
1256
~OccludedStaticFragDepthCostCase(void)1257 ~OccludedStaticFragDepthCostCase (void) {}
1258
1259 private:
genOccluderGeometry(void) const1260 virtual ObjectData genOccluderGeometry (void) const { return Utils::fastQuad(0.2f); }
genOccludedGeometry(void) const1261 virtual ObjectData genOccludedGeometry (void) const { return Utils::quadWith(Utils::getStaticFragDepthFragmentShader(), 0.2f); }
1262
logDescription(void)1263 virtual void logDescription (void)
1264 {
1265 TestLog& log = m_testCtx.getLog();
1266
1267 log << TestLog::Section("Description", "Test description");
1268 log << TestLog::Message << "Testing hidden fragment culling speed" << TestLog::EndMessage;
1269 log << TestLog::Message << "Geometry consists of two fullsceen quads. The first (occluding) is rendered once, the second (occluded) is rendered repeatedly" << TestLog::EndMessage;
1270 log << TestLog::Message << "Workload indicates the number of times the occluded quad is rendered" << TestLog::EndMessage;
1271 log << TestLog::Message << "The occluded quad has a static offset applied to gl_FragDepth" << TestLog::EndMessage;
1272 log << TestLog::Message << "The time per culled pixel is estimated from the rate of change of rendering time as a function of workload" << TestLog::EndMessage;
1273 log << TestLog::EndSection;
1274 }
1275 };
1276
1277 // Dynamic offset to frag depth in occluder
1278 class OccludedDynamicFragDepthCostCase : public RenderCountCase
1279 {
1280 public:
OccludedDynamicFragDepthCostCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1281 OccludedDynamicFragDepthCostCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1282 : RenderCountCase(testCtx, renderCtx, name, desc)
1283 {
1284 }
1285
~OccludedDynamicFragDepthCostCase(void)1286 ~OccludedDynamicFragDepthCostCase (void) {}
1287
1288 private:
genOccluderGeometry(void) const1289 virtual ObjectData genOccluderGeometry (void) const { return Utils::fastQuad(0.2f); }
genOccludedGeometry(void) const1290 virtual ObjectData genOccludedGeometry (void) const { return Utils::quadWith(Utils::getDynamicFragDepthFragmentShader(), 0.2f); }
1291
logDescription(void)1292 virtual void logDescription (void)
1293 {
1294 TestLog& log = m_testCtx.getLog();
1295
1296 log << TestLog::Section("Description", "Test description");
1297 log << TestLog::Message << "Testing hidden fragment culling speed" << TestLog::EndMessage;
1298 log << TestLog::Message << "Geometry consists of two fullsceen quads. The first (occluding) is rendered once, the second (occluded) is rendered repeatedly" << TestLog::EndMessage;
1299 log << TestLog::Message << "Workload indicates the number of times the occluded quad is rendered" << TestLog::EndMessage;
1300 log << TestLog::Message << "The occluded quad has a dynamic offset applied to gl_FragDepth" << TestLog::EndMessage;
1301 log << TestLog::Message << "The time per culled pixel is estimated from the rate of change of rendering time as a function of workload" << TestLog::EndMessage;
1302 log << TestLog::EndSection;
1303 }
1304 };
1305
1306 // Culling speed with slightly less trivial geometry
1307 class OccludingGeometryComplexityCostCase : public RenderCountCase
1308 {
1309 public:
OccludingGeometryComplexityCostCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc,int resolution,float xyNoise,float zNoise)1310 OccludingGeometryComplexityCostCase (TestContext& testCtx,
1311 const RenderContext& renderCtx,
1312 const char* name,
1313 const char* desc,
1314 int resolution,
1315 float xyNoise,
1316 float zNoise)
1317 : RenderCountCase (testCtx, renderCtx, name, desc)
1318 , m_resolution (resolution)
1319 , m_xyNoise (xyNoise)
1320 , m_zNoise (zNoise)
1321 {
1322 }
1323
~OccludingGeometryComplexityCostCase(void)1324 ~OccludingGeometryComplexityCostCase (void) {}
1325
1326 private:
genOccluderGeometry(void) const1327 virtual ObjectData genOccluderGeometry (void) const
1328 {
1329 return ObjectData(Utils::getBaseShader(),
1330 Utils::getFullScreenGrid(m_resolution,
1331 deInt32Hash(deStringHash(getName())) ^ m_testCtx.getCommandLine().getBaseSeed(),
1332 0.2f,
1333 m_zNoise,
1334 m_xyNoise));
1335 }
1336
genOccludedGeometry(void) const1337 virtual ObjectData genOccludedGeometry (void) const { return Utils::variableQuad(0.8f); }
1338
logDescription(void)1339 virtual void logDescription (void)
1340 {
1341 TestLog& log = m_testCtx.getLog();
1342
1343 log << TestLog::Section("Description", "Test description");
1344 log << TestLog::Message << "Testing hidden fragment culling speed" << TestLog::EndMessage;
1345 log << TestLog::Message << "Geometry consists of an occluding grid and an occluded fullsceen quad. The occluding geometry is rendered once, the occluded one is rendered repeatedly" << TestLog::EndMessage;
1346 log << TestLog::Message << "Workload indicates the number of times the occluded quad is rendered" << TestLog::EndMessage;
1347 log << TestLog::Message << "The time per culled pixel is estimated from the rate of change of rendering time as a function of workload" << TestLog::EndMessage;
1348 log << TestLog::EndSection;
1349 }
1350
1351 const int m_resolution;
1352 const float m_xyNoise;
1353 const float m_zNoise;
1354 };
1355
1356
1357 // Cases with varying workloads in the fragment shader
1358 class FragmentWorkloadCullCase : public RelativeChangeCase
1359 {
1360 public:
1361 FragmentWorkloadCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc);
~FragmentWorkloadCullCase(void)1362 virtual ~FragmentWorkloadCullCase (void) {}
1363
1364 private:
genOccluderGeometry(void) const1365 virtual ObjectData genOccluderGeometry (void) const { return Utils::fastQuad(0.2f); }
1366
1367 virtual void logDescription (void);
1368 };
1369
FragmentWorkloadCullCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1370 FragmentWorkloadCullCase::FragmentWorkloadCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1371 : RelativeChangeCase (testCtx, renderCtx, name, desc)
1372 {
1373 }
1374
logDescription(void)1375 void FragmentWorkloadCullCase::logDescription (void)
1376 {
1377 TestLog& log = m_testCtx.getLog();
1378
1379 log << TestLog::Section("Description", "Test description");
1380 log << TestLog::Message << "Testing effects of culled fragment workload on render time" << TestLog::EndMessage;
1381 log << TestLog::Message << "Geometry consists of two fullsceen quads. The first (occluding) quad uses a trivial shader,"
1382 "the second (occluded) contains significant fragment shader work" << TestLog::EndMessage;
1383 log << TestLog::Message << "Workload indicates the number of iterations of dummy work done in the occluded quad's fragment shader" << TestLog::EndMessage;
1384 log << TestLog::Message << "The ratio of rendering times of this scene with/without depth testing are compared" << TestLog::EndMessage;
1385 log << TestLog::Message << "Successfull early Z-testing should result in no correlation between workload and render time" << TestLog::EndMessage;
1386 log << TestLog::EndSection;
1387 }
1388
1389 // Additional workload consists of texture lookups
1390 class FragmentTextureWorkloadCullCase : public FragmentWorkloadCullCase
1391 {
1392 public:
1393 FragmentTextureWorkloadCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc);
~FragmentTextureWorkloadCullCase(void)1394 virtual ~FragmentTextureWorkloadCullCase (void) {}
1395
1396 virtual void init (void);
1397 virtual void deinit (void);
1398
1399 private:
1400 typedef MovePtr<glu::Texture> TexPtr;
1401
genOccludedGeometry(void) const1402 virtual ObjectData genOccludedGeometry (void) const
1403 {
1404 return ObjectData(Utils::getTextureWorkloadShader(), Utils::getFullscreenQuad(0.8f));
1405 }
1406
1407 TexPtr m_texture;
1408 };
1409
FragmentTextureWorkloadCullCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1410 FragmentTextureWorkloadCullCase::FragmentTextureWorkloadCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1411 : FragmentWorkloadCullCase (testCtx, renderCtx, name, desc)
1412 {
1413 }
1414
init(void)1415 void FragmentTextureWorkloadCullCase::init (void)
1416 {
1417 const glw::Functions& gl = m_renderCtx.getFunctions();
1418 const int size = 128;
1419 const vector<deUint8> data (size*size*4, 255);
1420
1421 m_texture = MovePtr<glu::Texture>(new glu::Texture(gl));
1422
1423 gl.bindTexture(GL_TEXTURE_2D, m_texture);
1424 gl.texImage2D(GL_TEXTURE_2D, 0, GL_RGBA8, size, size, 0, GL_RGBA, GL_UNSIGNED_BYTE, &data[0]);
1425 gl.texParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_NEAREST);
1426 gl.texParameteri(GL_TEXTURE_2D, GL_TEXTURE_MAG_FILTER, GL_NEAREST);
1427 }
1428
deinit(void)1429 void FragmentTextureWorkloadCullCase::deinit (void)
1430 {
1431 m_texture.clear();
1432 }
1433
1434 // Additional workload consists of arithmetic
1435 class FragmentArithmeticWorkloadCullCase : public FragmentWorkloadCullCase
1436 {
1437 public:
FragmentArithmeticWorkloadCullCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1438 FragmentArithmeticWorkloadCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1439 : FragmentWorkloadCullCase (testCtx, renderCtx, name, desc)
1440 {
1441 }
~FragmentArithmeticWorkloadCullCase(void)1442 virtual ~FragmentArithmeticWorkloadCullCase (void) {}
1443
1444 private:
genOccludedGeometry(void) const1445 virtual ObjectData genOccludedGeometry (void) const
1446 {
1447 return ObjectData(Utils::getArithmeticWorkloadShader(), Utils::getFullscreenQuad(0.8f));
1448 }
1449 };
1450
1451 // Contains dynamicly unused discard after a series of calculations
1452 class FragmentDiscardArithmeticWorkloadCullCase : public FragmentWorkloadCullCase
1453 {
1454 public:
FragmentDiscardArithmeticWorkloadCullCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1455 FragmentDiscardArithmeticWorkloadCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1456 : FragmentWorkloadCullCase (testCtx, renderCtx, name, desc)
1457 {
1458 }
1459
~FragmentDiscardArithmeticWorkloadCullCase(void)1460 virtual ~FragmentDiscardArithmeticWorkloadCullCase (void) {}
1461
1462 private:
genOccludedGeometry(void) const1463 virtual ObjectData genOccludedGeometry (void) const
1464 {
1465 return ObjectData(Utils::getArithmeticWorkloadDiscardShader(), Utils::getFullscreenQuad(0.8f));
1466 }
1467
logDescription(void)1468 virtual void logDescription (void)
1469 {
1470 TestLog& log = m_testCtx.getLog();
1471
1472 log << TestLog::Section("Description", "Test description");
1473 log << TestLog::Message << "Testing effects of culled fragment workload on render time" << TestLog::EndMessage;
1474 log << TestLog::Message << "Geometry consists of two fullsceen quads. The first (occluding) quad uses a trivial shader,"
1475 "the second (occluded) contains significant fragment shader work and a discard that is never triggers but has a dynamic condition" << TestLog::EndMessage;
1476 log << TestLog::Message << "Workload indicates the number of iterations of dummy work done in the occluded quad's fragment shader" << TestLog::EndMessage;
1477 log << TestLog::Message << "The ratio of rendering times of this scene with/without depth testing are compared" << TestLog::EndMessage;
1478 log << TestLog::Message << "Successfull early Z-testing should result in no correlation between workload and render time" << TestLog::EndMessage;
1479 log << TestLog::EndSection;
1480 }
1481 };
1482
1483 // Discards fragments from the occluder in a grid pattern
1484 class PartialOccluderDiscardCullCase : public RelativeChangeCase
1485 {
1486 public:
PartialOccluderDiscardCullCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc,int gridsize)1487 PartialOccluderDiscardCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc, int gridsize)
1488 : RelativeChangeCase (testCtx, renderCtx, name, desc)
1489 , m_gridsize (gridsize)
1490 {
1491 }
~PartialOccluderDiscardCullCase(void)1492 virtual ~PartialOccluderDiscardCullCase (void) {}
1493
1494 private:
genOccluderGeometry(void) const1495 virtual ObjectData genOccluderGeometry (void) const { return Utils::quadWith(Utils::getGridDiscardShader(m_gridsize), 0.2f); }
genOccludedGeometry(void) const1496 virtual ObjectData genOccludedGeometry (void) const { return Utils::slowQuad(0.8f); }
1497
logDescription(void)1498 virtual void logDescription (void)
1499 {
1500 TestLog& log = m_testCtx.getLog();
1501
1502 log << TestLog::Section("Description", "Test description");
1503 log << TestLog::Message << "Testing effects of partially discarded occluder on rendering time" << TestLog::EndMessage;
1504 log << TestLog::Message << "Geometry consists of two fullsceen quads. The first (occluding) quad discards half the "
1505 "fragments in a grid pattern, the second (partially occluded) contains significant fragment shader work" << TestLog::EndMessage;
1506 log << TestLog::Message << "Workload indicates the number of iterations of dummy work done in the occluded quad's fragment shader" << TestLog::EndMessage;
1507 log << TestLog::Message << "The ratio of rendering times of this scene with/without depth testing are compared" << TestLog::EndMessage;
1508 log << TestLog::Message << "Successfull early Z-testing should result in depth testing halving the render time" << TestLog::EndMessage;
1509 log << TestLog::EndSection;
1510 }
1511
1512 const int m_gridsize;
1513 };
1514
1515 // Trivial occluder covering part of screen
1516 class PartialOccluderCullCase : public RelativeChangeCase
1517 {
1518 public:
PartialOccluderCullCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc,float coverage)1519 PartialOccluderCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc, float coverage)
1520 : RelativeChangeCase (testCtx, renderCtx, name, desc)
1521 , m_coverage (coverage)
1522 {
1523 }
~PartialOccluderCullCase(void)1524 ~PartialOccluderCullCase (void) {}
1525
1526 private:
genOccluderGeometry(void) const1527 virtual ObjectData genOccluderGeometry (void) const { return ObjectData(Utils::getBaseShader(), Utils::getPartScreenQuad(m_coverage, 0.2f)); }
genOccludedGeometry(void) const1528 virtual ObjectData genOccludedGeometry (void) const {return Utils::slowQuad(0.8f); }
1529
logDescription(void)1530 virtual void logDescription (void)
1531 {
1532 TestLog& log = m_testCtx.getLog();
1533
1534 log << TestLog::Section("Description", "Test description");
1535 log << TestLog::Message << "Testing effects of partial occluder on rendering time" << TestLog::EndMessage;
1536 log << TestLog::Message << "Geometry consists of two quads. The first (occluding) quad covers " << m_coverage*100.0f
1537 << "% of the screen, while the second (partially occluded, fullscreen) contains significant fragment shader work" << TestLog::EndMessage;
1538 log << TestLog::Message << "Workload indicates the number of iterations of dummy work done in the occluded quad's fragment shader" << TestLog::EndMessage;
1539 log << TestLog::Message << "The ratio of rendering times of this scene with/without depth testing are compared" << TestLog::EndMessage;
1540 log << TestLog::Message << "Successfull early Z-testing should result in render time increasing proportionally with unoccluded area" << TestLog::EndMessage;
1541 log << TestLog::EndSection;
1542 }
1543
1544 const float m_coverage;
1545 };
1546
1547 // Constant offset to frag depth in occluder
1548 class StaticOccluderFragDepthCullCase : public RelativeChangeCase
1549 {
1550 public:
StaticOccluderFragDepthCullCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1551 StaticOccluderFragDepthCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1552 : RelativeChangeCase(testCtx, renderCtx, name, desc)
1553 {
1554 }
1555
~StaticOccluderFragDepthCullCase(void)1556 ~StaticOccluderFragDepthCullCase (void) {}
1557
1558 private:
genOccluderGeometry(void) const1559 virtual ObjectData genOccluderGeometry (void) const { return Utils::quadWith(Utils::getStaticFragDepthFragmentShader(), 0.2f); }
genOccludedGeometry(void) const1560 virtual ObjectData genOccludedGeometry (void) const { return Utils::slowQuad(0.8f); }
1561
logDescription(void)1562 virtual void logDescription (void)
1563 {
1564 TestLog& log = m_testCtx.getLog();
1565
1566 log << TestLog::Section("Description", "Test description");
1567 log << TestLog::Message << "Testing effects of non-default frag depth on culling efficiency" << TestLog::EndMessage;
1568 log << TestLog::Message << "Geometry consists of two fullscreen quads. The first (occluding) quad is trivial, while the second (occluded) contains significant fragment shader work" << TestLog::EndMessage;
1569 log << TestLog::Message << "Workload indicates the number of iterations of dummy work done in the occluded quad's fragment shader" << TestLog::EndMessage;
1570 log << TestLog::Message << "The occluder quad has a static offset applied to gl_FragDepth" << TestLog::EndMessage;
1571 log << TestLog::Message << "The ratio of rendering times of this scene with/without depth testing are compared" << TestLog::EndMessage;
1572 log << TestLog::Message << "Successfull early Z-testing should result in no correlation between workload and render time" << TestLog::EndMessage;
1573 log << TestLog::EndSection;
1574 }
1575 };
1576
1577 // Dynamic offset to frag depth in occluder
1578 class DynamicOccluderFragDepthCullCase : public RelativeChangeCase
1579 {
1580 public:
DynamicOccluderFragDepthCullCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1581 DynamicOccluderFragDepthCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1582 : RelativeChangeCase(testCtx, renderCtx, name, desc)
1583 {
1584 }
1585
~DynamicOccluderFragDepthCullCase(void)1586 ~DynamicOccluderFragDepthCullCase (void) {}
1587
1588 private:
genOccluderGeometry(void) const1589 virtual ObjectData genOccluderGeometry (void) const { return Utils::quadWith(Utils::getDynamicFragDepthFragmentShader(), 0.2f); }
genOccludedGeometry(void) const1590 virtual ObjectData genOccludedGeometry (void) const { return Utils::slowQuad(0.8f); }
1591
logDescription(void)1592 virtual void logDescription (void)
1593 {
1594 TestLog& log = m_testCtx.getLog();
1595
1596 log << TestLog::Section("Description", "Test description");
1597 log << TestLog::Message << "Testing effects of non-default frag depth on culling efficiency" << TestLog::EndMessage;
1598 log << TestLog::Message << "Geometry consists of two fullscreen quads. The first (occluding) quad is trivial, while the second (occluded) contains significant fragment shader work" << TestLog::EndMessage;
1599 log << TestLog::Message << "Workload indicates the number of iterations of dummy work done in the occluded quad's fragment shader" << TestLog::EndMessage;
1600 log << TestLog::Message << "The occluder quad has a dynamic offset applied to gl_FragDepth" << TestLog::EndMessage;
1601 log << TestLog::Message << "The ratio of rendering times of this scene with/without depth testing are compared" << TestLog::EndMessage;
1602 log << TestLog::Message << "Successfull early Z-testing should result in no correlation between workload and render time" << TestLog::EndMessage;
1603 log << TestLog::EndSection;
1604 }
1605 };
1606
1607 // Constant offset to frag depth in occluded
1608 class StaticOccludedFragDepthCullCase : public RelativeChangeCase
1609 {
1610 public:
StaticOccludedFragDepthCullCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1611 StaticOccludedFragDepthCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1612 : RelativeChangeCase(testCtx, renderCtx, name, desc)
1613 {
1614 }
1615
~StaticOccludedFragDepthCullCase(void)1616 ~StaticOccludedFragDepthCullCase (void) {}
1617
1618 private:
genOccluderGeometry(void) const1619 virtual ObjectData genOccluderGeometry (void) const { return Utils::fastQuad(0.2f); }
genOccludedGeometry(void) const1620 virtual ObjectData genOccludedGeometry (void) const { return Utils::quadWith(Utils::getStaticFragDepthArithmeticWorkloadFragmentShader(), 0.2f); }
1621
logDescription(void)1622 virtual void logDescription (void)
1623 {
1624 TestLog& log = m_testCtx.getLog();
1625
1626 log << TestLog::Section("Description", "Test description");
1627 log << TestLog::Message << "Testing effects of non-default frag depth on rendering time" << TestLog::EndMessage;
1628 log << TestLog::Message << "Geometry consists of two fullscreen quads. The first (occluding) quad is trivial, while the second (occluded) contains significant fragment shader work" << TestLog::EndMessage;
1629 log << TestLog::Message << "Workload indicates the number of iterations of dummy work done in the occluded quad's fragment shader" << TestLog::EndMessage;
1630 log << TestLog::Message << "The occluded quad has a static offset applied to gl_FragDepth" << TestLog::EndMessage;
1631 log << TestLog::Message << "The ratio of rendering times of this scene with/without depth testing are compared" << TestLog::EndMessage;
1632 log << TestLog::Message << "Successfull early Z-testing should result in no correlation between workload and render time" << TestLog::EndMessage;
1633 log << TestLog::EndSection;
1634 }
1635 };
1636
1637 // Dynamic offset to frag depth in occluded
1638 class DynamicOccludedFragDepthCullCase : public RelativeChangeCase
1639 {
1640 public:
DynamicOccludedFragDepthCullCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1641 DynamicOccludedFragDepthCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1642 : RelativeChangeCase(testCtx, renderCtx, name, desc)
1643 {
1644 }
1645
~DynamicOccludedFragDepthCullCase(void)1646 ~DynamicOccludedFragDepthCullCase (void) {}
1647
1648 private:
genOccluderGeometry(void) const1649 virtual ObjectData genOccluderGeometry (void) const { return Utils::fastQuad(0.2f); }
genOccludedGeometry(void) const1650 virtual ObjectData genOccludedGeometry (void) const { return Utils::quadWith(Utils::getDynamicFragDepthArithmeticWorkloadFragmentShader(), 0.2f); }
1651
logDescription(void)1652 virtual void logDescription (void)
1653 {
1654 TestLog& log = m_testCtx.getLog();
1655
1656 log << TestLog::Section("Description", "Test description");
1657 log << TestLog::Message << "Testing effects of non-default frag depth on rendering time" << TestLog::EndMessage;
1658 log << TestLog::Message << "Geometry consists of two fullscreen quads. The first (occluding) quad is trivial, while the second (occluded) contains significant fragment shader work" << TestLog::EndMessage;
1659 log << TestLog::Message << "Workload indicates the number of iterations of dummy work done in the occluded quad's fragment shader" << TestLog::EndMessage;
1660 log << TestLog::Message << "The occluded quad has a dynamic offset applied to gl_FragDepth" << TestLog::EndMessage;
1661 log << TestLog::Message << "The ratio of rendering times of this scene with/without depth testing are compared" << TestLog::EndMessage;
1662 log << TestLog::Message << "Successfull early Z-testing should result in no correlation between workload and render time" << TestLog::EndMessage;
1663 log << TestLog::EndSection;
1664 }
1665 };
1666
1667 // Dynamic offset to frag depth in occluded
1668 class ReversedDepthOrderCullCase : public RelativeChangeCase
1669 {
1670 public:
ReversedDepthOrderCullCase(TestContext & testCtx,const RenderContext & renderCtx,const char * name,const char * desc)1671 ReversedDepthOrderCullCase (TestContext& testCtx, const RenderContext& renderCtx, const char* name, const char* desc)
1672 : RelativeChangeCase(testCtx, renderCtx, name, desc)
1673 {
1674 }
1675
~ReversedDepthOrderCullCase(void)1676 ~ReversedDepthOrderCullCase (void) {}
1677
1678 private:
genOccluderGeometry(void) const1679 virtual ObjectData genOccluderGeometry (void) const { return Utils::fastQuad(0.2f); }
genOccludedGeometry(void) const1680 virtual ObjectData genOccludedGeometry (void) const { return Utils::slowQuad(0.8f); }
1681
logDescription(void)1682 virtual void logDescription (void)
1683 {
1684 TestLog& log = m_testCtx.getLog();
1685
1686 log << TestLog::Section("Description", "Test description");
1687 log << TestLog::Message << "Testing effects of of back first rendering order on culling efficiency" << TestLog::EndMessage;
1688 log << TestLog::Message << "Geometry consists of two fullscreen quads. The second (occluding) quad is trivial, while the first (occluded) contains significant fragment shader work" << TestLog::EndMessage;
1689 log << TestLog::Message << "Workload indicates the number of iterations of dummy work done in the occluded quad's fragment shader" << TestLog::EndMessage;
1690 log << TestLog::Message << "The ratio of rendering times of this scene with/without depth testing are compared" << TestLog::EndMessage;
1691 log << TestLog::Message << "Successfull early Z-testing should result in no correlation between workload and render time" << TestLog::EndMessage;
1692 log << TestLog::EndSection;
1693 }
1694
1695 // Rendering order of occluder & occluded is reversed, otherwise identical to parent version
renderSample(const RenderData & occluder,const RenderData & occluded,int workload) const1696 Sample renderSample (const RenderData& occluder, const RenderData& occluded, int workload) const
1697 {
1698 const glw::Functions& gl = m_renderCtx.getFunctions();
1699 const GLuint program = occluded.m_program.getProgram();
1700 Sample sample;
1701 deUint64 now = 0;
1702 deUint64 prev = 0;
1703 deUint8 buffer[4];
1704
1705 gl.useProgram(program);
1706 gl.uniform1i(gl.getUniformLocation(program, "u_iterations"), workload);
1707
1708 // Warmup (this workload seems to reduce variation in following workloads)
1709 {
1710 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
1711 gl.disable(GL_DEPTH_TEST);
1712
1713 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
1714 }
1715
1716 // Null time
1717 {
1718 prev = deGetMicroseconds();
1719
1720 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
1721 gl.disable(GL_DEPTH_TEST);
1722
1723 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
1724
1725 now = deGetMicroseconds();
1726
1727 sample.nullTime = now - prev;
1728 }
1729
1730 // Test time
1731 {
1732 prev = deGetMicroseconds();
1733
1734 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
1735 gl.enable(GL_DEPTH_TEST);
1736
1737 render(occluded);
1738 render(occluder);
1739
1740 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
1741
1742 now = deGetMicroseconds();
1743
1744 sample.testTime = now - prev;
1745 }
1746
1747 // Base time
1748 {
1749 prev = deGetMicroseconds();
1750
1751 gl.clear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);
1752 gl.disable(GL_DEPTH_TEST);
1753
1754 render(occluded);
1755 render(occluder);
1756
1757 gl.readPixels(0, 0, 1, 1, GL_RGBA, GL_UNSIGNED_BYTE, buffer);
1758
1759 now = deGetMicroseconds();
1760
1761 sample.baseTime = now - prev;
1762 }
1763
1764 sample.workload = 0;
1765
1766 return sample;
1767 }
1768 };
1769
1770 } // Anonymous
1771
DepthTests(Context & context)1772 DepthTests::DepthTests (Context& context)
1773 : TestCaseGroup (context, "depth", "Depth culling performance")
1774 {
1775 }
1776
init(void)1777 void DepthTests::init (void)
1778 {
1779 TestContext& testCtx = m_context.getTestContext();
1780 const RenderContext& renderCtx = m_context.getRenderContext();
1781
1782 {
1783 tcu::TestCaseGroup* const cullEfficiencyGroup = new tcu::TestCaseGroup(m_testCtx, "cull_efficiency", "Fragment cull efficiency");
1784
1785 addChild(cullEfficiencyGroup);
1786
1787 {
1788 tcu::TestCaseGroup* const group = new tcu::TestCaseGroup(m_testCtx, "workload", "Workload");
1789
1790 cullEfficiencyGroup->addChild(group);
1791
1792 group->addChild(new FragmentTextureWorkloadCullCase( testCtx, renderCtx, "workload_texture", "Fragment shader with texture lookup workload"));
1793 group->addChild(new FragmentArithmeticWorkloadCullCase( testCtx, renderCtx, "workload_arithmetic", "Fragment shader with arithmetic workload"));
1794 group->addChild(new FragmentDiscardArithmeticWorkloadCullCase( testCtx, renderCtx, "workload_arithmetic_discard", "Fragment shader that may discard with arithmetic workload"));
1795 }
1796
1797 {
1798 tcu::TestCaseGroup* const group = new tcu::TestCaseGroup(m_testCtx, "occluder_discard", "Discard");
1799
1800 cullEfficiencyGroup->addChild(group);
1801
1802 group->addChild(new PartialOccluderDiscardCullCase(testCtx, renderCtx, "grid_256", "Parts of occluder geometry discarded", 256));
1803 group->addChild(new PartialOccluderDiscardCullCase(testCtx, renderCtx, "grid_128", "Parts of occluder geometry discarded", 128));
1804 group->addChild(new PartialOccluderDiscardCullCase(testCtx, renderCtx, "grid_64", "Parts of occluder geometry discarded", 64));
1805 group->addChild(new PartialOccluderDiscardCullCase(testCtx, renderCtx, "grid_32", "Parts of occluder geometry discarded", 32));
1806 group->addChild(new PartialOccluderDiscardCullCase(testCtx, renderCtx, "grid_16", "Parts of occluder geometry discarded", 16));
1807 group->addChild(new PartialOccluderDiscardCullCase(testCtx, renderCtx, "grid_8", "Parts of occluder geometry discarded", 8));
1808 group->addChild(new PartialOccluderDiscardCullCase(testCtx, renderCtx, "grid_4", "Parts of occluder geometry discarded", 4));
1809 group->addChild(new PartialOccluderDiscardCullCase(testCtx, renderCtx, "grid_2", "Parts of occluder geometry discarded", 2));
1810 group->addChild(new PartialOccluderDiscardCullCase(testCtx, renderCtx, "grid_1", "Parts of occluder geometry discarded", 1));
1811 }
1812
1813 {
1814 tcu::TestCaseGroup* const group = new tcu::TestCaseGroup(m_testCtx, "partial_coverage", "Partial Coverage");
1815
1816 cullEfficiencyGroup->addChild(group);
1817
1818 group->addChild(new PartialOccluderCullCase(testCtx, renderCtx, "100", "Occluder covering only part of occluded geometry", 1.00f));
1819 group->addChild(new PartialOccluderCullCase(testCtx, renderCtx, "099", "Occluder covering only part of occluded geometry", 0.99f));
1820 group->addChild(new PartialOccluderCullCase(testCtx, renderCtx, "095", "Occluder covering only part of occluded geometry", 0.95f));
1821 group->addChild(new PartialOccluderCullCase(testCtx, renderCtx, "090", "Occluder covering only part of occluded geometry", 0.90f));
1822 group->addChild(new PartialOccluderCullCase(testCtx, renderCtx, "080", "Occluder covering only part of occluded geometry", 0.80f));
1823 group->addChild(new PartialOccluderCullCase(testCtx, renderCtx, "070", "Occluder covering only part of occluded geometry", 0.70f));
1824 group->addChild(new PartialOccluderCullCase(testCtx, renderCtx, "050", "Occluder covering only part of occluded geometry", 0.50f));
1825 group->addChild(new PartialOccluderCullCase(testCtx, renderCtx, "025", "Occluder covering only part of occluded geometry", 0.25f));
1826 group->addChild(new PartialOccluderCullCase(testCtx, renderCtx, "010", "Occluder covering only part of occluded geometry", 0.10f));
1827 }
1828
1829 {
1830 tcu::TestCaseGroup* const group = new tcu::TestCaseGroup(m_testCtx, "frag_depth", "Partial Coverage");
1831
1832 cullEfficiencyGroup->addChild(group);
1833
1834 group->addChild(new StaticOccluderFragDepthCullCase( testCtx, renderCtx, "occluder_static", ""));
1835 group->addChild(new DynamicOccluderFragDepthCullCase(testCtx, renderCtx, "occluder_dynamic", ""));
1836 group->addChild(new StaticOccludedFragDepthCullCase( testCtx, renderCtx, "occluded_static", ""));
1837 group->addChild(new DynamicOccludedFragDepthCullCase(testCtx, renderCtx, "occluded_dynamic", ""));
1838 }
1839
1840 {
1841 tcu::TestCaseGroup* const group = new tcu::TestCaseGroup(m_testCtx, "order", "Rendering order");
1842
1843 cullEfficiencyGroup->addChild(group);
1844
1845 group->addChild(new ReversedDepthOrderCullCase(testCtx, renderCtx, "reversed", "Back to front rendering order"));
1846 }
1847 }
1848
1849 {
1850 tcu::TestCaseGroup* const testCostGroup = new tcu::TestCaseGroup(m_testCtx, "culled_pixel_cost", "Fragment cull efficiency");
1851
1852 addChild(testCostGroup);
1853
1854 {
1855 tcu::TestCaseGroup* const group = new tcu::TestCaseGroup(m_testCtx, "gradient", "Gradients with small depth differences");
1856
1857 testCostGroup->addChild(group);
1858
1859 group->addChild(new BaseCostCase(testCtx, renderCtx, "flat", ""));
1860 group->addChild(new GradientCostCase(testCtx, renderCtx, "gradient_050", "", 0.50f));
1861 group->addChild(new GradientCostCase(testCtx, renderCtx, "gradient_010", "", 0.10f));
1862 group->addChild(new GradientCostCase(testCtx, renderCtx, "gradient_005", "", 0.05f));
1863 group->addChild(new GradientCostCase(testCtx, renderCtx, "gradient_002", "", 0.02f));
1864 group->addChild(new GradientCostCase(testCtx, renderCtx, "gradient_001", "", 0.01f));
1865 }
1866
1867 {
1868 tcu::TestCaseGroup* const group = new tcu::TestCaseGroup(m_testCtx, "occluder_geometry", "Occluders with varying geometry complexity");
1869
1870 testCostGroup->addChild(group);
1871
1872 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "flat_uniform_grid_5", "", 5, 0.0f, 0.0f));
1873 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "flat_uniform_grid_15", "", 15, 0.0f, 0.0f));
1874 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "flat_uniform_grid_25", "", 25, 0.0f, 0.0f));
1875 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "flat_uniform_grid_50", "", 50, 0.0f, 0.0f));
1876 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "flat_uniform_grid_100", "", 100, 0.0f, 0.0f));
1877
1878 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "flat_noisy_grid_5", "", 5, 1.0f/5.0f, 0.0f));
1879 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "flat_noisy_grid_15", "", 15, 1.0f/15.0f, 0.0f));
1880 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "flat_noisy_grid_25", "", 25, 1.0f/25.0f, 0.0f));
1881 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "flat_noisy_grid_50", "", 50, 1.0f/50.0f, 0.0f));
1882 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "flat_noisy_grid_100", "", 100, 1.0f/100.0f, 0.0f));
1883
1884 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "uneven_uniform_grid_5", "", 5, 0.0f, 0.2f));
1885 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "uneven_uniform_grid_15", "", 15, 0.0f, 0.2f));
1886 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "uneven_uniform_grid_25", "", 25, 0.0f, 0.2f));
1887 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "uneven_uniform_grid_50", "", 50, 0.0f, 0.2f));
1888 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "uneven_uniform_grid_100", "", 100, 0.0f, 0.2f));
1889
1890 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "uneven_noisy_grid_5", "", 5, 1.0f/5.0f, 0.2f));
1891 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "uneven_noisy_grid_15", "", 15, 1.0f/15.0f, 0.2f));
1892 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "uneven_noisy_grid_25", "", 25, 1.0f/25.0f, 0.2f));
1893 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "uneven_noisy_grid_50", "", 50, 1.0f/50.0f, 0.2f));
1894 group->addChild(new OccludingGeometryComplexityCostCase(testCtx, renderCtx, "uneven_noisy_grid_100", "", 100, 1.0f/100.0f, 0.2f));
1895 }
1896
1897 {
1898 tcu::TestCaseGroup* const group = new tcu::TestCaseGroup(m_testCtx, "frag_depth", "Modifying gl_FragDepth");
1899
1900 testCostGroup->addChild(group);
1901
1902 group->addChild(new OccluderStaticFragDepthCostCase( testCtx, renderCtx, "occluder_static", ""));
1903 group->addChild(new OccluderDynamicFragDepthCostCase(testCtx, renderCtx, "occluder_dynamic", ""));
1904 group->addChild(new OccludedStaticFragDepthCostCase( testCtx, renderCtx, "occluded_static", ""));
1905 group->addChild(new OccludedDynamicFragDepthCostCase(testCtx, renderCtx, "occluded_dynamic", ""));
1906 }
1907 }
1908 }
1909
1910 } // Performance
1911 } // gles3
1912 } // deqp
1913