1 /**************************************************************************
3 * Copyright 2011 Jose Fonseca
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
24 **************************************************************************/
29 #include "retrace.hpp"
31 #include "glstate.hpp"
32 #include "glretrace.hpp"
33 #include "os_time.hpp"
35 /* Synchronous debug output may reduce performance; however,
36 * without it the callNo reported by the callback may be inaccurate,
37 * as the callback may be invoked at any time.
/* Compile-time switch tested where the debug-message callback is installed:
 * a non-zero value makes that code enable GL_DEBUG_OUTPUT_SYNCHRONOUS_ARB. */
39 #define DEBUG_OUTPUT_SYNCHRONOUS 0
/* Replay-state flags.  insideGlBeginEnd is consulted by GLDumper::dumpState;
 * insideList is not read anywhere in the visible part of this file. */
43 bool insideList = false;
44 bool insideGlBeginEnd = false;
/* Signature of a profiled call; read as query.sig->name when a CallQuery is
 * reported to the profiler.
 * NOTE(review): the enclosing declaration is not visible here -- presumably
 * this is a member of CallQuery; confirm. */
52 const trace::FunctionSig *sig;
/* Extension-support flags.  They start out true and are overwritten with
 * hasExtension() results for the current context during context set-up. */
57 static bool supportsElapsed = true;
58 static bool supportsTimestamp = true;
59 static bool supportsOcclusion = true;
60 static bool supportsDebugOutput = true;
/* Profiling records: beginProfile appends one per call and each entry is
 * later handed to completeCallQuery. */
62 static std::list<CallQuery> callQueries;
/* Forward declaration; the definition appears further down and its address
 * is passed to glDebugMessageCallbackARB. */
65 debugOutputCallback(GLenum source, GLenum type, GLuint id, GLenum severity, GLsizei length, const GLchar* message, GLvoid* userParam);
/* Reports the pending OpenGL errors for the given call.
 *
 * glGetError() is polled until it returns GL_NO_ERROR.  For every error
 * code a warning stream is obtained through retrace::warning(call) and the
 * symbolic name of the error is written to it.
 *
 * call: the trace call the warnings are attributed to.
 */
68 checkGlError(trace::Call &call) {
69 GLenum error = glGetError();
70 while (error != GL_NO_ERROR) {
71 std::ostream & os = retrace::warning(call);
/* Translate the numeric error code into its symbolic name. */
79 os << "GL_INVALID_ENUM";
81 case GL_INVALID_VALUE:
82 os << "GL_INVALID_VALUE";
84 case GL_INVALID_OPERATION:
85 os << "GL_INVALID_OPERATION";
87 case GL_STACK_OVERFLOW:
88 os << "GL_STACK_OVERFLOW";
90 case GL_STACK_UNDERFLOW:
91 os << "GL_STACK_UNDERFLOW";
93 case GL_OUT_OF_MEMORY:
94 os << "GL_OUT_OF_MEMORY";
96 case GL_INVALID_FRAMEBUFFER_OPERATION:
97 os << "GL_INVALID_FRAMEBUFFER_OPERATION";
99 case GL_TABLE_TOO_LARGE:
100 os << "GL_TABLE_TOO_LARGE";
/* Fetch the next error code; the loop ends once GL_NO_ERROR comes back. */
108 error = glGetError();
/* Samples the current CPU and GPU clocks into the two out-parameters.
 *
 * cpuTime: receives os::getTime() when retrace::profilingCpuTimes is set.
 * gpuTime: receives the result of a GL_TIMESTAMP query when
 *          retrace::profilingGpuTimes is set and supportsTimestamp is true.
 *
 * What the outputs hold when the corresponding mode is disabled is not
 * visible in this excerpt.
 */
113 getCurrentTimes(int64_t& cpuTime, int64_t& gpuTime) {
/* Create a temporary query object, record a timestamp into it and read the
 * result back.
 * NOTE(review): reading GL_QUERY_RESULT normally waits for the result to
 * become available -- confirm that this stall is acceptable here. */
116 if (retrace::profilingGpuTimes && supportsTimestamp) {
117 glGenQueries(1, &query);
118 glQueryCounter(query, GL_TIMESTAMP);
119 glGetQueryObjecti64vEXT(query, GL_QUERY_RESULT, &gpuTime);
124 if (retrace::profilingCpuTimes) {
125 cpuTime = os::getTime();
/* Release the temporary query under the same condition that created it. */
130 if (retrace::profilingGpuTimes && supportsTimestamp) {
131 glDeleteQueries(1, &query);
/* Collects the results recorded for one profiled call and reports them to
 * retrace::profiler.
 *
 * query: the record to complete.  ids[0] is read as the GPU start
 *        timestamp, ids[1] as the GPU duration and ids[2] as the pixel
 *        count; cpuStart/cpuEnd supply the CPU duration.
 *
 * Every local result starts at 0, so a value that is not collected is
 * reported as 0 unless a line not visible here assigns it.
 * NOTE(review): some enclosing conditions of this block are not visible in
 * this excerpt.
 */
136 completeCallQuery(CallQuery& query) {
137 /* Get call start and duration */
138 int64_t gpuStart = 0, gpuDuration = 0, cpuDuration = 0, pixels = 0;
141 if (retrace::profilingGpuTimes) {
/* The start timestamp is only read when timestamp queries are supported. */
142 if (supportsTimestamp) {
143 glGetQueryObjecti64vEXT(query.ids[0], GL_QUERY_RESULT, &gpuStart);
146 glGetQueryObjecti64vEXT(query.ids[1], GL_QUERY_RESULT, &gpuDuration);
149 if (retrace::profilingPixelsDrawn) {
150 glGetQueryObjecti64vEXT(query.ids[2], GL_QUERY_RESULT, &pixels);
/* All three query objects are released together. */
153 glDeleteQueries(3, query.ids);
158 if (retrace::profilingCpuTimes) {
159 cpuDuration = query.cpuEnd - query.cpuStart;
162 /* Add call to profile */
163 retrace::profiler.addCall(query.call, query.sig->name, query.program, pixels, gpuStart, gpuDuration, query.cpuStart, cpuDuration);
/* Walk the recorded call queries in insertion order and complete each one.
 * NOTE(review): the header of the enclosing function is not visible here --
 * presumably this is the body of flushQueries(); whether the list is emptied
 * afterwards cannot be told from this excerpt. */
168 for (std::list<CallQuery>::iterator itr = callQueries.begin(); itr != callQueries.end(); ++itr) {
169 completeCallQuery(*itr);
/* Starts profiling of one call.
 *
 * Fills a CallQuery with the call number, signature and the active program
 * of the current context (0 when there is no current context), starts the
 * GPU queries, appends the record to callQueries and finally stamps the CPU
 * start time.
 *
 * call:   the call about to be replayed.
 * isDraw: stored in the record as query.isDraw.
 */
176 beginProfile(trace::Call &call, bool isDraw) {
177 glretrace::Context *currentContext = glretrace::getCurrentContext();
179 /* Create call query */
181 query.isDraw = isDraw;
182 query.call = call.no;
183 query.sig = call.sig;
184 query.program = currentContext ? currentContext->activeProgram : 0;
186 /* GPU profiling only for draw calls */
/* Three query objects: ids[0] timestamp, ids[1] elapsed time,
 * ids[2] samples passed. */
188 glGenQueries(3, query.ids);
190 if (retrace::profilingGpuTimes) {
191 if (supportsTimestamp) {
192 glQueryCounter(query.ids[0], GL_TIMESTAMP);
195 glBeginQuery(GL_TIME_ELAPSED, query.ids[1]);
198 if (retrace::profilingPixelsDrawn) {
199 glBeginQuery(GL_SAMPLES_PASSED, query.ids[2]);
/* The list stores a copy of the record. */
203 callQueries.push_back(query);
205 /* CPU profiling for all calls */
/* cpuStart is written on the stored element, after the push_back. */
206 if (retrace::profilingCpuTimes) {
207 callQueries.back().cpuStart = os::getTime();
/* Finishes profiling of the call started by the matching beginProfile.
 *
 * The CPU time is sampled first, before any other work in this function.
 * The GL_TIME_ELAPSED and GL_SAMPLES_PASSED queries are ended under the
 * same profiling flags that guard the glBeginQuery calls in beginProfile.
 *
 * call:   not referenced in the visible lines.
 * isDraw: not referenced in the visible lines; per the comment below it is
 *         presumably tested on a line not shown here.
 */
212 endProfile(trace::Call &call, bool isDraw) {
213 GLint64 time = os::getTime();
215 /* CPU profiling for all calls */
/* The most recently appended record is the one being completed.
 * NOTE(review): the statement that stores `time` into it is not visible
 * in this excerpt. */
216 if (retrace::profilingCpuTimes) {
217 CallQuery& query = callQueries.back();
221 /* GPU profiling only for draw calls */
223 if (retrace::profilingGpuTimes) {
224 glEndQuery(GL_TIME_ELAPSED);
227 if (retrace::profilingPixelsDrawn) {
228 glEndQuery(GL_SAMPLES_PASSED);
/* Per-context set-up: detects extension support, validates that the
 * requested profiling modes can run, installs the debug-message callback
 * and establishes the profiler's base times.
 * NOTE(review): the header of the enclosing function is not visible in this
 * excerpt, and neither is what follows each error message below. */
235 glretrace::Context *currentContext = glretrace::getCurrentContext();
237 /* Ensure we have adequate extension support */
238 assert(currentContext);
239 supportsTimestamp = currentContext->hasExtension("GL_ARB_timer_query");
/* Elapsed-time queries count as supported whenever timestamps are. */
240 supportsElapsed = currentContext->hasExtension("GL_EXT_timer_query") || supportsTimestamp;
241 supportsOcclusion = currentContext->hasExtension("GL_ARB_occlusion_query");
242 supportsDebugOutput = currentContext->hasExtension("GL_ARB_debug_output");
244 /* Check for timer query support */
245 if (retrace::profilingGpuTimes) {
/* NOTE(review): supportsElapsed is already true whenever supportsTimestamp
 * is, so this condition is equivalent to !supportsElapsed. */
246 if (!supportsTimestamp && !supportsElapsed) {
247 std::cout << "Error: Cannot run profile, GL_EXT_timer_query extension is not supported." << std::endl;
/* Ask how many counter bits the GL_TIME_ELAPSED target provides. */
252 glGetQueryiv(GL_TIME_ELAPSED, GL_QUERY_COUNTER_BITS, &bits);
255 std::cout << "Error: Cannot run profile, GL_QUERY_COUNTER_BITS == 0." << std::endl;
260 /* Check for occlusion query support */
261 if (retrace::profilingPixelsDrawn && !supportsOcclusion) {
262 std::cout << "Error: Cannot run profile, GL_ARB_occlusion_query extension is not supported." << std::endl;
266 /* Setup debug message call back */
267 if (retrace::debug && supportsDebugOutput) {
/* NOTE(review): this re-declares currentContext, which was already fetched
 * at the top of this block; the value is passed as the callback's user
 * parameter. */
268 glretrace::Context *currentContext = glretrace::getCurrentContext();
269 glDebugMessageCallbackARB(&debugOutputCallback, currentContext);
271 if (DEBUG_OUTPUT_SYNCHRONOUS) {
272 glEnable(GL_DEBUG_OUTPUT_SYNCHRONOUS_ARB);
276 /* Sync the gpu and cpu start times */
277 if (retrace::profilingCpuTimes || retrace::profilingGpuTimes) {
/* The base times are only set while the profiler reports having none. */
278 if (!retrace::profiler.hasBaseTimes()) {
/* NOTE(review): getCurrentTimes takes int64_t references; this relies on
 * GLint64 being the same type as int64_t -- confirm on all platforms. */
279 GLint64 gpuTime, cpuTime;
281 getCurrentTimes(cpuTime, gpuTime);
282 retrace::profiler.setBaseCpuTime(cpuTime);
283 retrace::profiler.setBaseGpuTime(gpuTime);
/* End-of-frame handling for the given call.
 *
 * When retrace::profiling is set and CPU or GPU timing is enabled, the
 * current CPU and GPU times are sampled and made relative to the profiler's
 * base times.  The CPU delta is scaled by 1.0E9 / os::timeFrequency
 * (presumably converting CPU ticks to nanoseconds -- confirm the units) and
 * subtracted from the GPU delta; that difference is added to the profiler's
 * GPU base time.  retrace::profiler.addFrameEnd() is then called.
 *
 * After the profiling part, retrace::frameComplete(call) is invoked and, in
 * debug mode, a warning is emitted when the current drawable is not visible.
 *
 * call: the call that ended the frame; used for frameComplete and for the
 *       warning.
 */
289 frame_complete(trace::Call &call) {
290 if (retrace::profiling) {
291 /* Complete any remaining queries */
294 /* GPU time drifts due to being relative times, not absolute and can be
295 * affected by the gpu switch between processes.
297 * To attempt to compensate we resynchronise on frame end however there is
298 * still noticeable drift within a single frame which we do not account for.
300 if (retrace::profilingCpuTimes || retrace::profilingGpuTimes) {
301 int64_t cpuTime, gpuTime, error;
303 getCurrentTimes(cpuTime, gpuTime);
304 cpuTime = cpuTime - retrace::profiler.getBaseCpuTime();
305 gpuTime = gpuTime - retrace::profiler.getBaseGpuTime();
306 error = gpuTime - cpuTime * (1.0E9 / os::timeFrequency);
308 retrace::profiler.setBaseGpuTime(retrace::profiler.getBaseGpuTime() + error);
311 /* Indicate end of current frame */
312 retrace::profiler.addFrameEnd();
315 retrace::frameComplete(call);
/* The handling of a missing current context is not visible in this excerpt;
 * the code below dereferences currentContext. */
317 glretrace::Context *currentContext = glretrace::getCurrentContext();
318 if (!currentContext) {
322 assert(currentContext->drawable);
323 if (retrace::debug && !currentContext->drawable->visible) {
324 retrace::warning(call) << "could not infer drawable size (glViewport never called)\n";
/* Maps a GL_DEBUG_SOURCE_*_ARB value to a human-readable string literal.
 *
 * source: the source enum passed to the debug-message callback.
 *
 * The strings returned for GL_DEBUG_SOURCE_API_ARB and
 * GL_DEBUG_SOURCE_OTHER_ARB are not visible in this excerpt.
 */
329 getDebugOutputSource(GLenum source) {
331 case GL_DEBUG_SOURCE_API_ARB:
333 case GL_DEBUG_SOURCE_WINDOW_SYSTEM_ARB:
334 return "Window System";
335 case GL_DEBUG_SOURCE_SHADER_COMPILER_ARB:
336 return "Shader Compiler";
337 case GL_DEBUG_SOURCE_THIRD_PARTY_ARB:
338 return "Third Party";
339 case GL_DEBUG_SOURCE_APPLICATION_ARB:
340 return "Application";
341 case GL_DEBUG_SOURCE_OTHER_ARB:
/* Maps a GL_DEBUG_TYPE_*_ARB value to a human-readable string literal.
 *
 * type: the type enum passed to the debug-message callback.
 *
 * The string returned for GL_DEBUG_TYPE_ERROR_ARB is not visible in this
 * excerpt.
 */
348 getDebugOutputType(GLenum type) {
350 case GL_DEBUG_TYPE_ERROR_ARB:
352 case GL_DEBUG_TYPE_DEPRECATED_BEHAVIOR_ARB:
353 return "deprecated behaviour";
354 case GL_DEBUG_TYPE_UNDEFINED_BEHAVIOR_ARB:
355 return "undefined behaviour";
356 case GL_DEBUG_TYPE_PORTABILITY_ARB:
357 return "portability issue";
358 case GL_DEBUG_TYPE_PERFORMANCE_ARB:
359 return "performance issue";
/* NOTE(review): a line between this label and the return below is not
 * visible -- presumably a default label shares this return; confirm. */
360 case GL_DEBUG_TYPE_OTHER_ARB:
362 return "unknown issue";
/* Maps a GL_DEBUG_SEVERITY_*_ARB value to the text that the debug-message
 * callback prints in front of the word "severity".
 *
 * severity: the severity enum passed to the debug-message callback.
 *
 * The returned strings themselves are not visible in this excerpt.
 */
367 getDebugOutputSeverity(GLenum severity) {
369 case GL_DEBUG_SEVERITY_HIGH_ARB:
371 case GL_DEBUG_SEVERITY_MEDIUM_ARB:
373 case GL_DEBUG_SEVERITY_LOW_ARB:
/* Debug-message callback: prints one line per message to std::cerr in the
 * form
 *
 *   <callNo>: glDebugOutputCallback: <severity> severity <source> <type> <id>, <message>
 *
 * source, type, severity: translated with the getDebugOutput* helpers.
 * id:        printed as a number.
 * message:   printed as a C string.
 * length, userParam: not used in the visible lines.
 *
 * retrace::callNo is read at the time the callback runs.
 */
381 debugOutputCallback(GLenum source, GLenum type, GLuint id, GLenum severity, GLsizei length, const GLchar* message, GLvoid* userParam) {
382 std::cerr << retrace::callNo << ": ";
383 std::cerr << "glDebugOutputCallback: ";
384 std::cerr << getDebugOutputSeverity(severity) << " severity ";
385 std::cerr << getDebugOutputSource(source) << " " << getDebugOutputType(type);
386 std::cerr << " " << id;
387 std::cerr << ", " << message;
/* std::endl also flushes the stream after every message. */
388 std::cerr << std::endl;
391 } /* namespace glretrace */
/* retrace::Dumper implementation that takes images and state dumps from
 * glstate for the current GL context. */
394 class GLDumper : public retrace::Dumper {
/* Fragment of a method whose signature is not visible in this excerpt: it
 * tests whether there is no current context (the handling of that case is
 * not shown) and returns glstate::getDrawBufferImage(). */
398 if (!glretrace::getCurrentContext()) {
401 return glstate::getDrawBufferImage();
/* Writes the state of the current context to os through
 * glstate::dumpCurrentContext.  The guard in front of it involves
 * glretrace::insideGlBeginEnd; the rest of the condition and the action
 * taken when it holds are not visible in this excerpt. */
405 dumpState(std::ostream &os) {
406 glretrace::Context *currentContext = glretrace::getCurrentContext();
407 if (glretrace::insideGlBeginEnd ||
411 glstate::dumpCurrentContext(os);
/* File-local dumper instance. */
416 static GLDumper glDumper;
/* Definition of retrace::setUp, which takes no arguments.
 * NOTE(review): the body is not visible in this excerpt. */
420 retrace::setUp(void) {
/* Registers the callback tables of this retracer with the given Retracer.
 *
 * retracer: receives, in this order, the gl, glx, wgl, cgl and egl callback
 *           tables declared in the glretrace namespace.
 */
427 retrace::addCallbacks(retrace::Retracer &retracer)
429 retracer.addCallbacks(glretrace::gl_callbacks);
430 retracer.addCallbacks(glretrace::glx_callbacks);
431 retracer.addCallbacks(glretrace::wgl_callbacks);
432 retracer.addCallbacks(glretrace::cgl_callbacks);
433 retracer.addCallbacks(glretrace::egl_callbacks);
/* Flushes outstanding work for the current context.
 *
 * When a current context exists, glretrace::flushQueries() is called; with
 * no current context that call is skipped.  Any further statements of this
 * function are not visible in this excerpt.
 */
438 retrace::flushRendering(void) {
439 glretrace::Context *currentContext = glretrace::getCurrentContext();
440 if (currentContext) {
441 glretrace::flushQueries();
/* Keeps calling glws::processEvents() for as long as it returns a value
 * that converts to true.
 * NOTE(review): the loop body is not visible in this excerpt. */
447 retrace::waitForInput(void) {
448 while (glws::processEvents()) {
454 retrace::cleanUp(void) {