// Source: root/Runtime/Profiler/GPUProfiler.cpp (blob c452853ab08a7a902808d3b9bb12e82f4ad40469)
#include "UnityPrefix.h"
#if ENABLE_PROFILER

#include "GPUProfiler.h"
#include "Runtime/GfxDevice/GfxDevice.h"
#include "Runtime/GfxDevice/GfxTimerQuery.h"
#include "ProfilerImpl.h"
#include "ProfilerFrameData.h"

// Profiler markers used by PROFILER_AUTO in GPUProfiler::BeginFrame and
// GPUProfiler::EndFrame below. Both are declared with kProfilerOverhead
// (presumably so their cost is attributed to profiler overhead rather than to
// user code; the macro is defined elsewhere, confirm there).
PROFILER_INFORMATION(gBeginQueriesProf, "GPUProfiler.BeginQueries", kProfilerOverhead)
PROFILER_INFORMATION(gEndQueriesProf, "GPUProfiler.EndQueries", kProfilerOverhead)


void GPUProfiler::GPUTimeSample()
{
	// GPU samples should only be added on the main thread.
	DebugAssert (Thread::CurrentThreadIsMainThread ());
	
	UnityProfilerPerThread* prof = UnityProfilerPerThread::ms_InstanceTLS;
	DebugAssert(prof);
	if (!prof->GetIsActive() || !gGraphicsCaps.hasTimerQuery || gGraphicsCaps.buggyTimerQuery)
		return;

	GfxTimerQuery* timer = ProfilerFrameData::AllocTimerQuery();
	timer->Measure();
	ProfilerData::GPUTime sample = {prof->GetActiveSampleIndex(), timer, 0xFFFFFFFF, g_CurrentGPUSection};
	prof->AddGPUSample(sample);
}

// Starts timer-query collection by calling BeginTimerQueries() on the device
// returned by GetGfxDevice(). The call is made under the gBeginQueriesProf
// marker (PROFILER_AUTO presumably scopes a profiler sample to the rest of the
// function; the macro is defined elsewhere).
void GPUProfiler::BeginFrame()
{	
	PROFILER_AUTO(gBeginQueriesProf, NULL);
	GetGfxDevice().BeginTimerQueries();
}

// Stops timer-query collection by calling EndTimerQueries() on the device
// returned by GetGfxDevice(), under the gEndQueriesProf marker.
void GPUProfiler::EndFrame()
{
	// Issued before the queries are ended and before the profiler marker is
	// opened. Presumably records one last GPU sample for the frame; the
	// GPU_TIMESTAMP macro is defined elsewhere, confirm there.
	GPU_TIMESTAMP();
	PROFILER_AUTO(gEndQueriesProf, NULL);
	GetGfxDevice().EndTimerQueries();
}

// Reads back the elapsed time of every sample in gpuSamples that still owns a
// timer query and stores it in the sample's gpuTimeInMicroSec.
//
// gpuSamples  samples to resolve; updated in place.
// wait        true  -> query with GfxTimerQuery::kWaitAll and always recycle
//                      the query object afterwards;
//             false -> query with GfxTimerQuery::kWaitRenderThread and keep
//                      the query object when no valid time came back, so a
//                      later call can try again.
//
// Returns false (touching nothing) when the graphics caps report no timer-query
// support, true otherwise.
bool GPUProfiler::CollectGPUTime( dynamic_array<ProfilerData::GPUTime>& gpuSamples, bool wait )
{
	if (!gGraphicsCaps.hasTimerQuery)
		return false;

	UInt32 waitFlags = GfxTimerQuery::kWaitRenderThread;
	if (wait)
		waitFlags = GfxTimerQuery::kWaitAll;

	// Gather query times
	for (int idx = 0; idx < gpuSamples.size(); ++idx)
	{
		ProfilerData::GPUTime& entry = gpuSamples[idx];

		// Already resolved (or never had a query): nothing to read back.
		if (entry.timerQuery == NULL)
			continue;

		ProfileTimeFormat elapsedTime = entry.timerQuery->GetElapsed(waitFlags);

		// 0xFFFFFFFF marks "no valid time"; otherwise scale down by 1000
		// (presumably nanoseconds -> microseconds, confirm GetElapsed units).
		entry.gpuTimeInMicroSec = (elapsedTime == kInvalidProfileTime) ? 0xFFFFFFFF : elapsedTime/1000;

		// When not waiting, an unresolved query stays attached for a later pass.
		if (!wait && entry.gpuTimeInMicroSec == 0xFFFFFFFF)
			continue;

		// Recycle query object
		ProfilerFrameData::ReleaseTimerQuery(entry.timerQuery);
		entry.timerQuery = NULL;
	}

	return true;
}

// Resolves every outstanding timer query in gpuSamples (CollectGPUTime with
// wait == true, i.e. GetElapsed is called with kWaitAll) and returns the sum of
// the samples' gpuTimeInMicroSec values.
//
// gpuSamples  samples to resolve and sum; updated in place. The first sample's
//             time is always overwritten with 0.
//
// Returns 0 when CollectGPUTime reports that timer queries are unavailable.
// Samples whose time is still the 0xFFFFFFFF "invalid" sentinel are left out of
// the total; their stored value is not modified.
int GPUProfiler::ComputeGPUTime( dynamic_array<ProfilerData::GPUTime>& gpuSamples )
{
	if (!CollectGPUTime(gpuSamples, true))
		return 0;

	// Why is the first sample invalid?
	if (!gpuSamples.empty())
		gpuSamples[0].gpuTimeInMicroSec = 0;

	int totalTimeMicroSec = 0;
	for (int i = 0; i < gpuSamples.size(); i++)
	{
		// CollectGPUTime stores 0xFFFFFFFF when the query returned
		// kInvalidProfileTime, even when waiting. That value is a marker, not a
		// duration; adding it would corrupt the int total.
		if (gpuSamples[i].gpuTimeInMicroSec == 0xFFFFFFFF)
			continue;

		totalTimeMicroSec += gpuSamples[i].gpuTimeInMicroSec;
	}
	return totalTimeMicroSec;
}

// Hands every timer query still attached to a sample in gpuSamples back to
// ProfilerFrameData and clears the sample's pointer. Recorded times are left
// untouched; no query is read back.
void GPUProfiler::ClearTimerQueries ( dynamic_array<ProfilerData::GPUTime>& gpuSamples )
{
	for (int idx = 0; idx < gpuSamples.size(); ++idx)
	{
		ProfilerData::GPUTime& entry = gpuSamples[idx];

		// Nothing attached to this sample.
		if (entry.timerQuery == NULL)
			continue;

		// Recycle query object
		ProfilerFrameData::ReleaseTimerQuery(entry.timerQuery);
		entry.timerQuery = NULL;
	}
}

#endif // ENABLE_PROFILER