diff --git a/drape/drape_common.pri b/drape/drape_common.pri index 3a036a878a..f08aad14cd 100644 --- a/drape/drape_common.pri +++ b/drape/drape_common.pri @@ -42,6 +42,7 @@ SOURCES += \ $$DRAPE_DIR/glyph_manager.cpp \ $$DRAPE_DIR/utils/vertex_decl.cpp \ $$DRAPE_DIR/utils/projection.cpp \ + $$DRAPE_DIR/utils/gpu_mem_tracker.cpp \ HEADERS += \ $$ROOT_DIR/3party/sdf_image/sdf_image.h \ @@ -90,3 +91,4 @@ HEADERS += \ $$DRAPE_DIR/glyph_manager.hpp \ $$DRAPE_DIR/utils/vertex_decl.hpp \ $$DRAPE_DIR/utils/projection.hpp \ + $$DRAPE_DIR/utils/gpu_mem_tracker.hpp \ diff --git a/drape/drape_tests/glfunctions.cpp b/drape/drape_tests/glfunctions.cpp index 85a04553aa..4df55b8dfc 100644 --- a/drape/drape_tests/glfunctions.cpp +++ b/drape/drape_tests/glfunctions.cpp @@ -241,7 +241,6 @@ int32_t GLFunctions::glGetInteger(glConst pname) void CheckGLError(my::SrcPoint const & /*srcPt*/) {} -// @TODO add actual unit tests void GLFunctions::glEnable(glConst mode) {} void GLFunctions::glBlendEquation(glConst function) {} @@ -259,3 +258,5 @@ void GLFunctions::glUnmapBuffer(glConst target) {} void GLFunctions::glDrawElements(uint16_t indexCount) {} void GLFunctions::glPixelStore(glConst name, uint32_t value) {} + +int32_t GLFunctions::glGetBufferParameter(glConst target, glConst name) { return 0; } diff --git a/drape/glconstants.cpp b/drape/glconstants.cpp index bd7d524899..aef150ccd2 100644 --- a/drape/glconstants.cpp +++ b/drape/glconstants.cpp @@ -45,6 +45,9 @@ const glConst GLMaxTextureSize = GL_MAX_TEXTURE_SIZE; const glConst GLArrayBuffer = GL_ARRAY_BUFFER; const glConst GLElementArrayBuffer = GL_ELEMENT_ARRAY_BUFFER; +const glConst GLBufferSize = GL_BUFFER_SIZE; +const glConst GLBufferUsage = GL_BUFFER_USAGE; + const glConst GLWriteOnly = WRITE_ONLY_DEF; const glConst GLStaticDraw = GL_STATIC_DRAW; diff --git a/drape/glconstants.hpp b/drape/glconstants.hpp index ec226720e9..c5deea0a7a 100644 --- a/drape/glconstants.hpp +++ b/drape/glconstants.hpp @@ -17,6 +17,10 @@ extern const glConst GLMaxTextureSize; extern const glConst GLArrayBuffer; extern const glConst GLElementArrayBuffer; +/// Buffer params +extern const glConst GLBufferSize; +extern const glConst GLBufferUsage; + /// VBO Access extern const glConst GLWriteOnly; diff --git a/drape/glfunctions.cpp b/drape/glfunctions.cpp index 1fede51b83..69392b331e 100644 --- a/drape/glfunctions.cpp +++ b/drape/glfunctions.cpp @@ -58,6 +58,7 @@ namespace void * (APIENTRY *glMapBufferFn)(GLenum target, GLenum access) = NULL; GLboolean (APIENTRY *glUnmapBufferFn)(GLenum target) = NULL; + /// Shaders GLuint (APIENTRY *glCreateShaderFn)(GLenum type) = NULL; void (APIENTRY *glShaderSourceFn)(GLuint shaderID, GLsizei count, GLchar const ** string, GLint const * length) = NULL; @@ -253,6 +254,11 @@ void GLFunctions::glFlush() GLCHECK(glFlushFn()); } +void GLFunctions::glFinish() +{ + GLCHECK(::glFinish()); +} + void GLFunctions::glPixelStore(glConst name, uint32_t value) { GLCHECK(::glPixelStorei(name, value)); @@ -265,6 +271,13 @@ int32_t GLFunctions::glGetInteger(glConst pname) return (int32_t)value; } +int32_t GLFunctions::glGetBufferParameter(glConst target, glConst name) +{ + GLint result; + GLCHECK(::glGetBufferParameteriv(target, name, &result)); + return static_cast(result); +} + void GLFunctions::glEnable(glConst mode) { GLCHECK(::glEnable(mode)); diff --git a/drape/glfunctions.hpp b/drape/glfunctions.hpp index d5c6e9fed4..4ba325784d 100644 --- a/drape/glfunctions.hpp +++ b/drape/glfunctions.hpp @@ -17,10 +17,14 @@ public: static void glClearDepth(); static void glViewport(uint32_t x, uint32_t y, uint32_t w, uint32_t h); static void glFlush(); + static void glFinish(); static void glPixelStore(glConst name, uint32_t value); static int32_t glGetInteger(glConst pname); + /// target = { gl_const::GLArrayBuffer, gl_const::GLElementArrayBuffer } + /// name = { gl_const::GLBufferSize, gl_const::GLBufferUsage } + static int32_t glGetBufferParameter(glConst target, glConst name); static void glEnable(glConst mode); static void glDisable(glConst mode); diff --git a/drape/gpu_buffer.cpp b/drape/gpu_buffer.cpp index 5577ec860d..3e0e4117c2 100644 --- a/drape/gpu_buffer.cpp +++ b/drape/gpu_buffer.cpp @@ -1,11 +1,14 @@ #include "drape/gpu_buffer.hpp" #include "drape/glfunctions.hpp" #include "drape/glextensions_list.hpp" +#include "drape/utils/gpu_mem_tracker.hpp" #include "base/assert.hpp" #include "std/cstring.hpp" +#define CHECK_VBO_BOUNDS + namespace dp { @@ -27,7 +30,7 @@ glConst glTarget(GPUBuffer::Target t) } GPUBuffer::GPUBuffer(Target t, uint8_t elementSize, uint16_t capacity) - : base_t(elementSize, capacity) + : TBase(elementSize, capacity) , m_t(t) #ifdef DEBUG , m_isMapped(false) @@ -41,6 +44,10 @@ GPUBuffer::~GPUBuffer() { GLFunctions::glBindBuffer(0, glTarget(m_t)); GLFunctions::glDeleteBuffer(m_bufferID); + +#if defined(TRACK_GPU_MEM) + dp::GPUMemTracker::Inst().RemoveDeallocated("VBO", m_bufferID); +#endif } void GPUBuffer::UploadData(void const * data, uint16_t elementCount) @@ -51,8 +58,19 @@ void GPUBuffer::UploadData(void const * data, uint16_t elementCount) uint8_t elementSize = GetElementSize(); ASSERT(GetCapacity() >= elementCount + currentSize, ("Not enough memory to upload ", elementCount, " elements")); Bind(); + +#if defined(CHECK_VBO_BOUNDS) + int32_t size = GLFunctions::glGetBufferParameter(glTarget(m_t), gl_const::GLBufferSize); + ASSERT_EQUAL(GetCapacity() * elementSize, size, ()); + ASSERT_LESS_OR_EQUAL((elementCount + currentSize) * elementSize, size,()); +#endif + GLFunctions::glBufferSubData(glTarget(m_t), elementCount * elementSize, data, currentSize * elementSize); - base_t::UploadData(elementCount); + TBase::UploadData(elementCount); + +#if defined(TRACK_GPU_MEM) + dp::GPUMemTracker::Inst().SetUsed("VBO", m_bufferID, (currentSize + elementCount) * elementSize); +#endif } void GPUBuffer::Bind() @@ -75,10 +93,18 @@ void * GPUBuffer::Map() void GPUBuffer::UpdateData(void * gpuPtr, void const * data, uint16_t elementOffset, uint16_t elementCount) { - uint16_t const elementSize = GetElementSize(); - uint32_t const byteOffset = elementOffset * (uint32_t)elementSize; - uint32_t const byteCount = elementCount * (uint32_t)elementSize; + uint32_t const elementSize = static_cast(GetElementSize()); + uint32_t const byteOffset = elementOffset * elementSize; + uint32_t const byteCount = elementCount * elementSize; + uint32_t const byteCapacity = GetCapacity() * elementSize; ASSERT(m_isMapped == true, ()); + +#if defined(CHECK_VBO_BOUNDS) + int32_t size = GLFunctions::glGetBufferParameter(glTarget(m_t), gl_const::GLBufferSize); + ASSERT_EQUAL(size, byteCapacity, ()); + ASSERT_LESS(byteOffset + byteCount, size, ()); +#endif + if (IsMapBufferSupported()) { ASSERT(gpuPtr != NULL, ()); @@ -87,7 +113,7 @@ void GPUBuffer::UpdateData(void * gpuPtr, void const * data, uint16_t elementOff else { ASSERT(gpuPtr == NULL, ()); - if (byteOffset == 0 && byteCount == GetCapacity()) + if (byteOffset == 0 && byteCount == byteCapacity) GLFunctions::glBufferData(glTarget(m_t), byteCount, data, gl_const::GLStaticDraw); else GLFunctions::glBufferSubData(glTarget(m_t), byteCount, data, byteOffset); @@ -106,9 +132,14 @@ void GPUBuffer::Unmap() void GPUBuffer::Resize(uint16_t elementCount) { - base_t::Resize(elementCount); + TBase::Resize(elementCount); Bind(); - GLFunctions::glBufferData(glTarget(m_t), GetCapacity() * GetElementSize(), NULL, gl_const::GLStaticDraw); + GLFunctions::glBufferData(glTarget(m_t), GetCapacity() * GetElementSize(), NULL, gl_const::GLDynamicDraw); +#if defined(TRACK_GPU_MEM) + dp::GPUMemTracker & memTracker = dp::GPUMemTracker::Inst(); + memTracker.RemoveDeallocated("VBO", m_bufferID); + memTracker.AddAllocated("VBO", m_bufferID, GetCapacity() * GetElementSize()); +#endif } //////////////////////////////////////////////////////////////////////////// diff --git a/drape/gpu_buffer.hpp b/drape/gpu_buffer.hpp index 7617379c09..4762c71e80 100644 --- a/drape/gpu_buffer.hpp +++ b/drape/gpu_buffer.hpp @@ -8,7 +8,7 @@ namespace dp class GPUBuffer : public BufferBase { - typedef BufferBase base_t; + typedef BufferBase TBase; public: enum Target { diff --git a/drape/texture.cpp b/drape/texture.cpp index cca15b3c16..6e05267ce0 100644 --- a/drape/texture.cpp +++ b/drape/texture.cpp @@ -2,6 +2,7 @@ #include "drape/glfunctions.hpp" #include "drape/glextensions_list.hpp" +#include "drape/utils/gpu_mem_tracker.hpp" #include "base/math.hpp" @@ -31,7 +32,12 @@ Texture::Texture() Texture::~Texture() { if (m_textureID != -1) + { GLFunctions::glDeleteTexture(m_textureID); +#if defined(TRACK_GPU_MEM) + dp::GPUMemTracker::Inst().RemoveDeallocated("Texture", m_textureID); +#endif + } } void Texture::Create(uint32_t width, uint32_t height, TextureFormat format) @@ -60,6 +66,21 @@ void Texture::Create(uint32_t width, uint32_t height, TextureFormat format, RefP GLFunctions::glTexImage2D(m_width, m_height, layout, pixelType, data.GetRaw()); SetFilterParams(gl_const::GLLinear, gl_const::GLLinear); SetWrapMode(gl_const::GLClampToEdge, gl_const::GLClampToEdge); + +#if defined(TRACK_GPU_MEM) + uint32_t channelBitSize = 8; + uint32_t channelCount = 4; + if (pixelType == gl_const::GL4BitOnChannel) + channelBitSize = 4; + + if (layout == gl_const::GLAlpha) + channelCount = 1; + + uint32_t bitCount = channelBitSize * channelCount * m_width * m_height; + uint32_t memSize = bitCount >> 3; + dp::GPUMemTracker::Inst().AddAllocated("Texture", m_textureID, memSize); + dp::GPUMemTracker::Inst().SetUsed("Texture", m_textureID, memSize); +#endif } void Texture::SetFilterParams(glConst minFilter, glConst magFilter) diff --git a/drape/utils/gpu_mem_tracker.cpp b/drape/utils/gpu_mem_tracker.cpp new file mode 100644 index 0000000000..8c867ba49d --- /dev/null +++ b/drape/utils/gpu_mem_tracker.cpp @@ -0,0 +1,75 @@ +#include "gpu_mem_tracker.hpp" + +#include "../../std/tuple.hpp" +#include "../../std/sstream.hpp" + +namespace dp +{ + +GPUMemTracker & GPUMemTracker::Inst() +{ + static GPUMemTracker s_inst; + return s_inst; +} + +string GPUMemTracker::Report() +{ + uint32_t summaryUsed = 0; + uint32_t summaryAllocated = 0; + + typedef tuple TTagStat; + map tagStats; + + for (auto const it : m_memTracker) + { + TTagStat & stat = tagStats[it.first.first]; + stat.get<0>()++; + stat.get<1>() += it.second.first; + stat.get<2>() += it.second.second; + + summaryAllocated += it.second.first; + summaryUsed += it.second.second; + } + + float byteToMb = static_cast(1024 * 1024); + + ostringstream ss; + ss << " ===== Mem Report ===== \n"; + ss << " Summary Allocated = " << summaryAllocated / byteToMb << "\n"; + ss << " Summary Used = " << summaryUsed / byteToMb << "\n"; + ss << " Tags registered = " << tagStats.size() << "\n"; + + for (auto const it : tagStats) + { + ss << " Tag = " << it.first << " \n"; + ss << " Object count = " << it.second.get<0>() << "\n"; + ss << " Allocated = " << it.second.get<1>() / byteToMb << "\n"; + ss << " Used = " << it.second.get<2>() / byteToMb << "\n"; + } + + ss << " ===== Mem Report ===== \n"; + + return move(ss.str()); +} + +void GPUMemTracker::AddAllocated(string const & tag, uint32_t id, uint32_t size) +{ + threads::MutexGuard g(m_mutex); + m_memTracker[make_pair(tag, id)].first = size; +} + +void GPUMemTracker::SetUsed(string const & tag, uint32_t id, uint32_t size) +{ + threads::MutexGuard g(m_mutex); + TAlocUsedMem & node = m_memTracker[make_pair(tag, id)]; + node.second = size; + ASSERT_LESS_OR_EQUAL(node.second, node.first, ("Can't use more then allocated")); +} + +void GPUMemTracker::RemoveDeallocated(string const & tag, uint32_t id) +{ + threads::MutexGuard g(m_mutex); + m_memTracker.erase(make_pair(tag, id)); +} + +} // namespace dp diff --git a/drape/utils/gpu_mem_tracker.hpp b/drape/utils/gpu_mem_tracker.hpp new file mode 100644 index 0000000000..16e1034fa0 --- /dev/null +++ b/drape/utils/gpu_mem_tracker.hpp @@ -0,0 +1,34 @@ +#pragma once + +#include "../../base/mutex.hpp" + +#include "../../std/map.hpp" +#include "../../std/noncopyable.hpp" + +//#define TRACK_GPU_MEM + +namespace dp +{ + +class GPUMemTracker : private noncopyable +{ +public: + static GPUMemTracker & Inst(); + + string Report(); + void AddAllocated(string const & tag, uint32_t id, uint32_t size); + void SetUsed(string const & tag, uint32_t id, uint32_t size); + void RemoveDeallocated(string const & tag, uint32_t id); + +private: + GPUMemTracker() = default; + +private: + typedef pair TAlocUsedMem; + typedef pair TMemTag; + map m_memTracker; + + threads::Mutex m_mutex; +}; + +} // namespace dp