From e55caa234cf5769fd7704199957b134dc0fd38c1 Mon Sep 17 00:00:00 2001 From: MediaPipe Team Date: Thu, 14 Dec 2023 22:22:57 -0800 Subject: [PATCH] No public description PiperOrigin-RevId: 591148449 --- mediapipe/framework/formats/tensor.cc | 8 +- mediapipe/framework/formats/tensor.h | 4 + .../framework/formats/tensor_ahwb_gpu_test.cc | 133 +++++++++++++++--- 3 files changed, 122 insertions(+), 23 deletions(-) diff --git a/mediapipe/framework/formats/tensor.cc b/mediapipe/framework/formats/tensor.cc index 49987791a1..bf856f5a98 100644 --- a/mediapipe/framework/formats/tensor.cc +++ b/mediapipe/framework/formats/tensor.cc @@ -359,7 +359,13 @@ Tensor::OpenGlBufferView Tensor::GetOpenGlBufferReadView() const { } return {opengl_buffer_, std::move(lock), #ifdef MEDIAPIPE_TENSOR_USE_AHWB - &ssbo_read_ + // ssbo_read_ is passed to be populated on OpenGlBufferView + // destruction in order to perform delayed resources releasing (see + // tensor_ahwb.cc/DelayedReleaser) only when AHWB is in use. + // + // Not passing for the case when AHWB is not in use to avoid creation + // of unnecessary sync object and memory leak. + use_ahwb_ ? &ssbo_read_ : nullptr #else nullptr #endif // MEDIAPIPE_TENSOR_USE_AHWB diff --git a/mediapipe/framework/formats/tensor.h b/mediapipe/framework/formats/tensor.h index 361883a675..863e5fdd3a 100644 --- a/mediapipe/framework/formats/tensor.h +++ b/mediapipe/framework/formats/tensor.h @@ -288,18 +288,22 @@ class Tensor { class OpenGlBufferView : public View { public: GLuint name() const { return name_; } + OpenGlBufferView(OpenGlBufferView&& src) : View(std::move(src)) { name_ = std::exchange(src.name_, GL_INVALID_INDEX); ssbo_read_ = std::exchange(src.ssbo_read_, nullptr); } ~OpenGlBufferView() { if (ssbo_read_) { + // TODO: update tensor to properly handle cases when + // multiple views were requested multiple sync fence may be needed. *ssbo_read_ = glFenceSync(GL_SYNC_GPU_COMMANDS_COMPLETE, 0); } } protected: friend class Tensor; + OpenGlBufferView(GLuint name, std::unique_ptr&& lock, GLsync* ssbo_read) : View(std::move(lock)), name_(name), ssbo_read_(ssbo_read) {} diff --git a/mediapipe/framework/formats/tensor_ahwb_gpu_test.cc b/mediapipe/framework/formats/tensor_ahwb_gpu_test.cc index b06bd3ef27..bfafc44aa7 100644 --- a/mediapipe/framework/formats/tensor_ahwb_gpu_test.cc +++ b/mediapipe/framework/formats/tensor_ahwb_gpu_test.cc @@ -6,6 +6,7 @@ #include +#include "absl/algorithm/container.h" #include "mediapipe/framework/formats/tensor.h" #include "mediapipe/framework/formats/tensor/views/data_types.h" #include "mediapipe/gpu/gpu_test_base.h" @@ -18,7 +19,7 @@ // Then the test requests the CPU view and compares the values. // Float32 and Float16 tests are there. -namespace { +namespace mediapipe { using mediapipe::Float16; using mediapipe::Tensor; @@ -27,6 +28,16 @@ MATCHER_P(NearWithPrecision, precision, "") { return std::abs(std::get<0>(arg) - std::get<1>(arg)) < precision; } +template +std::vector CreateReferenceData(int num_elements) { + std::vector reference; + reference.resize(num_elements); + for (int i = 0; i < num_elements; i++) { + reference[i] = static_cast(i) / 10.0f; + } + return reference; +} + #if MEDIAPIPE_OPENGL_ES_VERSION >= MEDIAPIPE_OPENGL_ES_31 // Utility function to fill the GPU buffer. @@ -110,11 +121,7 @@ TEST_F(TensorAhwbGpuTest, TestGpuToCpuFloat32) { }); auto ptr = tensor.GetCpuReadView().buffer(); ASSERT_NE(ptr, nullptr); - std::vector reference; - reference.resize(num_elements); - for (int i = 0; i < num_elements; i++) { - reference[i] = static_cast(i) / 10.0f; - } + std::vector reference = CreateReferenceData(num_elements); EXPECT_THAT(absl::Span(ptr, num_elements), testing::Pointwise(testing::FloatEq(), reference)); } @@ -137,11 +144,7 @@ TEST_F(TensorAhwbGpuTest, TestGpuToCpuFloat16) { }); auto ptr = tensor.GetCpuReadView().buffer(); ASSERT_NE(ptr, nullptr); - std::vector reference; - reference.resize(num_elements); - for (int i = 0; i < num_elements; i++) { - reference[i] = static_cast(i) / 10.0f; - } + std::vector reference = CreateReferenceData(num_elements); // Precision is set to a reasonable value for Float16. EXPECT_THAT(absl::Span(ptr, num_elements), testing::Pointwise(NearWithPrecision(0.001), reference)); @@ -166,11 +169,7 @@ TEST_F(TensorAhwbGpuTest, TestReplacingCpuByAhwb) { } auto ptr = tensor.GetCpuReadView().buffer(); ASSERT_NE(ptr, nullptr); - std::vector reference; - reference.resize(num_elements); - for (int i = 0; i < num_elements; i++) { - reference[i] = static_cast(i) / 10.0f; - } + std::vector reference = CreateReferenceData(num_elements); EXPECT_THAT(absl::Span(ptr, num_elements), testing::Pointwise(testing::FloatEq(), reference)); } @@ -194,17 +193,107 @@ TEST_F(TensorAhwbGpuTest, TestReplacingGpuByAhwb) { } auto ptr = tensor.GetCpuReadView().buffer(); ASSERT_NE(ptr, nullptr); - std::vector reference; - reference.resize(num_elements); - for (int i = 0; i < num_elements; i++) { - reference[i] = static_cast(i) / 10.0f; - } + std::vector reference = CreateReferenceData(num_elements); EXPECT_THAT(absl::Span(ptr, num_elements), testing::Pointwise(testing::FloatEq(), reference)); } +std::vector ReadGlBufferView(const Tensor::OpenGlBufferView& view, + int num_elements) { + glBindBuffer(GL_SHADER_STORAGE_BUFFER, view.name()); + int bytes = num_elements * sizeof(float); + void* ptr = + glMapBufferRange(GL_SHADER_STORAGE_BUFFER, 0, bytes, GL_MAP_READ_BIT); + ABSL_CHECK(ptr) << "glMapBufferRange failed: " << glGetError(); + + std::vector data; + data.resize(num_elements); + std::memcpy(data.data(), ptr, bytes); + glUnmapBuffer(GL_SHADER_STORAGE_BUFFER); + return data; +} + +TEST_F(TensorAhwbGpuTest, TestGetOpenGlBufferReadViewNoAhwb) { + constexpr size_t kNumElements = 20; + std::vector reference = CreateReferenceData(kNumElements); + + Tensor tensor(Tensor::ElementType::kFloat32, Tensor::Shape({kNumElements})); + { + // Populate tensor on CPU and make sure view is destroyed + absl::c_copy(reference, tensor.GetCpuWriteView().buffer()); + } + + RunInGlContext([&] { + // Triggers conversion to GL buffer. + auto ssbo_view = tensor.GetOpenGlBufferReadView(); + ASSERT_NE(ssbo_view.name(), 0); + // ssbo_read_ must NOT be populated, as there's no AHWB associated with + // GL buffer + ASSERT_EQ(ssbo_view.ssbo_read_, nullptr); + + std::vector output = ReadGlBufferView(ssbo_view, kNumElements); + EXPECT_THAT(output, testing::Pointwise(testing::FloatEq(), reference)); + }); +} + +TEST_F(TensorAhwbGpuTest, TestGetOpenGlBufferReadViewAhwbFromCpu) { + constexpr size_t kNumElements = 20; + std::vector reference = CreateReferenceData(kNumElements); + + Tensor tensor(Tensor::ElementType::kFloat32, Tensor::Shape({kNumElements})); + { + // Populate tensor on CPU and make sure view is destroyed + absl::c_copy(reference, tensor.GetCpuWriteView().buffer()); + } + + { + // Make tensor to allocate ahwb and make sure view is destroyed. + ASSERT_NE(tensor.GetAHardwareBufferReadView().handle(), nullptr); + } + + RunInGlContext([&] { + // Triggers conversion to GL buffer. + auto ssbo_view = tensor.GetOpenGlBufferReadView(); + ASSERT_NE(ssbo_view.name(), 0); + // ssbo_read_ must be populated, so during view destruction it's set + // properly for further AHWB destruction + ASSERT_NE(ssbo_view.ssbo_read_, nullptr); + + std::vector output = ReadGlBufferView(ssbo_view, kNumElements); + EXPECT_THAT(output, testing::Pointwise(testing::FloatEq(), reference)); + }); +} + +TEST_F(TensorAhwbGpuTest, TestGetOpenGlBufferReadViewAhwbFromGpu) { + constexpr size_t kNumElements = 20; + std::vector reference = CreateReferenceData(kNumElements); + + Tensor tensor(Tensor::ElementType::kFloat32, Tensor::Shape({kNumElements})); + { + // Make tensor to allocate ahwb and make sure view is destroyed. + ASSERT_NE(tensor.GetAHardwareBufferWriteView().handle(), nullptr); + } + + RunInGlContext([&] { + FillGpuBuffer(tensor.GetOpenGlBufferWriteView().name(), + tensor.shape().num_elements(), tensor.element_type()); + }); + + RunInGlContext([&] { + // Triggers conversion to GL buffer. + auto ssbo_view = tensor.GetOpenGlBufferReadView(); + ASSERT_NE(ssbo_view.name(), 0); + // ssbo_read_ must be populated, so during view destruction it's set + // properly for further AHWB destruction + ASSERT_NE(ssbo_view.ssbo_read_, nullptr); + + std::vector output = ReadGlBufferView(ssbo_view, kNumElements); + EXPECT_THAT(output, testing::Pointwise(testing::FloatEq(), reference)); + }); +} + #endif // MEDIAPIPE_OPENGL_ES_VERSION >= MEDIAPIPE_OPENGL_ES_31 -} // namespace +} // namespace mediapipe #endif // !defined(MEDIAPIPE_NO_JNI) && (__ANDROID_API__ >= 26 || // defined(__ANDROID_UNAVAILABLE_SYMBOLS_ARE_WEAK__))