From ed1275b673a1b534874bfe1a974ba8b8e5ae96b0 Mon Sep 17 00:00:00 2001 From: Maksym Walczak Date: Mon, 3 Jan 2022 15:42:27 +0100 Subject: [PATCH 01/14] Add pose tracking subproject --- mediapipe/pose_tracking_dll/BUILD | 59 ++++++ mediapipe/pose_tracking_dll/README.md | 30 +++ mediapipe/pose_tracking_dll/pose_tracking.cpp | 179 ++++++++++++++++++ mediapipe/pose_tracking_dll/pose_tracking.h | 99 ++++++++++ .../pose_tracking_dll/windows_dll_library.bzl | 62 ++++++ 5 files changed, 429 insertions(+) create mode 100644 mediapipe/pose_tracking_dll/BUILD create mode 100644 mediapipe/pose_tracking_dll/README.md create mode 100644 mediapipe/pose_tracking_dll/pose_tracking.cpp create mode 100644 mediapipe/pose_tracking_dll/pose_tracking.h create mode 100644 mediapipe/pose_tracking_dll/windows_dll_library.bzl diff --git a/mediapipe/pose_tracking_dll/BUILD b/mediapipe/pose_tracking_dll/BUILD new file mode 100644 index 000000000..98b5f9dc9 --- /dev/null +++ b/mediapipe/pose_tracking_dll/BUILD @@ -0,0 +1,59 @@ +# Copyright 2020 The MediaPipe Authors. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +load("windows_dll_library.bzl", "windows_dll_library") +licenses(["notice"]) + +package(default_visibility = ["//mediapipe/examples:__subpackages__"]) + +# Define the shared library +windows_dll_library( + name = "pose_tracking_lib", + srcs = ["pose_tracking.cpp"], + hdrs = ["pose_tracking.h"], + # Define COMPILING_DLL to export symbols during compiling the DLL. + copts = ["-DCOMPILING_DLL"], + deps = [ + "//mediapipe/framework:calculator_framework", + "//mediapipe/framework/formats:image_frame", + "//mediapipe/framework/formats:image_frame_opencv", + "//mediapipe/framework/formats:landmark_cc_proto", + "//mediapipe/framework/formats:rect_cc_proto", + "//mediapipe/framework/port:file_helpers", + "//mediapipe/framework/port:opencv_highgui", + "//mediapipe/framework/port:opencv_imgproc", + "//mediapipe/framework/port:opencv_video", + "//mediapipe/framework/port:parse_text_proto", + "//mediapipe/framework/port:status", + "@com_google_absl//absl/flags:flag", + "@com_google_absl//absl/flags:parse", + + "//mediapipe/calculators/core:constant_side_packet_calculator", + "//mediapipe/calculators/core:packet_presence_calculator", + "//mediapipe/calculators/core:flow_limiter_calculator", + "//mediapipe/calculators/tflite:tflite_model_calculator", + "//mediapipe/calculators/util:local_file_contents_calculator", + "//mediapipe/graphs/pose_tracking:pose_tracking_cpu_deps", + ] +) + +# **Implicitly link to face_mesh_lib.dll** +cc_binary( + name = "pose_tracking_cpu", + deps = [ + "//mediapipe/examples/desktop:demo_run_graph_main", + "//mediapipe/graphs/pose_tracking:pose_tracking_cpu_deps", + ":pose_tracking_lib" + ], +) diff --git a/mediapipe/pose_tracking_dll/README.md b/mediapipe/pose_tracking_dll/README.md new file mode 100644 index 000000000..a183c4f2b --- /dev/null +++ b/mediapipe/pose_tracking_dll/README.md @@ -0,0 +1,30 @@ +## Description +The pose_tracking_dll module allows for building a dll library that can be used with any C++ project. All the dependencies such as tensorflow are built statically into the dll. + +Currently, the following features are supported: +- Segmenting the person(s) of interest +- Segmenting the skeleton(s) +- Accessing the 3D coordinates of each node of the skeleton by name (using enum) + +## Prerequisites +Follow the guidelines on the official Mediapipe website: https://google.github.io/mediapipe/getting_started/install.html#installing-on-windows + +IMPORTANT: The tutorial does not specify which version of Bazel to install. Install Bazel version 3.7.2 + +## How to build +Assuming you're in the root of the repository: + +cd mediapipe + +bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 pose_tracking_dll:pose_tracking_cpu + +The results will be stored in bazel-bin\mediapipe\pose_tracking_dll folder. + +## How to use +Go to bazel-bin\mediapipe\pose_tracking_dll + +Link pose_tracking_cpu.lib and pose_tracking_lib.dll.if.lib statically in your project. + +Make sure the opencv_world3410.dll and pose_tracking_lib.dll are accessible in your working directory. + +Use mediapipe\pose_tracking_dll\pose_tracking.h header file to access the methods of the library. diff --git a/mediapipe/pose_tracking_dll/pose_tracking.cpp b/mediapipe/pose_tracking_dll/pose_tracking.cpp new file mode 100644 index 000000000..65f9f619f --- /dev/null +++ b/mediapipe/pose_tracking_dll/pose_tracking.cpp @@ -0,0 +1,179 @@ +#include +#include + +#include "pose_tracking.h" + +#include "absl/flags/flag.h" +#include "absl/flags/parse.h" +#include "mediapipe/framework/formats/landmark.pb.h" +#include "mediapipe/framework/calculator_framework.h" +#include "mediapipe/framework/formats/image_frame.h" +#include "mediapipe/framework/formats/image_frame_opencv.h" +#include "mediapipe/framework/port/file_helpers.h" +#include "mediapipe/framework/port/opencv_highgui_inc.h" +#include "mediapipe/framework/port/opencv_imgproc_inc.h" +#include "mediapipe/framework/port/opencv_video_inc.h" +#include "mediapipe/framework/port/parse_text_proto.h" +#include "mediapipe/framework/port/status.h" + +class PoseTrackingImpl { +public: + PoseTrackingImpl(const std::string& calculatorGraphConfigFile) { + auto status = initialize(calculatorGraphConfigFile); + if (!status.ok()) { + LOG(WARNING) << "Warning: " << status; + } + } + + absl::Status initialize(const std::string& calculatorGraphConfigFile) { + std::string graphContents; + MP_RETURN_IF_ERROR(mediapipe::file::GetContents( + calculatorGraphConfigFile, + &graphContents)); + + mediapipe::CalculatorGraphConfig config = + mediapipe::ParseTextProtoOrDie( + graphContents); + + MP_RETURN_IF_ERROR(graph.Initialize(config)); + ASSIGN_OR_RETURN(mediapipe::OutputStreamPoller poller, + graph.AddOutputStreamPoller(kOutputSegmentationStream)); + + ASSIGN_OR_RETURN(mediapipe::OutputStreamPoller landmarksPoller, + graph.AddOutputStreamPoller(kOutpuLandmarksStream)); + + ASSIGN_OR_RETURN(mediapipe::OutputStreamPoller posePresencePoller, + graph.AddOutputStreamPoller(kOutpuPosePresenceStream)); + + + maskPollerPtr = std::make_unique(std::move(poller)); + + landmarksPollerPtr = std::make_unique( + std::move(landmarksPoller)); + + posePresencePollerPtr = std::make_unique( + std::move(posePresencePoller)); + + MP_RETURN_IF_ERROR(graph.StartRun({})); + } + + bool processFrame(const cv::Mat& inputRGB8Bit) { + // Wrap Mat into an ImageFrame. + auto inputFrame = absl::make_unique( + mediapipe::ImageFormat::SRGB, inputRGB8Bit.cols, inputRGB8Bit.rows, + mediapipe::ImageFrame::kDefaultAlignmentBoundary); + cv::Mat inputFrameMat = mediapipe::formats::MatView(inputFrame.get()); + inputRGB8Bit.copyTo(inputFrameMat); + + // Send image packet into the graph. + size_t frameTimestampUs = + (double)cv::getTickCount() / (double)cv::getTickFrequency() * 1e6; + auto status = graph.AddPacketToInputStream( + kInputStream, mediapipe::Adopt(inputFrame.release()) + .At(mediapipe::Timestamp(frameTimestampUs))); + + if (!status.ok()) { + LOG(WARNING) << "Graph execution failed: " << status; + return false; + } + + mediapipe::Packet posePresencePacket; + if (!posePresencePollerPtr || !posePresencePollerPtr->Next(&posePresencePacket)) return false; + auto landmarksDetected = posePresencePacket.Get(); + + if (!landmarksDetected) { + return false; + } + + // Get the graph result packet, or stop if that fails. + mediapipe::Packet maskPacket; + if (!maskPollerPtr || !maskPollerPtr->Next(&maskPacket)) return false; + auto& outputFrame = maskPacket.Get(); + + // Get pose landmarks. + if (!landmarksPollerPtr || + !landmarksPollerPtr->Next(&poseLandmarksPacket)) { + return false; + } + + // Convert back to opencv for display or saving. + auto mask = mediapipe::formats::MatView(&outputFrame); + segmentedMask = mask.clone(); + + absl::Status landmarksStatus = detectLandmarksWithStatus(poseLandmarks); + + return landmarksStatus.ok(); + } + + absl::Status detectLandmarksWithStatus( + nimagna::cv_wrapper::Point3f* poseLandmarks) { + + if (poseLandmarksPacket.IsEmpty()) { + return absl::CancelledError("Pose landmarks packet is empty."); + } + + auto retrievedLandmarks = + poseLandmarksPacket + .Get<::mediapipe::NormalizedLandmarkList>(); + + // Convert landmarks to cv::Point3f**. + const auto landmarksCount = retrievedLandmarks.landmark_size(); + + for (int j = 0; j < landmarksCount; ++j) { + const auto& landmark = retrievedLandmarks.landmark(j); + poseLandmarks[j].x = landmark.x(); + poseLandmarks[j].y = landmark.y(); + poseLandmarks[j].z = landmark.z(); + } + + return absl::OkStatus(); + } + + nimagna::cv_wrapper::Point3f* lastDetectedLandmarks() { + return poseLandmarks; + } + + cv::Mat lastSegmentedFrame() { + return segmentedMask; + } + + static constexpr size_t kLandmarksCount = 33u; + +private: + mediapipe::Packet poseLandmarksPacket; + cv::Mat segmentedMask; + nimagna::cv_wrapper::Point3f poseLandmarks[kLandmarksCount]; + std::unique_ptr posePresencePollerPtr; + std::unique_ptr maskPollerPtr; + std::unique_ptr landmarksPollerPtr; + mediapipe::CalculatorGraph graph; + const char* kInputStream = "input_video"; + const char* kOutputSegmentationStream = "segmentation_mask"; + const char* kOutpuLandmarksStream = "pose_landmarks"; + const char* kOutpuPosePresenceStream = "pose_presence"; +}; + +namespace nimagna { + PoseTracking::PoseTracking(const char* calculatorGraphConfigFile) { + myInstance = new PoseTrackingImpl(calculatorGraphConfigFile); + } + + bool PoseTracking::processFrame(const cv_wrapper::Mat& inputRGB8Bit) { + auto* instance = static_cast(myInstance); + const auto frame = cv::Mat(inputRGB8Bit.rows, inputRGB8Bit.cols, CV_8UC3, inputRGB8Bit.data); + return instance->processFrame(frame); + } + + cv_wrapper::Point3f* PoseTracking::lastDetectedLandmarks() { + auto* instance = static_cast(myInstance); + return instance->lastDetectedLandmarks(); + } + + cv_wrapper::Mat PoseTracking::lastSegmentedFrame() { + auto* instance = static_cast(myInstance); + const cv::Mat result = instance->lastSegmentedFrame(); + + return cv_wrapper::Mat(result.rows, result.cols, result.data); + } + +} diff --git a/mediapipe/pose_tracking_dll/pose_tracking.h b/mediapipe/pose_tracking_dll/pose_tracking.h new file mode 100644 index 000000000..34161506c --- /dev/null +++ b/mediapipe/pose_tracking_dll/pose_tracking.h @@ -0,0 +1,99 @@ +#ifndef POSE_TRACKING_LIBRARY_H +#define POSE_TRACKING_LIBRARY_H + +#ifdef COMPILING_DLL +#define DLLEXPORT __declspec(dllexport) +#else +#define DLLEXPORT __declspec(dllimport) +#endif + +namespace nimagna { + namespace cv_wrapper { + struct Point2f { + float x = 0; + float y = 0; + + Point2f() = default; + Point2f(float x, float y) : x(x), y(y) {} + }; + struct Point3f { + float x = 0; + float y = 0; + float z = 0; + + Point3f() = default; + Point3f(float x, float y, float z) : x(x), y(y), z(z) {} + }; + + struct Rect { + int x = 0; + int y = 0; + int width = 0; + int height = 0; + + Rect() = default; + Rect(int x, int y, int width, int height) : x(x), y(y), width(width), height(height) {} + }; + + struct Mat { + int rows = 0; + int cols = 0; + unsigned char* data = 0; + + Mat(int rows, int cols, unsigned char* data) : rows(rows), cols(cols), data(data) {} + }; + } + + class DLLEXPORT PoseTracking { + public: + static constexpr size_t landmarksCount = 33u; + enum LandmarkNames { + NOSE = 0, + LEFT_EYE_INNER, + LEFT_EYE, + LEFT_EYE_OUTER, + RIGHT_EYE_INNER, + RIGHT_EYE, + RIGHT_EYE_OUTER, + LEFT_EAR, + RIGHT_EAR, + MOUTH_LEFT, + MOUTH_RIGHT, + LEFT_SHOULDER, + RIGHT_SHOULDER, + LEFT_ELBOW, + RIGHT_ELBOW, + LEFT_WRIST, + RIGHT_WRIST, + LEFT_PINKY, + RIGHT_PINKY, + LEFT_INDEX, + RIGHT_INDEX, + LEFT_THUMB, + RIGHT_THUMB, + LEFT_HIP, + RIGHT_HIP, + LEFT_KNEE, + RIGHT_KNEE, + LEFT_ANKLE, + RIGHT_ANKLE, + LEFT_HEEL, + RIGHT_HEEL, + LEFT_FOOT_INDEX, + RIGHT_FOOT_INDEX, + COUNT = landmarksCount + }; + + PoseTracking(const char* calculatorGraphConfigFile); + ~PoseTracking() { delete myInstance; } + + bool processFrame(const cv_wrapper::Mat& inputRGB8Bit); + cv_wrapper::Mat lastSegmentedFrame(); + cv_wrapper::Point3f* lastDetectedLandmarks(); + + private: + void* myInstance; + }; +} + +#endif \ No newline at end of file diff --git a/mediapipe/pose_tracking_dll/windows_dll_library.bzl b/mediapipe/pose_tracking_dll/windows_dll_library.bzl new file mode 100644 index 000000000..69c243d60 --- /dev/null +++ b/mediapipe/pose_tracking_dll/windows_dll_library.bzl @@ -0,0 +1,62 @@ +""" +This is a simple windows_dll_library rule for builing a DLL Windows +that can be depended on by other cc rules. +Example useage: + windows_dll_library( + name = "hellolib", + srcs = [ + "hello-library.cpp", + ], + hdrs = ["hello-library.h"], + # Define COMPILING_DLL to export symbols during compiling the DLL. + copts = ["/DCOMPILING_DLL"], + ) +""" + +load("@rules_cc//cc:defs.bzl", "cc_binary", "cc_import", "cc_library") + +def windows_dll_library( + name, + srcs = [], + deps = [], + hdrs = [], + visibility = None, + **kwargs): + """A simple windows_dll_library rule for builing a DLL Windows.""" + dll_name = name + ".dll" + import_lib_name = name + "_import_lib" + import_target_name = name + "_dll_import" + + # Build the shared library + cc_binary( + name = dll_name, + srcs = srcs + hdrs, + deps = deps, + linkshared = 1, + **kwargs + ) + + # Get the import library for the dll + native.filegroup( + name = import_lib_name, + srcs = [":" + dll_name], + output_group = "interface_library", + ) + + # Because we cannot directly depend on cc_binary from other cc rules in deps attribute, + # we use cc_import as a bridge to depend on the dll. + cc_import( + name = import_target_name, + interface_library = ":" + import_lib_name, + shared_library = ":" + dll_name, + ) + + # Create a new cc_library to also include the headers needed for the shared library + cc_library( + name = name, + hdrs = hdrs, + visibility = visibility, + deps = deps + [ + ":" + import_target_name, + ], + ) \ No newline at end of file From 561da620df4fb44d24f4f2b0a44d9d93e8a64628 Mon Sep 17 00:00:00 2001 From: MaksymAtNimagna <88328636+MaksymAtNimagna@users.noreply.github.com> Date: Tue, 4 Jan 2022 11:43:21 +0100 Subject: [PATCH 02/14] Update mediapipe/pose_tracking_dll/README.md Co-authored-by: Xavier Valls --- mediapipe/pose_tracking_dll/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mediapipe/pose_tracking_dll/README.md b/mediapipe/pose_tracking_dll/README.md index a183c4f2b..9fed2b27f 100644 --- a/mediapipe/pose_tracking_dll/README.md +++ b/mediapipe/pose_tracking_dll/README.md @@ -4,7 +4,7 @@ The pose_tracking_dll module allows for building a dll library that can be used Currently, the following features are supported: - Segmenting the person(s) of interest - Segmenting the skeleton(s) -- Accessing the 3D coordinates of each node of the skeleton by name (using enum) +- Accessing the 3D coordinates of each node of the skeleton ## Prerequisites Follow the guidelines on the official Mediapipe website: https://google.github.io/mediapipe/getting_started/install.html#installing-on-windows From 3e9b56010eea2d7ac2c3e6224eb0b61a0dc0d993 Mon Sep 17 00:00:00 2001 From: MaksymAtNimagna <88328636+MaksymAtNimagna@users.noreply.github.com> Date: Tue, 4 Jan 2022 11:43:34 +0100 Subject: [PATCH 03/14] Update mediapipe/pose_tracking_dll/pose_tracking.h Co-authored-by: Xavier Valls --- mediapipe/pose_tracking_dll/pose_tracking.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mediapipe/pose_tracking_dll/pose_tracking.h b/mediapipe/pose_tracking_dll/pose_tracking.h index 34161506c..5583cb6de 100644 --- a/mediapipe/pose_tracking_dll/pose_tracking.h +++ b/mediapipe/pose_tracking_dll/pose_tracking.h @@ -96,4 +96,4 @@ namespace nimagna { }; } -#endif \ No newline at end of file +#endif From 95483fa64aeb0843fa877dde85933305a562d4b2 Mon Sep 17 00:00:00 2001 From: MaksymAtNimagna <88328636+MaksymAtNimagna@users.noreply.github.com> Date: Tue, 4 Jan 2022 11:45:17 +0100 Subject: [PATCH 04/14] Update mediapipe/pose_tracking_dll/windows_dll_library.bzl Co-authored-by: Xavier Valls --- mediapipe/pose_tracking_dll/windows_dll_library.bzl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mediapipe/pose_tracking_dll/windows_dll_library.bzl b/mediapipe/pose_tracking_dll/windows_dll_library.bzl index 69c243d60..ef7371af8 100644 --- a/mediapipe/pose_tracking_dll/windows_dll_library.bzl +++ b/mediapipe/pose_tracking_dll/windows_dll_library.bzl @@ -59,4 +59,4 @@ def windows_dll_library( deps = deps + [ ":" + import_target_name, ], - ) \ No newline at end of file + ) From 8b3cd11c39257829b8edb8eff45a85008de612cb Mon Sep 17 00:00:00 2001 From: MaksymAtNimagna <88328636+MaksymAtNimagna@users.noreply.github.com> Date: Tue, 4 Jan 2022 11:45:31 +0100 Subject: [PATCH 05/14] Update mediapipe/pose_tracking_dll/BUILD Co-authored-by: Xavier Valls --- mediapipe/pose_tracking_dll/BUILD | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mediapipe/pose_tracking_dll/BUILD b/mediapipe/pose_tracking_dll/BUILD index 98b5f9dc9..9e2df0b7d 100644 --- a/mediapipe/pose_tracking_dll/BUILD +++ b/mediapipe/pose_tracking_dll/BUILD @@ -22,7 +22,7 @@ windows_dll_library( name = "pose_tracking_lib", srcs = ["pose_tracking.cpp"], hdrs = ["pose_tracking.h"], - # Define COMPILING_DLL to export symbols during compiling the DLL. + # Define COMPILING_DLL to export symbols during the DLL compilation. copts = ["-DCOMPILING_DLL"], deps = [ "//mediapipe/framework:calculator_framework", From d5581dabb338c6963e888bb316c0ee2178c713f4 Mon Sep 17 00:00:00 2001 From: MaksymAtNimagna <88328636+MaksymAtNimagna@users.noreply.github.com> Date: Tue, 4 Jan 2022 11:46:27 +0100 Subject: [PATCH 06/14] Update mediapipe/pose_tracking_dll/README.md Co-authored-by: Xavier Valls --- mediapipe/pose_tracking_dll/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mediapipe/pose_tracking_dll/README.md b/mediapipe/pose_tracking_dll/README.md index 9fed2b27f..12e330393 100644 --- a/mediapipe/pose_tracking_dll/README.md +++ b/mediapipe/pose_tracking_dll/README.md @@ -1,5 +1,5 @@ ## Description -The pose_tracking_dll module allows for building a dll library that can be used with any C++ project. All the dependencies such as tensorflow are built statically into the dll. +The pose_tracking_dll module allows for building a Mediapipe-based pose tracking DLL library that can be used with any C++ project. All the dependencies such as tensorflow are built statically into the dll. Currently, the following features are supported: - Segmenting the person(s) of interest From d0cce9d97d8730ad7f3b316bb0bff3d9563595fd Mon Sep 17 00:00:00 2001 From: Maksym Walczak Date: Tue, 4 Jan 2022 11:54:01 +0100 Subject: [PATCH 07/14] Modify readme --- mediapipe/pose_tracking_dll/README.md | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/mediapipe/pose_tracking_dll/README.md b/mediapipe/pose_tracking_dll/README.md index 12e330393..b47ce0294 100644 --- a/mediapipe/pose_tracking_dll/README.md +++ b/mediapipe/pose_tracking_dll/README.md @@ -14,9 +14,11 @@ IMPORTANT: The tutorial does not specify which version of Bazel to install. Inst ## How to build Assuming you're in the root of the repository: -cd mediapipe +`cd mediapipe` -bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 pose_tracking_dll:pose_tracking_cpu +`bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 pose_tracking_dll:pose_tracking_cpu` + +Alternatively `dbg` can be used in place of `opt` to build the library with debug symbols in Visual Studio pdb format. The results will be stored in bazel-bin\mediapipe\pose_tracking_dll folder. From a55e33824b437289a040f37369ea86fe02bcea64 Mon Sep 17 00:00:00 2001 From: Maksym Walczak Date: Tue, 4 Jan 2022 11:55:37 +0100 Subject: [PATCH 08/14] Use Cpp style cast --- mediapipe/pose_tracking_dll/pose_tracking.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mediapipe/pose_tracking_dll/pose_tracking.cpp b/mediapipe/pose_tracking_dll/pose_tracking.cpp index 65f9f619f..369542eb9 100644 --- a/mediapipe/pose_tracking_dll/pose_tracking.cpp +++ b/mediapipe/pose_tracking_dll/pose_tracking.cpp @@ -67,7 +67,7 @@ public: // Send image packet into the graph. size_t frameTimestampUs = - (double)cv::getTickCount() / (double)cv::getTickFrequency() * 1e6; + static_cast(cv::getTickCount()) / static_cast(cv::getTickFrequency()) * 1e6; auto status = graph.AddPacketToInputStream( kInputStream, mediapipe::Adopt(inputFrame.release()) .At(mediapipe::Timestamp(frameTimestampUs))); From 281199e27888ce2e6ed15b8ad3bd7e54244bb553 Mon Sep 17 00:00:00 2001 From: Maksym Walczak Date: Tue, 4 Jan 2022 12:09:48 +0100 Subject: [PATCH 09/14] Avoid void* for the sake of forward declaration --- mediapipe/pose_tracking_dll/pose_tracking.cpp | 11 ++++------- mediapipe/pose_tracking_dll/pose_tracking.h | 6 ++++-- 2 files changed, 8 insertions(+), 9 deletions(-) diff --git a/mediapipe/pose_tracking_dll/pose_tracking.cpp b/mediapipe/pose_tracking_dll/pose_tracking.cpp index 369542eb9..abb56c9e8 100644 --- a/mediapipe/pose_tracking_dll/pose_tracking.cpp +++ b/mediapipe/pose_tracking_dll/pose_tracking.cpp @@ -155,23 +155,20 @@ private: namespace nimagna { PoseTracking::PoseTracking(const char* calculatorGraphConfigFile) { - myInstance = new PoseTrackingImpl(calculatorGraphConfigFile); + mImplementation = new PoseTrackingImpl(calculatorGraphConfigFile); } bool PoseTracking::processFrame(const cv_wrapper::Mat& inputRGB8Bit) { - auto* instance = static_cast(myInstance); const auto frame = cv::Mat(inputRGB8Bit.rows, inputRGB8Bit.cols, CV_8UC3, inputRGB8Bit.data); - return instance->processFrame(frame); + return mImplementation->processFrame(frame); } cv_wrapper::Point3f* PoseTracking::lastDetectedLandmarks() { - auto* instance = static_cast(myInstance); - return instance->lastDetectedLandmarks(); + return mImplementation->lastDetectedLandmarks(); } cv_wrapper::Mat PoseTracking::lastSegmentedFrame() { - auto* instance = static_cast(myInstance); - const cv::Mat result = instance->lastSegmentedFrame(); + const cv::Mat result = mImplementation->lastSegmentedFrame(); return cv_wrapper::Mat(result.rows, result.cols, result.data); } diff --git a/mediapipe/pose_tracking_dll/pose_tracking.h b/mediapipe/pose_tracking_dll/pose_tracking.h index 5583cb6de..05c017b78 100644 --- a/mediapipe/pose_tracking_dll/pose_tracking.h +++ b/mediapipe/pose_tracking_dll/pose_tracking.h @@ -7,6 +7,8 @@ #define DLLEXPORT __declspec(dllimport) #endif +class PoseTrackingImpl; + namespace nimagna { namespace cv_wrapper { struct Point2f { @@ -85,14 +87,14 @@ namespace nimagna { }; PoseTracking(const char* calculatorGraphConfigFile); - ~PoseTracking() { delete myInstance; } + ~PoseTracking() { delete mImplementation; } bool processFrame(const cv_wrapper::Mat& inputRGB8Bit); cv_wrapper::Mat lastSegmentedFrame(); cv_wrapper::Point3f* lastDetectedLandmarks(); private: - void* myInstance; + PoseTrackingImpl* mImplementation; }; } From 092e1ad899aba0f37a4723568a820d50c1a4af92 Mon Sep 17 00:00:00 2001 From: Maksym Walczak Date: Tue, 4 Jan 2022 13:52:01 +0100 Subject: [PATCH 10/14] Avoid void* for the sake of forward declaration --- mediapipe/pose_tracking_dll/pose_tracking.cpp | 243 +++++++++--------- mediapipe/pose_tracking_dll/pose_tracking.h | 154 +++++------ 2 files changed, 192 insertions(+), 205 deletions(-) diff --git a/mediapipe/pose_tracking_dll/pose_tracking.cpp b/mediapipe/pose_tracking_dll/pose_tracking.cpp index abb56c9e8..a928bf708 100644 --- a/mediapipe/pose_tracking_dll/pose_tracking.cpp +++ b/mediapipe/pose_tracking_dll/pose_tracking.cpp @@ -1,14 +1,14 @@ +#include "pose_tracking.h" + #include #include -#include "pose_tracking.h" - #include "absl/flags/flag.h" #include "absl/flags/parse.h" -#include "mediapipe/framework/formats/landmark.pb.h" #include "mediapipe/framework/calculator_framework.h" #include "mediapipe/framework/formats/image_frame.h" #include "mediapipe/framework/formats/image_frame_opencv.h" +#include "mediapipe/framework/formats/landmark.pb.h" #include "mediapipe/framework/port/file_helpers.h" #include "mediapipe/framework/port/opencv_highgui_inc.h" #include "mediapipe/framework/port/opencv_imgproc_inc.h" @@ -17,160 +17,147 @@ #include "mediapipe/framework/port/status.h" class PoseTrackingImpl { -public: - PoseTrackingImpl(const std::string& calculatorGraphConfigFile) { - auto status = initialize(calculatorGraphConfigFile); - if (!status.ok()) { - LOG(WARNING) << "Warning: " << status; - } - } + public: + PoseTrackingImpl(const std::string& calculatorGraphConfigFile) { + auto status = initialize(calculatorGraphConfigFile); + if (!status.ok()) { + LOG(WARNING) << "Warning: " << status; + } + } - absl::Status initialize(const std::string& calculatorGraphConfigFile) { - std::string graphContents; - MP_RETURN_IF_ERROR(mediapipe::file::GetContents( - calculatorGraphConfigFile, - &graphContents)); + absl::Status initialize(const std::string& calculatorGraphConfigFile) { + std::string graphContents; + MP_RETURN_IF_ERROR(mediapipe::file::GetContents(calculatorGraphConfigFile, &graphContents)); - mediapipe::CalculatorGraphConfig config = - mediapipe::ParseTextProtoOrDie( - graphContents); - - MP_RETURN_IF_ERROR(graph.Initialize(config)); - ASSIGN_OR_RETURN(mediapipe::OutputStreamPoller poller, - graph.AddOutputStreamPoller(kOutputSegmentationStream)); + mediapipe::CalculatorGraphConfig config = + mediapipe::ParseTextProtoOrDie(graphContents); - ASSIGN_OR_RETURN(mediapipe::OutputStreamPoller landmarksPoller, - graph.AddOutputStreamPoller(kOutpuLandmarksStream)); + MP_RETURN_IF_ERROR(graph.Initialize(config)); + ASSIGN_OR_RETURN(mediapipe::OutputStreamPoller poller, + graph.AddOutputStreamPoller(kOutputSegmentationStream)); - ASSIGN_OR_RETURN(mediapipe::OutputStreamPoller posePresencePoller, - graph.AddOutputStreamPoller(kOutpuPosePresenceStream)); + ASSIGN_OR_RETURN(mediapipe::OutputStreamPoller landmarksPoller, + graph.AddOutputStreamPoller(kOutpuLandmarksStream)); + ASSIGN_OR_RETURN(mediapipe::OutputStreamPoller posePresencePoller, + graph.AddOutputStreamPoller(kOutpuPosePresenceStream)); - maskPollerPtr = std::make_unique(std::move(poller)); + maskPollerPtr = std::make_unique(std::move(poller)); - landmarksPollerPtr = std::make_unique( - std::move(landmarksPoller)); + landmarksPollerPtr = + std::make_unique(std::move(landmarksPoller)); - posePresencePollerPtr = std::make_unique( - std::move(posePresencePoller)); + posePresencePollerPtr = + std::make_unique(std::move(posePresencePoller)); - MP_RETURN_IF_ERROR(graph.StartRun({})); - } + MP_RETURN_IF_ERROR(graph.StartRun({})); + } - bool processFrame(const cv::Mat& inputRGB8Bit) { - // Wrap Mat into an ImageFrame. - auto inputFrame = absl::make_unique( - mediapipe::ImageFormat::SRGB, inputRGB8Bit.cols, inputRGB8Bit.rows, - mediapipe::ImageFrame::kDefaultAlignmentBoundary); - cv::Mat inputFrameMat = mediapipe::formats::MatView(inputFrame.get()); - inputRGB8Bit.copyTo(inputFrameMat); + bool processFrame(const cv::Mat& inputRGB8Bit) { + // Wrap Mat into an ImageFrame. + auto inputFrame = absl::make_unique( + mediapipe::ImageFormat::SRGB, inputRGB8Bit.cols, inputRGB8Bit.rows, + mediapipe::ImageFrame::kDefaultAlignmentBoundary); + cv::Mat inputFrameMat = mediapipe::formats::MatView(inputFrame.get()); + inputRGB8Bit.copyTo(inputFrameMat); - // Send image packet into the graph. - size_t frameTimestampUs = - static_cast(cv::getTickCount()) / static_cast(cv::getTickFrequency()) * 1e6; - auto status = graph.AddPacketToInputStream( - kInputStream, mediapipe::Adopt(inputFrame.release()) - .At(mediapipe::Timestamp(frameTimestampUs))); + // Send image packet into the graph. + size_t frameTimestampUs = + static_cast(cv::getTickCount()) / static_cast(cv::getTickFrequency()) * 1e6; + auto status = graph.AddPacketToInputStream( + kInputStream, + mediapipe::Adopt(inputFrame.release()).At(mediapipe::Timestamp(frameTimestampUs))); - if (!status.ok()) { - LOG(WARNING) << "Graph execution failed: " << status; - return false; - } + if (!status.ok()) { + LOG(WARNING) << "Graph execution failed: " << status; + return false; + } - mediapipe::Packet posePresencePacket; - if (!posePresencePollerPtr || !posePresencePollerPtr->Next(&posePresencePacket)) return false; - auto landmarksDetected = posePresencePacket.Get(); + mediapipe::Packet posePresencePacket; + if (!posePresencePollerPtr || !posePresencePollerPtr->Next(&posePresencePacket)) return false; + auto landmarksDetected = posePresencePacket.Get(); - if (!landmarksDetected) { - return false; - } + if (!landmarksDetected) { + return false; + } - // Get the graph result packet, or stop if that fails. - mediapipe::Packet maskPacket; - if (!maskPollerPtr || !maskPollerPtr->Next(&maskPacket)) return false; - auto& outputFrame = maskPacket.Get(); + // Get the graph result packet, or stop if that fails. + mediapipe::Packet maskPacket; + if (!maskPollerPtr || !maskPollerPtr->Next(&maskPacket)) return false; + auto& outputFrame = maskPacket.Get(); - // Get pose landmarks. - if (!landmarksPollerPtr || - !landmarksPollerPtr->Next(&poseLandmarksPacket)) { - return false; - } + // Get pose landmarks. + if (!landmarksPollerPtr || !landmarksPollerPtr->Next(&poseLandmarksPacket)) { + return false; + } - // Convert back to opencv for display or saving. - auto mask = mediapipe::formats::MatView(&outputFrame); - segmentedMask = mask.clone(); + // Convert back to opencv for display or saving. + auto mask = mediapipe::formats::MatView(&outputFrame); + segmentedMask = mask.clone(); - absl::Status landmarksStatus = detectLandmarksWithStatus(poseLandmarks); + absl::Status landmarksStatus = detectLandmarksWithStatus(poseLandmarks); - return landmarksStatus.ok(); - } + return landmarksStatus.ok(); + } - absl::Status detectLandmarksWithStatus( - nimagna::cv_wrapper::Point3f* poseLandmarks) { + absl::Status detectLandmarksWithStatus(nimagna::cv_wrapper::Point3f* poseLandmarks) { + if (poseLandmarksPacket.IsEmpty()) { + return absl::CancelledError("Pose landmarks packet is empty."); + } - if (poseLandmarksPacket.IsEmpty()) { - return absl::CancelledError("Pose landmarks packet is empty."); - } + auto retrievedLandmarks = poseLandmarksPacket.Get<::mediapipe::NormalizedLandmarkList>(); - auto retrievedLandmarks = - poseLandmarksPacket - .Get<::mediapipe::NormalizedLandmarkList>(); + // Convert landmarks to cv::Point3f**. + const auto landmarksCount = retrievedLandmarks.landmark_size(); - // Convert landmarks to cv::Point3f**. - const auto landmarksCount = retrievedLandmarks.landmark_size(); + for (int j = 0; j < landmarksCount; ++j) { + const auto& landmark = retrievedLandmarks.landmark(j); + poseLandmarks[j].x = landmark.x(); + poseLandmarks[j].y = landmark.y(); + poseLandmarks[j].z = landmark.z(); + } - for (int j = 0; j < landmarksCount; ++j) { - const auto& landmark = retrievedLandmarks.landmark(j); - poseLandmarks[j].x = landmark.x(); - poseLandmarks[j].y = landmark.y(); - poseLandmarks[j].z = landmark.z(); - } + return absl::OkStatus(); + } - return absl::OkStatus(); - } + nimagna::cv_wrapper::Point3f* lastDetectedLandmarks() { return poseLandmarks; } - nimagna::cv_wrapper::Point3f* lastDetectedLandmarks() { - return poseLandmarks; - } + cv::Mat lastSegmentedFrame() { return segmentedMask; } - cv::Mat lastSegmentedFrame() { - return segmentedMask; - } + static constexpr size_t kLandmarksCount = 33u; - static constexpr size_t kLandmarksCount = 33u; - -private: - mediapipe::Packet poseLandmarksPacket; - cv::Mat segmentedMask; - nimagna::cv_wrapper::Point3f poseLandmarks[kLandmarksCount]; - std::unique_ptr posePresencePollerPtr; - std::unique_ptr maskPollerPtr; - std::unique_ptr landmarksPollerPtr; - mediapipe::CalculatorGraph graph; - const char* kInputStream = "input_video"; - const char* kOutputSegmentationStream = "segmentation_mask"; - const char* kOutpuLandmarksStream = "pose_landmarks"; - const char* kOutpuPosePresenceStream = "pose_presence"; + private: + mediapipe::Packet poseLandmarksPacket; + cv::Mat segmentedMask; + nimagna::cv_wrapper::Point3f poseLandmarks[kLandmarksCount]; + std::unique_ptr posePresencePollerPtr; + std::unique_ptr maskPollerPtr; + std::unique_ptr landmarksPollerPtr; + mediapipe::CalculatorGraph graph; + const char* kInputStream = "input_video"; + const char* kOutputSegmentationStream = "segmentation_mask"; + const char* kOutpuLandmarksStream = "pose_landmarks"; + const char* kOutpuPosePresenceStream = "pose_presence"; }; namespace nimagna { - PoseTracking::PoseTracking(const char* calculatorGraphConfigFile) { - mImplementation = new PoseTrackingImpl(calculatorGraphConfigFile); - } - - bool PoseTracking::processFrame(const cv_wrapper::Mat& inputRGB8Bit) { - const auto frame = cv::Mat(inputRGB8Bit.rows, inputRGB8Bit.cols, CV_8UC3, inputRGB8Bit.data); - return mImplementation->processFrame(frame); - } - - cv_wrapper::Point3f* PoseTracking::lastDetectedLandmarks() { - return mImplementation->lastDetectedLandmarks(); - } - - cv_wrapper::Mat PoseTracking::lastSegmentedFrame() { - const cv::Mat result = mImplementation->lastSegmentedFrame(); - - return cv_wrapper::Mat(result.rows, result.cols, result.data); - } - +PoseTracking::PoseTracking(const char* calculatorGraphConfigFile) { + mImplementation = new PoseTrackingImpl(calculatorGraphConfigFile); } + +bool PoseTracking::processFrame(const cv_wrapper::Mat& inputRGB8Bit) { + const auto frame = cv::Mat(inputRGB8Bit.rows, inputRGB8Bit.cols, CV_8UC3, inputRGB8Bit.data); + return mImplementation->processFrame(frame); +} + +cv_wrapper::Point3f* PoseTracking::lastDetectedLandmarks() { + return mImplementation->lastDetectedLandmarks(); +} + +cv_wrapper::Mat PoseTracking::lastSegmentedFrame() { + const cv::Mat result = mImplementation->lastSegmentedFrame(); + + return cv_wrapper::Mat(result.rows, result.cols, result.data); +} + +} // namespace nimagna diff --git a/mediapipe/pose_tracking_dll/pose_tracking.h b/mediapipe/pose_tracking_dll/pose_tracking.h index 05c017b78..b521aef9e 100644 --- a/mediapipe/pose_tracking_dll/pose_tracking.h +++ b/mediapipe/pose_tracking_dll/pose_tracking.h @@ -10,92 +10,92 @@ class PoseTrackingImpl; namespace nimagna { - namespace cv_wrapper { - struct Point2f { - float x = 0; - float y = 0; +namespace cv_wrapper { +struct Point2f { + float x = 0; + float y = 0; - Point2f() = default; - Point2f(float x, float y) : x(x), y(y) {} - }; - struct Point3f { - float x = 0; - float y = 0; - float z = 0; + Point2f() = default; + Point2f(float x, float y) : x(x), y(y) {} +}; +struct Point3f { + float x = 0; + float y = 0; + float z = 0; - Point3f() = default; - Point3f(float x, float y, float z) : x(x), y(y), z(z) {} - }; + Point3f() = default; + Point3f(float x, float y, float z) : x(x), y(y), z(z) {} +}; - struct Rect { - int x = 0; - int y = 0; - int width = 0; - int height = 0; +struct Rect { + int x = 0; + int y = 0; + int width = 0; + int height = 0; - Rect() = default; - Rect(int x, int y, int width, int height) : x(x), y(y), width(width), height(height) {} - }; + Rect() = default; + Rect(int x, int y, int width, int height) : x(x), y(y), width(width), height(height) {} +}; - struct Mat { - int rows = 0; - int cols = 0; - unsigned char* data = 0; +struct Mat { + int rows = 0; + int cols = 0; + unsigned char* data = 0; - Mat(int rows, int cols, unsigned char* data) : rows(rows), cols(cols), data(data) {} - }; - } + Mat(int rows, int cols, unsigned char* data) : rows(rows), cols(cols), data(data) {} +}; +} // namespace cv_wrapper - class DLLEXPORT PoseTracking { - public: - static constexpr size_t landmarksCount = 33u; - enum LandmarkNames { - NOSE = 0, - LEFT_EYE_INNER, - LEFT_EYE, - LEFT_EYE_OUTER, - RIGHT_EYE_INNER, - RIGHT_EYE, - RIGHT_EYE_OUTER, - LEFT_EAR, - RIGHT_EAR, - MOUTH_LEFT, - MOUTH_RIGHT, - LEFT_SHOULDER, - RIGHT_SHOULDER, - LEFT_ELBOW, - RIGHT_ELBOW, - LEFT_WRIST, - RIGHT_WRIST, - LEFT_PINKY, - RIGHT_PINKY, - LEFT_INDEX, - RIGHT_INDEX, - LEFT_THUMB, - RIGHT_THUMB, - LEFT_HIP, - RIGHT_HIP, - LEFT_KNEE, - RIGHT_KNEE, - LEFT_ANKLE, - RIGHT_ANKLE, - LEFT_HEEL, - RIGHT_HEEL, - LEFT_FOOT_INDEX, - RIGHT_FOOT_INDEX, - COUNT = landmarksCount - }; +class DLLEXPORT PoseTracking { + public: + static constexpr size_t landmarksCount = 33u; + enum LandmarkNames { + NOSE = 0, + LEFT_EYE_INNER, + LEFT_EYE, + LEFT_EYE_OUTER, + RIGHT_EYE_INNER, + RIGHT_EYE, + RIGHT_EYE_OUTER, + LEFT_EAR, + RIGHT_EAR, + MOUTH_LEFT, + MOUTH_RIGHT, + LEFT_SHOULDER, + RIGHT_SHOULDER, + LEFT_ELBOW, + RIGHT_ELBOW, + LEFT_WRIST, + RIGHT_WRIST, + LEFT_PINKY, + RIGHT_PINKY, + LEFT_INDEX, + RIGHT_INDEX, + LEFT_THUMB, + RIGHT_THUMB, + LEFT_HIP, + RIGHT_HIP, + LEFT_KNEE, + RIGHT_KNEE, + LEFT_ANKLE, + RIGHT_ANKLE, + LEFT_HEEL, + RIGHT_HEEL, + LEFT_FOOT_INDEX, + RIGHT_FOOT_INDEX, + COUNT = landmarksCount + }; - PoseTracking(const char* calculatorGraphConfigFile); - ~PoseTracking() { delete mImplementation; } + PoseTracking(const char* calculatorGraphConfigFile); + ~PoseTracking() { delete mImplementation; } - bool processFrame(const cv_wrapper::Mat& inputRGB8Bit); - cv_wrapper::Mat lastSegmentedFrame(); - cv_wrapper::Point3f* lastDetectedLandmarks(); + bool processFrame(const cv_wrapper::Mat& inputRGB8Bit); + cv_wrapper::Mat lastSegmentedFrame(); + cv_wrapper::Point3f* lastDetectedLandmarks(); - private: - PoseTrackingImpl* mImplementation; - }; -} + private: + PoseTrackingImpl* mImplementation; +}; +} // namespace nimagna #endif From 365eb9a1ab71c7328df3969856976b4d97583f26 Mon Sep 17 00:00:00 2001 From: Maksym Walczak Date: Wed, 5 Jan 2022 11:35:04 +0100 Subject: [PATCH 11/14] Fix formatting in readme --- mediapipe/pose_tracking_dll/README.md | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/mediapipe/pose_tracking_dll/README.md b/mediapipe/pose_tracking_dll/README.md index b47ce0294..6307e4fe8 100644 --- a/mediapipe/pose_tracking_dll/README.md +++ b/mediapipe/pose_tracking_dll/README.md @@ -14,9 +14,10 @@ IMPORTANT: The tutorial does not specify which version of Bazel to install. Inst ## How to build Assuming you're in the root of the repository: -`cd mediapipe` - -`bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 pose_tracking_dll:pose_tracking_cpu` +``` +cd mediapipe +bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 pose_tracking_dll:pose_tracking_cpu +``` Alternatively `dbg` can be used in place of `opt` to build the library with debug symbols in Visual Studio pdb format. From 50a6d5cbe9d66a0293781d56443e062cace9e110 Mon Sep 17 00:00:00 2001 From: MaksymAtNimagna <88328636+MaksymAtNimagna@users.noreply.github.com> Date: Wed, 5 Jan 2022 11:42:27 +0100 Subject: [PATCH 12/14] Update mediapipe/pose_tracking_dll/README.md Co-authored-by: Xavier Valls --- mediapipe/pose_tracking_dll/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mediapipe/pose_tracking_dll/README.md b/mediapipe/pose_tracking_dll/README.md index 6307e4fe8..6165f1b47 100644 --- a/mediapipe/pose_tracking_dll/README.md +++ b/mediapipe/pose_tracking_dll/README.md @@ -21,7 +21,7 @@ bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 pose_tracking_dll:pose_track Alternatively `dbg` can be used in place of `opt` to build the library with debug symbols in Visual Studio pdb format. -The results will be stored in bazel-bin\mediapipe\pose_tracking_dll folder. +The results will be stored in the bazel-bin\mediapipe\pose_tracking_dll folder. ## How to use Go to bazel-bin\mediapipe\pose_tracking_dll From 71998bc650c4003f0238b5c7f223b9319dd8cf0c Mon Sep 17 00:00:00 2001 From: MaksymAtNimagna <88328636+MaksymAtNimagna@users.noreply.github.com> Date: Wed, 5 Jan 2022 11:42:33 +0100 Subject: [PATCH 13/14] Update mediapipe/pose_tracking_dll/README.md Co-authored-by: Xavier Valls --- mediapipe/pose_tracking_dll/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mediapipe/pose_tracking_dll/README.md b/mediapipe/pose_tracking_dll/README.md index 6165f1b47..6e4f483c7 100644 --- a/mediapipe/pose_tracking_dll/README.md +++ b/mediapipe/pose_tracking_dll/README.md @@ -30,4 +30,4 @@ Link pose_tracking_cpu.lib and pose_tracking_lib.dll.if.lib statically in your p Make sure the opencv_world3410.dll and pose_tracking_lib.dll are accessible in your working directory. -Use mediapipe\pose_tracking_dll\pose_tracking.h header file to access the methods of the library. +Use the mediapipe\pose_tracking_dll\pose_tracking.h header file to access the methods of the library. From 38f4da8a11662fefdfffdb310f23039a903fa519 Mon Sep 17 00:00:00 2001 From: Xavier Valls Date: Thu, 6 Jan 2022 11:42:21 +0100 Subject: [PATCH 14/14] Update installation step in README.md --- mediapipe/pose_tracking_dll/README.md | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/mediapipe/pose_tracking_dll/README.md b/mediapipe/pose_tracking_dll/README.md index 6e4f483c7..fb4b731ac 100644 --- a/mediapipe/pose_tracking_dll/README.md +++ b/mediapipe/pose_tracking_dll/README.md @@ -9,14 +9,17 @@ Currently, the following features are supported: ## Prerequisites Follow the guidelines on the official Mediapipe website: https://google.github.io/mediapipe/getting_started/install.html#installing-on-windows -IMPORTANT: The tutorial does not specify which version of Bazel to install. Install Bazel version 3.7.2 +IMPORTANT: The tutorial does not specify which version of Bazel to install. Install Bazel version 3.7.2. The OpenCV version used by default in mediapipe is 3.4.10. + +If you are using a different OpenCV version, adapt the `OPENCV_VERSION` variable in the file `mediapipe/external/opencv_.BUILD` to the one installed in the system (https://github.com/google/mediapipe/issues/1926#issuecomment-825874197). + ## How to build Assuming you're in the root of the repository: ``` cd mediapipe -bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 pose_tracking_dll:pose_tracking_cpu +bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 --action_env PYTHON_BIN_PATH= pose_tracking_dll:pose_tracking_cpu ``` Alternatively `dbg` can be used in place of `opt` to build the library with debug symbols in Visual Studio pdb format.