Added pybind version of the graph runner.

This commit is contained in:
xiong-jie-y 2020-06-21 23:16:44 +09:00
parent 46d914e9a4
commit 5498c65e14
3 changed files with 176 additions and 27 deletions

BUILD

@@ -97,5 +97,13 @@ pybind_extension(
    name = "cameravtuber2",
    srcs = [
        "cameravtuber_pybind.cc"
    ],
    deps = [
        ":demo_run_graph_main_gpu",
        "//mediapipe/calculators/ipc:zmq_calculator",
        "//mediapipe/calculators/image:sobel_edges_calculator",
        "//mediapipe/graphs/hand_tracking:multi_hand_mobile_calculators",
        "//mediapipe/graphs/face_mesh:desktop_live_gpu_calculators",
        "//mediapipe/calculators/video:opencv_video_encoder_calculator",
    ],
)
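A note on the new deps: a MediaPipe graph resolves its calculators by name at runtime from whatever was linked into the binary, so every calculator a .pbtxt references has to be linked in here even though nothing includes their headers. A quick import smoke test catches a missing dep early; the output path below is a placeholder, since the real one depends on the package this BUILD file lives in.

# Hypothetical smoke test; adjust sys.path to wherever bazel writes the
# cameravtuber2 shared library for this target.
import sys
sys.path.insert(0, "bazel-bin/path/to/package")  # placeholder path
import cameravtuber2
print(cameravtuber2.GraphRunner)  # importable class means the link worked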

cameravtuber_pybind.cc

@@ -1,35 +1,134 @@
#include <pybind11/pybind11.h>
#include <pybind11/numpy.h>

#include "mediapipe/framework/calculator_framework.h"
#include "mediapipe/framework/formats/image_frame.h"
#include "mediapipe/framework/formats/image_frame_opencv.h"
#include "mediapipe/framework/port/file_helpers.h"
#include "mediapipe/framework/port/parse_text_proto.h"
#include "mediapipe/framework/port/opencv_imgproc_inc.h"
#include "mediapipe/gpu/gl_calculator_helper.h"
#include "mediapipe/gpu/gpu_shared_data_internal.h"

namespace py = pybind11;

constexpr char kInputStream[] = "input_video";
constexpr char kOutputStream[] = "output_video";

class GraphRunner
{
public:
    GraphRunner(const std::string &graph_path)
    {
        std::string calculator_graph_config_contents;
        mediapipe::file::GetContents(
            graph_path, &calculator_graph_config_contents);
        LOG(INFO) << "Get calculator graph config contents: "
                  << calculator_graph_config_contents;
        config = mediapipe::ParseTextProtoOrDie<mediapipe::CalculatorGraphConfig>(
            calculator_graph_config_contents);

        LOG(INFO) << "Initialize the calculator graph.";
        graph.Initialize(config);

        LOG(INFO) << "Initialize the GPU.";
        std::shared_ptr<mediapipe::GpuResources> gpu_resources =
            mediapipe::GpuResources::Create().ValueOrDie();
        graph.SetGpuResources(std::move(gpu_resources));
        gpu_helper.InitializeForTest(graph.GetGpuResources().get());

        poller = std::make_shared<mediapipe::OutputStreamPoller>(
            graph.AddOutputStreamPoller(kOutputStream).ValueOrDie());
        graph.StartRun({});
    }
    py::array_t<unsigned char> ProcessFrame(py::array_t<unsigned char> &input)
    {
        if (input.ndim() != 3)
            throw std::runtime_error("input image must have 3 dimensions (H, W, C)");
        py::buffer_info buf = input.request();
        cv::Mat mat(buf.shape[0], buf.shape[1], CV_8UC3, (unsigned char *)buf.ptr);

        // Wrap the Mat into an ImageFrame.
        auto input_frame = absl::make_unique<mediapipe::ImageFrame>(
            mediapipe::ImageFormat::SRGB, mat.cols, mat.rows,
            mediapipe::ImageFrame::kGlDefaultAlignmentBoundary);
        cv::Mat input_frame_mat = mediapipe::formats::MatView(input_frame.get());
        mat.copyTo(input_frame_mat);

        // Prepare and add the graph input packet.
        size_t frame_timestamp_us =
            (double)cv::getTickCount() / (double)cv::getTickFrequency() * 1e6;
        gpu_helper.RunInGlContext([this, &input_frame, &frame_timestamp_us]() -> ::mediapipe::Status {
            // Convert ImageFrame to GpuBuffer.
            auto texture = gpu_helper.CreateSourceTexture(*input_frame.get());
            auto gpu_frame = texture.GetFrame<mediapipe::GpuBuffer>();
            glFlush();
            texture.Release();
            // Send the GPU image packet into the graph.
            graph.AddPacketToInputStream(
                kInputStream, mediapipe::Adopt(gpu_frame.release())
                                  .At(mediapipe::Timestamp(frame_timestamp_us)));
            return ::mediapipe::OkStatus();
        });

        // Get the graph result packet, or fail if none arrives.
        mediapipe::Packet packet;
        if (!poller->Next(&packet))
            throw std::runtime_error("error getting packet from the output stream");
        std::unique_ptr<mediapipe::ImageFrame> output_frame;

        // Convert GpuBuffer to ImageFrame.
        gpu_helper.RunInGlContext(
            [this, &packet, &output_frame]() -> ::mediapipe::Status {
                auto &gpu_frame = packet.Get<mediapipe::GpuBuffer>();
                auto texture = gpu_helper.CreateSourceTexture(gpu_frame);
                output_frame = absl::make_unique<mediapipe::ImageFrame>(
                    mediapipe::ImageFormatForGpuBufferFormat(gpu_frame.format()),
                    gpu_frame.width(), gpu_frame.height(),
                    mediapipe::ImageFrame::kGlDefaultAlignmentBoundary);
                gpu_helper.BindFramebuffer(texture);
                const auto info =
                    mediapipe::GlTextureInfoForGpuBufferFormat(gpu_frame.format(), 0);
                glReadPixels(0, 0, texture.width(), texture.height(), info.gl_format,
                             info.gl_type, output_frame->MutablePixelData());
                glFlush();
                texture.Release();
                return ::mediapipe::OkStatus();
            });

        // Copy the output pixels into a flat numpy array for the Python caller.
        cv::Mat output_frame_mat = mediapipe::formats::MatView(output_frame.get());
        int size = output_frame_mat.channels() * output_frame_mat.size().width *
                   output_frame_mat.size().height;
        py::array_t<unsigned char> result(size);
        py::buffer_info buf2 = result.request();
        auto pt = output_frame_mat.data;
        unsigned char *dstPt = (unsigned char *)buf2.ptr;
        for (int i = 0; i < size; i++)
        {
            dstPt[i] = pt[i];
        }
        return result;
    }

private:
    mediapipe::CalculatorGraphConfig config;
    mediapipe::CalculatorGraph graph;
    mediapipe::GlCalculatorHelper gpu_helper;
    std::shared_ptr<mediapipe::OutputStreamPoller> poller;
};
PYBIND11_MODULE(cameravtuber2, m)
{
    py::class_<GraphRunner>(m, "GraphRunner")
        .def(py::init<const std::string &>())
        .def("process_frame", &GraphRunner::ProcessFrame);
}
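The binding above fixes the API contract: GraphRunner takes the path to a graph .pbtxt with input_video/output_video streams, and process_frame takes an H x W x 3 uint8 array (RGB order, matching ImageFormat::SRGB) and returns a flat uint8 buffer of the output stream's pixels, leaving the reshape to the caller. A minimal sketch of driving it from Python, assuming the module is importable; the graph path and resolution are placeholders, and a working GL context plus the graph's model files are needed to actually run it.

import numpy as np
import cameravtuber2

runner = cameravtuber2.GraphRunner("some_graph.pbtxt")  # placeholder graph
frame = np.zeros((360, 640, 3), dtype=np.uint8)  # H x W x 3, RGB, uint8
out = runner.process_frame(frame)
rgba = out.reshape((360, 640, 4))  # caller must know the output size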

run_graph.py Normal file

@@ -0,0 +1,42 @@
import time

import streamlit as st
import cv2

import cameravtuber2

runner = cameravtuber2.GraphRunner("mediapipe/graphs/hand_tracking/hand_face_detection_no_gating.pbtxt")


@st.cache(allow_output_mutation=True)
def get_frames():
    cap = cv2.VideoCapture("hand_motion.mp4")
    frames = []
    while True:
        ret, frame = cap.read()
        if frame is None:
            break
        # The graph's SRGB input expects RGB order, so convert from OpenCV's BGR.
        rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        frames.append(rgb)
    return frames
frames = get_frames()
frame_idx = st.slider('frame idx', 0, len(frames) - 1)
# st.image(frames[frame_idx])
# st.write(frames[frame_idx].shape)
frame = frames[frame_idx]
start = time.time()
new_frame = runner.process_frame(frame)
end = time.time()
st.write(end - start)
st.write(new_frame.shape)
new_frame = new_frame.reshape((360,640,4))
st.image(new_frame)
# cameravtuber2.GraphRunner("mediapipe/graphs/hand_tracking/hand_face_tracking_desktop.pbtxt")
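One detail worth noting in run_graph.py: the flat buffer from process_frame reshapes to (360, 640, 4) because the GPU graph emits a 4-channel frame at the demo video's 640x360 resolution; other inputs need other numbers. If the extra channel gets in the way, slicing off alpha before display is enough; a small sketch, assuming new_frame came back from runner.process_frame:

h, w = 360, 640  # must match the graph's output resolution
rgba = new_frame.reshape((h, w, 4))
st.image(rgba[:, :, :3])  # drop alpha; st.image renders RGB directly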