Merge pull request #4940 from priankakariatyml:ios-pose-landmarker-implementation
PiperOrigin-RevId: 580578919
This commit is contained in:
commit
65e74dde0f
35
mediapipe/tasks/ios/test/vision/pose_landmarker/utils/BUILD
Normal file
35
mediapipe/tasks/ios/test/vision/pose_landmarker/utils/BUILD
Normal file
|
@ -0,0 +1,35 @@
|
||||||
|
# Copyright 2023 The MediaPipe Authors.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
|
||||||
|
package(default_visibility = ["//mediapipe/tasks:internal"])
|
||||||
|
|
||||||
|
licenses(["notice"])
|
||||||
|
|
||||||
|
objc_library(
|
||||||
|
name = "MPPPoseLandmarkerResultProtobufHelpers",
|
||||||
|
srcs = ["sources/MPPPoseLandmarkerResult+ProtobufHelpers.mm"],
|
||||||
|
hdrs = ["sources/MPPPoseLandmarkerResult+ProtobufHelpers.h"],
|
||||||
|
copts = [
|
||||||
|
"-ObjC++",
|
||||||
|
"-std=c++17",
|
||||||
|
"-x objective-c++",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
"//mediapipe/tasks/cc/components/containers/proto:landmarks_detection_result_cc_proto",
|
||||||
|
"//mediapipe/tasks/ios/common/utils:NSStringHelpers",
|
||||||
|
"//mediapipe/tasks/ios/test/vision/utils:parse_proto_utils",
|
||||||
|
"//mediapipe/tasks/ios/vision/pose_landmarker:MPPPoseLandmarkerResult",
|
||||||
|
"//mediapipe/tasks/ios/vision/pose_landmarker/utils:MPPPoseLandmarkerResultHelpers",
|
||||||
|
],
|
||||||
|
)
|
|
@ -0,0 +1,26 @@
|
||||||
|
// Copyright 2023 The MediaPipe Authors.
|
||||||
|
//
|
||||||
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
// you may not use this file except in compliance with the License.
|
||||||
|
// You may obtain a copy of the License at
|
||||||
|
//
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
//
|
||||||
|
// Unless required by applicable law or agreed to in writing, software
|
||||||
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
// See the License for the specific language governing permissions and
|
||||||
|
// limitations under the License.
|
||||||
|
|
||||||
|
#import <Foundation/Foundation.h>
|
||||||
|
#import "mediapipe/tasks/ios/vision/pose_landmarker/sources/MPPPoseLandmarkerResult.h"
|
||||||
|
|
||||||
|
NS_ASSUME_NONNULL_BEGIN
|
||||||
|
@interface MPPPoseLandmarkerResult (ProtobufHelpers)
|
||||||
|
|
||||||
|
+ (MPPPoseLandmarkerResult *)poseLandmarkerResultFromProtobufFileWithName:(NSString *)fileName
|
||||||
|
shouldRemoveZPosition:(BOOL)removeZPosition;
|
||||||
|
|
||||||
|
@end
|
||||||
|
|
||||||
|
NS_ASSUME_NONNULL_END
|
|
@ -0,0 +1,55 @@
|
||||||
|
// Copyright 2023 The MediaPipe Authors.
|
||||||
|
//
|
||||||
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
// you may not use this file except in compliance with the License.
|
||||||
|
// You may obtain a copy of the License at
|
||||||
|
//
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
//
|
||||||
|
// Unless required by applicable law or agreed to in writing, software
|
||||||
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
// See the License for the specific language governing permissions and
|
||||||
|
// limitations under the License.
|
||||||
|
|
||||||
|
#import "mediapipe/tasks/ios/test/vision/pose_landmarker/utils/sources/MPPPoseLandmarkerResult+ProtobufHelpers.h"
|
||||||
|
|
||||||
|
#import "mediapipe/tasks/ios/common/utils/sources/NSString+Helpers.h"
|
||||||
|
#import "mediapipe/tasks/ios/vision/pose_landmarker/utils/sources/MPPPoseLandmarkerResult+Helpers.h"
|
||||||
|
|
||||||
|
#include "mediapipe/tasks/cc/components/containers/proto/landmarks_detection_result.pb.h"
|
||||||
|
#include "mediapipe/tasks/ios/test/vision/utils/sources/parse_proto_utils.h"
|
||||||
|
|
||||||
|
namespace {
|
||||||
|
using LandmarksDetectionResultProto =
|
||||||
|
::mediapipe::tasks::containers::proto::LandmarksDetectionResult;
|
||||||
|
using ::mediapipe::tasks::ios::test::vision::utils::get_proto_from_pbtxt;
|
||||||
|
} // anonymous namespace
|
||||||
|
|
||||||
|
@implementation MPPPoseLandmarkerResult (ProtobufHelpers)
|
||||||
|
|
||||||
|
+ (MPPPoseLandmarkerResult *)poseLandmarkerResultFromProtobufFileWithName:(NSString *)fileName
|
||||||
|
shouldRemoveZPosition:(BOOL)removeZPosition {
|
||||||
|
LandmarksDetectionResultProto landmarkDetectionResultProto;
|
||||||
|
|
||||||
|
if (!get_proto_from_pbtxt(fileName.cppString, landmarkDetectionResultProto).ok()) {
|
||||||
|
return nil;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (removeZPosition) {
|
||||||
|
// Remove z position of landmarks, because they are not used in correctness testing. For video
|
||||||
|
// or live stream mode, the z positions varies a lot during tracking from frame to frame.
|
||||||
|
for (int i = 0; i < landmarkDetectionResultProto.landmarks().landmark().size(); i++) {
|
||||||
|
auto &landmark = *landmarkDetectionResultProto.mutable_landmarks()->mutable_landmark(i);
|
||||||
|
landmark.clear_z();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return [MPPPoseLandmarkerResult
|
||||||
|
poseLandmarkerResultWithLandmarksProto:{landmarkDetectionResultProto.landmarks()}
|
||||||
|
worldLandmarksProto:{landmarkDetectionResultProto.world_landmarks()}
|
||||||
|
segmentationMasks:nullptr
|
||||||
|
timestampInMilliseconds:0];
|
||||||
|
}
|
||||||
|
|
||||||
|
@end
|
|
@ -17,14 +17,14 @@
|
||||||
|
|
||||||
#include "mediapipe/tasks/cc/components/containers/proto/classifications.pb.h"
|
#include "mediapipe/tasks/cc/components/containers/proto/classifications.pb.h"
|
||||||
|
|
||||||
static const int kMicroSecondsPerMilliSecond = 1000;
|
static const int kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
namespace {
|
namespace {
|
||||||
using ClassificationResultProto =
|
using ClassificationResultProto =
|
||||||
::mediapipe::tasks::components::containers::proto::ClassificationResult;
|
::mediapipe::tasks::components::containers::proto::ClassificationResult;
|
||||||
} // namespace
|
} // namespace
|
||||||
|
|
||||||
#define int kMicroSecondsPerMilliSecond = 1000;
|
#define int kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
@implementation MPPLanguageDetectorResult (Helpers)
|
@implementation MPPLanguageDetectorResult (Helpers)
|
||||||
|
|
||||||
|
@ -36,7 +36,7 @@ using ClassificationResultProto =
|
||||||
return [MPPLanguageDetectorResult
|
return [MPPLanguageDetectorResult
|
||||||
languageDetectorResultWithClassificationResult:classificationResult
|
languageDetectorResultWithClassificationResult:classificationResult
|
||||||
timestampInMilliseconds:(NSInteger)(packet.Timestamp().Value() /
|
timestampInMilliseconds:(NSInteger)(packet.Timestamp().Value() /
|
||||||
kMicroSecondsPerMilliSecond)];
|
kMicrosecondsPerMillisecond)];
|
||||||
}
|
}
|
||||||
|
|
||||||
+ (MPPLanguageDetectorResult *)
|
+ (MPPLanguageDetectorResult *)
|
||||||
|
|
|
@ -17,7 +17,7 @@
|
||||||
|
|
||||||
#include "mediapipe/tasks/cc/components/containers/proto/classifications.pb.h"
|
#include "mediapipe/tasks/cc/components/containers/proto/classifications.pb.h"
|
||||||
|
|
||||||
static const int kMicroSecondsPerMilliSecond = 1000;
|
static const int kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
namespace {
|
namespace {
|
||||||
using ClassificationResultProto =
|
using ClassificationResultProto =
|
||||||
|
@ -25,7 +25,7 @@ using ClassificationResultProto =
|
||||||
using ::mediapipe::Packet;
|
using ::mediapipe::Packet;
|
||||||
} // namespace
|
} // namespace
|
||||||
|
|
||||||
#define int kMicroSecondsPerMilliSecond = 1000;
|
#define int kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
@implementation MPPTextClassifierResult (Helpers)
|
@implementation MPPTextClassifierResult (Helpers)
|
||||||
|
|
||||||
|
@ -36,7 +36,7 @@ using ::mediapipe::Packet;
|
||||||
return [[MPPTextClassifierResult alloc]
|
return [[MPPTextClassifierResult alloc]
|
||||||
initWithClassificationResult:classificationResult
|
initWithClassificationResult:classificationResult
|
||||||
timestampInMilliseconds:(NSInteger)(packet.Timestamp().Value() /
|
timestampInMilliseconds:(NSInteger)(packet.Timestamp().Value() /
|
||||||
kMicroSecondsPerMilliSecond)];
|
kMicrosecondsPerMillisecond)];
|
||||||
}
|
}
|
||||||
|
|
||||||
@end
|
@end
|
||||||
|
|
|
@ -17,14 +17,14 @@
|
||||||
|
|
||||||
#include "mediapipe/tasks/cc/components/containers/proto/embeddings.pb.h"
|
#include "mediapipe/tasks/cc/components/containers/proto/embeddings.pb.h"
|
||||||
|
|
||||||
static const int kMicroSecondsPerMilliSecond = 1000;
|
static const int kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
namespace {
|
namespace {
|
||||||
using EmbeddingResultProto = ::mediapipe::tasks::components::containers::proto::EmbeddingResult;
|
using EmbeddingResultProto = ::mediapipe::tasks::components::containers::proto::EmbeddingResult;
|
||||||
using ::mediapipe::Packet;
|
using ::mediapipe::Packet;
|
||||||
} // namespace
|
} // namespace
|
||||||
|
|
||||||
#define int kMicroSecondsPerMilliSecond = 1000;
|
#define int kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
@implementation MPPTextEmbedderResult (Helpers)
|
@implementation MPPTextEmbedderResult (Helpers)
|
||||||
|
|
||||||
|
@ -35,7 +35,7 @@ using ::mediapipe::Packet;
|
||||||
return [[MPPTextEmbedderResult alloc]
|
return [[MPPTextEmbedderResult alloc]
|
||||||
initWithEmbeddingResult:embeddingResult
|
initWithEmbeddingResult:embeddingResult
|
||||||
timestampInMilliseconds:(NSInteger)(packet.Timestamp().Value() /
|
timestampInMilliseconds:(NSInteger)(packet.Timestamp().Value() /
|
||||||
kMicroSecondsPerMilliSecond)];
|
kMicrosecondsPerMillisecond)];
|
||||||
}
|
}
|
||||||
|
|
||||||
@end
|
@end
|
||||||
|
|
|
@ -18,7 +18,7 @@
|
||||||
#include "mediapipe/framework/formats/image.h"
|
#include "mediapipe/framework/formats/image.h"
|
||||||
#include "mediapipe/framework/timestamp.h"
|
#include "mediapipe/framework/timestamp.h"
|
||||||
|
|
||||||
static const NSUInteger kMicroSecondsPerMilliSecond = 1000;
|
static const NSUInteger kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
namespace {
|
namespace {
|
||||||
using ::mediapipe::Image;
|
using ::mediapipe::Image;
|
||||||
|
@ -51,7 +51,7 @@ using ::mediapipe::Timestamp;
|
||||||
}
|
}
|
||||||
|
|
||||||
return MakePacket<Image>(std::move(imageFrame))
|
return MakePacket<Image>(std::move(imageFrame))
|
||||||
.At(Timestamp(int64(timestampInMilliseconds * kMicroSecondsPerMilliSecond)));
|
.At(Timestamp(int64(timestampInMilliseconds * kMicrosecondsPerMillisecond)));
|
||||||
}
|
}
|
||||||
|
|
||||||
+ (Packet)createPacketWithNormalizedRect:(NormalizedRect &)normalizedRect {
|
+ (Packet)createPacketWithNormalizedRect:(NormalizedRect &)normalizedRect {
|
||||||
|
@ -61,7 +61,7 @@ using ::mediapipe::Timestamp;
|
||||||
+ (Packet)createPacketWithNormalizedRect:(NormalizedRect &)normalizedRect
|
+ (Packet)createPacketWithNormalizedRect:(NormalizedRect &)normalizedRect
|
||||||
timestampInMilliseconds:(NSInteger)timestampInMilliseconds {
|
timestampInMilliseconds:(NSInteger)timestampInMilliseconds {
|
||||||
return MakePacket<NormalizedRect>(std::move(normalizedRect))
|
return MakePacket<NormalizedRect>(std::move(normalizedRect))
|
||||||
.At(Timestamp(int64(timestampInMilliseconds * kMicroSecondsPerMilliSecond)));
|
.At(Timestamp(int64(timestampInMilliseconds * kMicrosecondsPerMillisecond)));
|
||||||
}
|
}
|
||||||
|
|
||||||
@end
|
@end
|
||||||
|
|
|
@ -198,7 +198,7 @@ static NSString *const kTaskName = @"gestureRecognizer";
|
||||||
|
|
||||||
NSInteger timestampInMilliseconds =
|
NSInteger timestampInMilliseconds =
|
||||||
outputPacketMap[kImageOutStreamName.cppString].Timestamp().Value() /
|
outputPacketMap[kImageOutStreamName.cppString].Timestamp().Value() /
|
||||||
kMicroSecondsPerMilliSecond;
|
kMicrosecondsPerMillisecond;
|
||||||
dispatch_async(_callbackQueue, ^{
|
dispatch_async(_callbackQueue, ^{
|
||||||
[self.gestureRecognizerLiveStreamDelegate gestureRecognizer:self
|
[self.gestureRecognizerLiveStreamDelegate gestureRecognizer:self
|
||||||
didFinishRecognitionWithResult:result
|
didFinishRecognitionWithResult:result
|
||||||
|
|
|
@ -20,7 +20,7 @@
|
||||||
|
|
||||||
NS_ASSUME_NONNULL_BEGIN
|
NS_ASSUME_NONNULL_BEGIN
|
||||||
|
|
||||||
static const int kMicroSecondsPerMilliSecond = 1000;
|
static const int kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
@interface MPPGestureRecognizerResult (Helpers)
|
@interface MPPGestureRecognizerResult (Helpers)
|
||||||
|
|
||||||
|
|
|
@ -117,7 +117,7 @@ static const NSInteger kDefaultGestureIndex = -1;
|
||||||
handLandmarksPacket:(const Packet &)handLandmarksPacket
|
handLandmarksPacket:(const Packet &)handLandmarksPacket
|
||||||
worldLandmarksPacket:(const Packet &)worldLandmarksPacket {
|
worldLandmarksPacket:(const Packet &)worldLandmarksPacket {
|
||||||
NSInteger timestampInMilliseconds =
|
NSInteger timestampInMilliseconds =
|
||||||
(NSInteger)(handGesturesPacket.Timestamp().Value() / kMicroSecondsPerMilliSecond);
|
(NSInteger)(handGesturesPacket.Timestamp().Value() / kMicrosecondsPerMillisecond);
|
||||||
|
|
||||||
if (handGesturesPacket.IsEmpty()) {
|
if (handGesturesPacket.IsEmpty()) {
|
||||||
return [MPPGestureRecognizerResult
|
return [MPPGestureRecognizerResult
|
||||||
|
|
|
@ -222,7 +222,7 @@ static NSString *const kTaskName = @"handLandmarker";
|
||||||
|
|
||||||
NSInteger timestampInMilliseconds =
|
NSInteger timestampInMilliseconds =
|
||||||
outputPacketMap[kImageOutStreamName.cppString].Timestamp().Value() /
|
outputPacketMap[kImageOutStreamName.cppString].Timestamp().Value() /
|
||||||
kMicroSecondsPerMilliSecond;
|
kMicrosecondsPerMillisecond;
|
||||||
dispatch_async(_callbackQueue, ^{
|
dispatch_async(_callbackQueue, ^{
|
||||||
[self.handLandmarkerLiveStreamDelegate handLandmarker:self
|
[self.handLandmarkerLiveStreamDelegate handLandmarker:self
|
||||||
didFinishDetectionWithResult:result
|
didFinishDetectionWithResult:result
|
||||||
|
|
|
@ -20,7 +20,7 @@
|
||||||
|
|
||||||
NS_ASSUME_NONNULL_BEGIN
|
NS_ASSUME_NONNULL_BEGIN
|
||||||
|
|
||||||
static const int kMicroSecondsPerMilliSecond = 1000;
|
static const int kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
@interface MPPHandLandmarkerResult (Helpers)
|
@interface MPPHandLandmarkerResult (Helpers)
|
||||||
|
|
||||||
|
|
|
@ -95,7 +95,7 @@ using ::mediapipe::Packet;
|
||||||
worldLandmarksPacket:(const Packet &)worldLandmarksPacket
|
worldLandmarksPacket:(const Packet &)worldLandmarksPacket
|
||||||
handednessPacket:(const Packet &)handednessPacket {
|
handednessPacket:(const Packet &)handednessPacket {
|
||||||
NSInteger timestampInMilliseconds =
|
NSInteger timestampInMilliseconds =
|
||||||
(NSInteger)(landmarksPacket.Timestamp().Value() / kMicroSecondsPerMilliSecond);
|
(NSInteger)(landmarksPacket.Timestamp().Value() / kMicrosecondsPerMillisecond);
|
||||||
|
|
||||||
if (landmarksPacket.IsEmpty()) {
|
if (landmarksPacket.IsEmpty()) {
|
||||||
return [MPPHandLandmarkerResult
|
return [MPPHandLandmarkerResult
|
||||||
|
|
|
@ -43,7 +43,7 @@ static NSString *const kTaskGraphName =
|
||||||
@"mediapipe.tasks.vision.image_classifier.ImageClassifierGraph";
|
@"mediapipe.tasks.vision.image_classifier.ImageClassifierGraph";
|
||||||
static NSString *const kTaskName = @"imageClassifier";
|
static NSString *const kTaskName = @"imageClassifier";
|
||||||
|
|
||||||
static const int kMicroSecondsPerMilliSecond = 1000;
|
static const int kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
#define InputPacketMap(imagePacket, normalizedRectPacket) \
|
#define InputPacketMap(imagePacket, normalizedRectPacket) \
|
||||||
{ \
|
{ \
|
||||||
|
@ -221,7 +221,7 @@ static const int kMicroSecondsPerMilliSecond = 1000;
|
||||||
|
|
||||||
NSInteger timestampInMilliseconds =
|
NSInteger timestampInMilliseconds =
|
||||||
outputPacketMap[kImageOutStreamName.cppString].Timestamp().Value() /
|
outputPacketMap[kImageOutStreamName.cppString].Timestamp().Value() /
|
||||||
kMicroSecondsPerMilliSecond;
|
kMicrosecondsPerMillisecond;
|
||||||
dispatch_async(_callbackQueue, ^{
|
dispatch_async(_callbackQueue, ^{
|
||||||
[self.imageClassifierLiveStreamDelegate imageClassifier:self
|
[self.imageClassifierLiveStreamDelegate imageClassifier:self
|
||||||
didFinishClassificationWithResult:result
|
didFinishClassificationWithResult:result
|
||||||
|
|
|
@ -182,7 +182,7 @@ static NSString *const kTaskName = @"objectDetector";
|
||||||
|
|
||||||
NSInteger timestampInMilliseconds =
|
NSInteger timestampInMilliseconds =
|
||||||
outputPacketMap[kImageOutStreamName.cppString].Timestamp().Value() /
|
outputPacketMap[kImageOutStreamName.cppString].Timestamp().Value() /
|
||||||
kMicroSecondsPerMilliSecond;
|
kMicrosecondsPerMillisecond;
|
||||||
dispatch_async(_callbackQueue, ^{
|
dispatch_async(_callbackQueue, ^{
|
||||||
[self.objectDetectorLiveStreamDelegate objectDetector:self
|
[self.objectDetectorLiveStreamDelegate objectDetector:self
|
||||||
didFinishDetectionWithResult:result
|
didFinishDetectionWithResult:result
|
||||||
|
|
|
@ -18,7 +18,7 @@
|
||||||
|
|
||||||
NS_ASSUME_NONNULL_BEGIN
|
NS_ASSUME_NONNULL_BEGIN
|
||||||
|
|
||||||
static const int kMicroSecondsPerMilliSecond = 1000;
|
static const int kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
@interface MPPObjectDetectorResult (Helpers)
|
@interface MPPObjectDetectorResult (Helpers)
|
||||||
|
|
||||||
|
|
|
@ -27,7 +27,7 @@ using ::mediapipe::Packet;
|
||||||
(const Packet &)packet {
|
(const Packet &)packet {
|
||||||
|
|
||||||
NSInteger timestampInMilliseconds = (NSInteger)(packet.Timestamp().Value() /
|
NSInteger timestampInMilliseconds = (NSInteger)(packet.Timestamp().Value() /
|
||||||
kMicroSecondsPerMilliSecond);
|
kMicrosecondsPerMillisecond);
|
||||||
if (!packet.ValidateAsType<std::vector<DetectionProto>>().ok()) {
|
if (!packet.ValidateAsType<std::vector<DetectionProto>>().ok()) {
|
||||||
return [[MPPObjectDetectorResult alloc] initWithDetections:@[]
|
return [[MPPObjectDetectorResult alloc] initWithDetections:@[]
|
||||||
timestampInMilliseconds:timestampInMilliseconds];
|
timestampInMilliseconds:timestampInMilliseconds];
|
||||||
|
|
|
@ -47,13 +47,27 @@ objc_library(
|
||||||
|
|
||||||
objc_library(
|
objc_library(
|
||||||
name = "MPPPoseLandmarker",
|
name = "MPPPoseLandmarker",
|
||||||
|
srcs = ["sources/MPPPoseLandmarker.mm"],
|
||||||
hdrs = ["sources/MPPPoseLandmarker.h"],
|
hdrs = ["sources/MPPPoseLandmarker.h"],
|
||||||
|
copts = [
|
||||||
|
"-ObjC++",
|
||||||
|
"-std=c++17",
|
||||||
|
"-x objective-c++",
|
||||||
|
],
|
||||||
module_name = "MPPPoseLandmarker",
|
module_name = "MPPPoseLandmarker",
|
||||||
deps = [
|
deps = [
|
||||||
":MPPPoseLandmarkerOptions",
|
":MPPPoseLandmarkerOptions",
|
||||||
":MPPPoseLandmarkerResult",
|
":MPPPoseLandmarkerResult",
|
||||||
":MPPPoseLandmarksConnections",
|
":MPPPoseLandmarksConnections",
|
||||||
|
"//mediapipe/tasks/cc/vision/pose_landmarker:pose_landmarker_graph",
|
||||||
|
"//mediapipe/tasks/ios/common/utils:MPPCommonUtils",
|
||||||
|
"//mediapipe/tasks/ios/common/utils:NSStringHelpers",
|
||||||
"//mediapipe/tasks/ios/components/containers:MPPConnection",
|
"//mediapipe/tasks/ios/components/containers:MPPConnection",
|
||||||
|
"//mediapipe/tasks/ios/core:MPPTaskInfo",
|
||||||
"//mediapipe/tasks/ios/vision/core:MPPImage",
|
"//mediapipe/tasks/ios/vision/core:MPPImage",
|
||||||
|
"//mediapipe/tasks/ios/vision/core:MPPVisionPacketCreator",
|
||||||
|
"//mediapipe/tasks/ios/vision/core:MPPVisionTaskRunner",
|
||||||
|
"//mediapipe/tasks/ios/vision/pose_landmarker/utils:MPPPoseLandmarkerOptionsHelpers",
|
||||||
|
"//mediapipe/tasks/ios/vision/pose_landmarker/utils:MPPPoseLandmarkerResultHelpers",
|
||||||
],
|
],
|
||||||
)
|
)
|
||||||
|
|
|
@ -0,0 +1,220 @@
|
||||||
|
// Copyright 2023 The MediaPipe Authors.
|
||||||
|
//
|
||||||
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
// you may not use this file except in compliance with the License.
|
||||||
|
// You may obtain a copy of the License at
|
||||||
|
//
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
//
|
||||||
|
// Unless required by applicable law or agreed to in writing, software
|
||||||
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
// See the License for the specific language governing permissions and
|
||||||
|
// limitations under the License.
|
||||||
|
|
||||||
|
#import "mediapipe/tasks/ios/vision/pose_landmarker/sources/MPPPoseLandmarker.h"
|
||||||
|
|
||||||
|
#import "mediapipe/tasks/ios/common/utils/sources/MPPCommonUtils.h"
|
||||||
|
#import "mediapipe/tasks/ios/common/utils/sources/NSString+Helpers.h"
|
||||||
|
#import "mediapipe/tasks/ios/core/sources/MPPTaskInfo.h"
|
||||||
|
#import "mediapipe/tasks/ios/vision/core/sources/MPPVisionPacketCreator.h"
|
||||||
|
#import "mediapipe/tasks/ios/vision/core/sources/MPPVisionTaskRunner.h"
|
||||||
|
#import "mediapipe/tasks/ios/vision/pose_landmarker/sources/MPPPoseLandmarksConnections.h"
|
||||||
|
#import "mediapipe/tasks/ios/vision/pose_landmarker/utils/sources/MPPPoseLandmarkerOptions+Helpers.h"
|
||||||
|
#import "mediapipe/tasks/ios/vision/pose_landmarker/utils/sources/MPPPoseLandmarkerResult+Helpers.h"
|
||||||
|
|
||||||
|
namespace {
|
||||||
|
using ::mediapipe::Timestamp;
|
||||||
|
using ::mediapipe::tasks::core::PacketMap;
|
||||||
|
using ::mediapipe::tasks::core::PacketsCallback;
|
||||||
|
} // namespace
|
||||||
|
|
||||||
|
static NSString *const kImageTag = @"IMAGE";
|
||||||
|
static NSString *const kImageInStreamName = @"image_in";
|
||||||
|
static NSString *const kNormRectTag = @"NORM_RECT";
|
||||||
|
static NSString *const kNormRectInStreamName = @"norm_rect_in";
|
||||||
|
static NSString *const kImageOutStreamName = @"image_out";
|
||||||
|
static NSString *const kPoseLandmarksTag = @"NORM_LANDMARKS";
|
||||||
|
static NSString *const kPoseLandmarksOutStreamName = @"pose_landmarks";
|
||||||
|
static NSString *const kWorldLandmarksTag = @"WORLD_LANDMARKS";
|
||||||
|
static NSString *const kWorldLandmarksOutStreamName = @"world_landmarks";
|
||||||
|
static NSString *const kSegmentationMasksTag = @"SEGMENTATION_MASK";
|
||||||
|
static NSString *const kSegmentationMasksOutStreamName = @"segmentation_masks";
|
||||||
|
static NSString *const kTaskGraphName =
|
||||||
|
@"mediapipe.tasks.vision.pose_landmarker.PoseLandmarkerGraph";
|
||||||
|
static NSString *const kTaskName = @"poseLandmarker";
|
||||||
|
|
||||||
|
#define InputPacketMap(imagePacket, normalizedRectPacket) \
|
||||||
|
{ \
|
||||||
|
{kImageInStreamName.cppString, imagePacket}, { \
|
||||||
|
kNormRectInStreamName.cppString, normalizedRectPacket \
|
||||||
|
} \
|
||||||
|
}
|
||||||
|
|
||||||
|
#define PoseLandmarkerResultWithOutputPacketMap(outputPacketMap) \
|
||||||
|
([MPPPoseLandmarkerResult \
|
||||||
|
poseLandmarkerResultWithLandmarksPacket:outputPacketMap[kPoseLandmarksOutStreamName \
|
||||||
|
.cppString] \
|
||||||
|
worldLandmarksPacket:outputPacketMap[kWorldLandmarksOutStreamName \
|
||||||
|
.cppString] \
|
||||||
|
segmentationMasksPacket:&(outputPacketMap[kSegmentationMasksOutStreamName \
|
||||||
|
.cppString])])
|
||||||
|
|
||||||
|
@interface MPPPoseLandmarker () {
|
||||||
|
/** iOS Vision Task Runner */
|
||||||
|
MPPVisionTaskRunner *_visionTaskRunner;
|
||||||
|
dispatch_queue_t _callbackQueue;
|
||||||
|
}
|
||||||
|
@property(nonatomic, weak) id<MPPPoseLandmarkerLiveStreamDelegate> poseLandmarkerLiveStreamDelegate;
|
||||||
|
@end
|
||||||
|
|
||||||
|
@implementation MPPPoseLandmarker
|
||||||
|
|
||||||
|
#pragma mark - Public
|
||||||
|
|
||||||
|
- (instancetype)initWithOptions:(MPPPoseLandmarkerOptions *)options error:(NSError **)error {
|
||||||
|
self = [super init];
|
||||||
|
if (self) {
|
||||||
|
MPPTaskInfo *taskInfo = [[MPPTaskInfo alloc]
|
||||||
|
initWithTaskGraphName:kTaskGraphName
|
||||||
|
inputStreams:@[
|
||||||
|
[NSString stringWithFormat:@"%@:%@", kImageTag, kImageInStreamName],
|
||||||
|
[NSString stringWithFormat:@"%@:%@", kNormRectTag, kNormRectInStreamName]
|
||||||
|
]
|
||||||
|
outputStreams:@[
|
||||||
|
[NSString
|
||||||
|
stringWithFormat:@"%@:%@", kPoseLandmarksTag, kPoseLandmarksOutStreamName],
|
||||||
|
[NSString
|
||||||
|
stringWithFormat:@"%@:%@", kWorldLandmarksTag, kWorldLandmarksOutStreamName],
|
||||||
|
[NSString stringWithFormat:@"%@:%@", kSegmentationMasksTag,
|
||||||
|
kSegmentationMasksOutStreamName],
|
||||||
|
[NSString stringWithFormat:@"%@:%@", kImageTag, kImageOutStreamName]
|
||||||
|
]
|
||||||
|
taskOptions:options
|
||||||
|
enableFlowLimiting:options.runningMode == MPPRunningModeLiveStream
|
||||||
|
error:error];
|
||||||
|
|
||||||
|
if (!taskInfo) {
|
||||||
|
return nil;
|
||||||
|
}
|
||||||
|
|
||||||
|
PacketsCallback packetsCallback = nullptr;
|
||||||
|
|
||||||
|
if (options.poseLandmarkerLiveStreamDelegate) {
|
||||||
|
_poseLandmarkerLiveStreamDelegate = options.poseLandmarkerLiveStreamDelegate;
|
||||||
|
|
||||||
|
// Create a private serial dispatch queue in which the deleagte method will be called
|
||||||
|
// asynchronously. This is to ensure that if the client performs a long running operation in
|
||||||
|
// the delegate method, the queue on which the C++ callbacks is invoked is not blocked and is
|
||||||
|
// freed up to continue with its operations.
|
||||||
|
_callbackQueue = dispatch_queue_create(
|
||||||
|
[MPPVisionTaskRunner uniqueDispatchQueueNameWithSuffix:kTaskName], nullptr);
|
||||||
|
|
||||||
|
// Capturing `self` as weak in order to avoid `self` being kept in memory
|
||||||
|
// and cause a retain cycle, after self is set to `nil`.
|
||||||
|
MPPPoseLandmarker *__weak weakSelf = self;
|
||||||
|
packetsCallback = [=](absl::StatusOr<PacketMap> liveStreamResult) {
|
||||||
|
[weakSelf processLiveStreamResult:liveStreamResult];
|
||||||
|
};
|
||||||
|
}
|
||||||
|
|
||||||
|
_visionTaskRunner = [[MPPVisionTaskRunner alloc] initWithTaskInfo:taskInfo
|
||||||
|
runningMode:options.runningMode
|
||||||
|
roiAllowed:NO
|
||||||
|
packetsCallback:std::move(packetsCallback)
|
||||||
|
imageInputStreamName:kImageInStreamName
|
||||||
|
normRectInputStreamName:kNormRectInStreamName
|
||||||
|
error:error];
|
||||||
|
|
||||||
|
if (!_visionTaskRunner) {
|
||||||
|
return nil;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return self;
|
||||||
|
}
|
||||||
|
|
||||||
|
- (instancetype)initWithModelPath:(NSString *)modelPath error:(NSError **)error {
|
||||||
|
MPPPoseLandmarkerOptions *options = [[MPPPoseLandmarkerOptions alloc] init];
|
||||||
|
|
||||||
|
options.baseOptions.modelAssetPath = modelPath;
|
||||||
|
|
||||||
|
return [self initWithOptions:options error:error];
|
||||||
|
}
|
||||||
|
|
||||||
|
- (nullable MPPPoseLandmarkerResult *)detectImage:(MPPImage *)image error:(NSError **)error {
|
||||||
|
std::optional<PacketMap> outputPacketMap = [_visionTaskRunner processImage:image error:error];
|
||||||
|
|
||||||
|
return [MPPPoseLandmarker poseLandmarkerResultWithOptionalOutputPacketMap:outputPacketMap];
|
||||||
|
}
|
||||||
|
|
||||||
|
- (nullable MPPPoseLandmarkerResult *)detectVideoFrame:(MPPImage *)image
|
||||||
|
timestampInMilliseconds:(NSInteger)timestampInMilliseconds
|
||||||
|
error:(NSError **)error {
|
||||||
|
std::optional<PacketMap> outputPacketMap =
|
||||||
|
[_visionTaskRunner processVideoFrame:image
|
||||||
|
timestampInMilliseconds:timestampInMilliseconds
|
||||||
|
error:error];
|
||||||
|
|
||||||
|
return [MPPPoseLandmarker poseLandmarkerResultWithOptionalOutputPacketMap:outputPacketMap];
|
||||||
|
}
|
||||||
|
|
||||||
|
- (BOOL)detectAsyncImage:(MPPImage *)image
|
||||||
|
timestampInMilliseconds:(NSInteger)timestampInMilliseconds
|
||||||
|
error:(NSError **)error {
|
||||||
|
return [_visionTaskRunner processLiveStreamImage:image
|
||||||
|
timestampInMilliseconds:timestampInMilliseconds
|
||||||
|
error:error];
|
||||||
|
}
|
||||||
|
|
||||||
|
+ (NSArray<MPPConnection *> *)poseLandmarks {
|
||||||
|
return MPPPoseLandmarksConnections;
|
||||||
|
}
|
||||||
|
|
||||||
|
#pragma mark - Private
|
||||||
|
|
||||||
|
- (void)processLiveStreamResult:(absl::StatusOr<PacketMap>)liveStreamResult {
|
||||||
|
if (![self.poseLandmarkerLiveStreamDelegate
|
||||||
|
respondsToSelector:@selector(poseLandmarker:
|
||||||
|
didFinishDetectionWithResult:timestampInMilliseconds:error:)]) {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
NSError *callbackError = nil;
|
||||||
|
if (![MPPCommonUtils checkCppError:liveStreamResult.status() toError:&callbackError]) {
|
||||||
|
dispatch_async(_callbackQueue, ^{
|
||||||
|
[self.poseLandmarkerLiveStreamDelegate poseLandmarker:self
|
||||||
|
didFinishDetectionWithResult:nil
|
||||||
|
timestampInMilliseconds:Timestamp::Unset().Value()
|
||||||
|
error:callbackError];
|
||||||
|
});
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
PacketMap &outputPacketMap = liveStreamResult.value();
|
||||||
|
if (outputPacketMap[kImageOutStreamName.cppString].IsEmpty()) {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
MPPPoseLandmarkerResult *result = PoseLandmarkerResultWithOutputPacketMap(outputPacketMap);
|
||||||
|
|
||||||
|
NSInteger timestampInMilliseconds =
|
||||||
|
outputPacketMap[kImageOutStreamName.cppString].Timestamp().Value() /
|
||||||
|
kMicrosecondsPerMillisecond;
|
||||||
|
dispatch_async(_callbackQueue, ^{
|
||||||
|
[self.poseLandmarkerLiveStreamDelegate poseLandmarker:self
|
||||||
|
didFinishDetectionWithResult:result
|
||||||
|
timestampInMilliseconds:timestampInMilliseconds
|
||||||
|
error:callbackError];
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
+ (nullable MPPPoseLandmarkerResult *)poseLandmarkerResultWithOptionalOutputPacketMap:
|
||||||
|
(std::optional<PacketMap> &)outputPacketMap {
|
||||||
|
if (!outputPacketMap.has_value()) {
|
||||||
|
return nil;
|
||||||
|
}
|
||||||
|
|
||||||
|
return PoseLandmarkerResultWithOutputPacketMap(outputPacketMap.value());
|
||||||
|
}
|
||||||
|
|
||||||
|
@end
|
|
@ -20,6 +20,8 @@
|
||||||
|
|
||||||
NS_ASSUME_NONNULL_BEGIN
|
NS_ASSUME_NONNULL_BEGIN
|
||||||
|
|
||||||
|
static const int kMicrosecondsPerMillisecond = 1000;
|
||||||
|
|
||||||
@interface MPPPoseLandmarkerResult (Helpers)
|
@interface MPPPoseLandmarkerResult (Helpers)
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
@ -55,8 +57,9 @@ NS_ASSUME_NONNULL_BEGIN
|
||||||
(const std::vector<::mediapipe::NormalizedLandmarkList> &)landmarksProto
|
(const std::vector<::mediapipe::NormalizedLandmarkList> &)landmarksProto
|
||||||
worldLandmarksProto:
|
worldLandmarksProto:
|
||||||
(const std::vector<::mediapipe::LandmarkList> &)worldLandmarksProto
|
(const std::vector<::mediapipe::LandmarkList> &)worldLandmarksProto
|
||||||
segmentationMasks:(const std::vector<mediapipe::Image> *)segmentationMasks
|
segmentationMasks:
|
||||||
timestampInMilliSeconds:(NSInteger)timestampInMilliseconds;
|
(nullable const std::vector<mediapipe::Image> *)segmentationMasks
|
||||||
|
timestampInMilliseconds:(NSInteger)timestampInMilliseconds;
|
||||||
|
|
||||||
@end
|
@end
|
||||||
|
|
||||||
|
|
|
@ -21,8 +21,6 @@ using LandmarkListProto = ::mediapipe::LandmarkList;
|
||||||
using NormalizedLandmarkListProto = ::mediapipe::NormalizedLandmarkList;
|
using NormalizedLandmarkListProto = ::mediapipe::NormalizedLandmarkList;
|
||||||
using ::mediapipe::Image;
|
using ::mediapipe::Image;
|
||||||
using ::mediapipe::Packet;
|
using ::mediapipe::Packet;
|
||||||
|
|
||||||
static const int kMicroSecondsPerMilliSecond = 1000;
|
|
||||||
} // namespace
|
} // namespace
|
||||||
|
|
||||||
@implementation MPPPoseLandmarkerResult (Helpers)
|
@implementation MPPPoseLandmarkerResult (Helpers)
|
||||||
|
@ -40,8 +38,8 @@ static const int kMicroSecondsPerMilliSecond = 1000;
|
||||||
(const std::vector<NormalizedLandmarkListProto> &)landmarksProto
|
(const std::vector<NormalizedLandmarkListProto> &)landmarksProto
|
||||||
worldLandmarksProto:
|
worldLandmarksProto:
|
||||||
(const std::vector<LandmarkListProto> &)worldLandmarksProto
|
(const std::vector<LandmarkListProto> &)worldLandmarksProto
|
||||||
segmentationMasks:(const std::vector<Image> *)segmentationMasks
|
segmentationMasks:(nullable const std::vector<Image> *)segmentationMasks
|
||||||
timestampInMilliSeconds:(NSInteger)timestampInMilliseconds {
|
timestampInMilliseconds:(NSInteger)timestampInMilliseconds {
|
||||||
NSMutableArray<NSMutableArray<MPPNormalizedLandmark *> *> *multiplePoseLandmarks =
|
NSMutableArray<NSMutableArray<MPPNormalizedLandmark *> *> *multiplePoseLandmarks =
|
||||||
[NSMutableArray arrayWithCapacity:(NSUInteger)landmarksProto.size()];
|
[NSMutableArray arrayWithCapacity:(NSUInteger)landmarksProto.size()];
|
||||||
|
|
||||||
|
@ -69,6 +67,12 @@ static const int kMicroSecondsPerMilliSecond = 1000;
|
||||||
[multiplePoseWorldLandmarks addObject:worldLandmarks];
|
[multiplePoseWorldLandmarks addObject:worldLandmarks];
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (!segmentationMasks) {
|
||||||
|
return [[MPPPoseLandmarkerResult alloc] initWithLandmarks:multiplePoseLandmarks
|
||||||
|
worldLandmarks:multiplePoseWorldLandmarks
|
||||||
|
segmentationMasks:nil
|
||||||
|
timestampInMilliseconds:timestampInMilliseconds];
|
||||||
|
}
|
||||||
NSMutableArray<MPPMask *> *confidenceMasks =
|
NSMutableArray<MPPMask *> *confidenceMasks =
|
||||||
[NSMutableArray arrayWithCapacity:(NSUInteger)segmentationMasks->size()];
|
[NSMutableArray arrayWithCapacity:(NSUInteger)segmentationMasks->size()];
|
||||||
|
|
||||||
|
@ -83,12 +87,11 @@ static const int kMicroSecondsPerMilliSecond = 1000;
|
||||||
shouldCopy:YES]];
|
shouldCopy:YES]];
|
||||||
}
|
}
|
||||||
|
|
||||||
MPPPoseLandmarkerResult *poseLandmarkerResult =
|
return [[MPPPoseLandmarkerResult alloc] initWithLandmarks:multiplePoseLandmarks
|
||||||
[[MPPPoseLandmarkerResult alloc] initWithLandmarks:multiplePoseLandmarks
|
|
||||||
worldLandmarks:multiplePoseWorldLandmarks
|
worldLandmarks:multiplePoseWorldLandmarks
|
||||||
segmentationMasks:confidenceMasks
|
segmentationMasks:confidenceMasks
|
||||||
timestampInMilliseconds:timestampInMilliseconds];
|
timestampInMilliseconds:timestampInMilliseconds];
|
||||||
return poseLandmarkerResult;
|
;
|
||||||
}
|
}
|
||||||
|
|
||||||
+ (MPPPoseLandmarkerResult *)
|
+ (MPPPoseLandmarkerResult *)
|
||||||
|
@ -96,7 +99,7 @@ static const int kMicroSecondsPerMilliSecond = 1000;
|
||||||
worldLandmarksPacket:(const Packet &)worldLandmarksPacket
|
worldLandmarksPacket:(const Packet &)worldLandmarksPacket
|
||||||
segmentationMasksPacket:(const Packet *)segmentationMasksPacket {
|
segmentationMasksPacket:(const Packet *)segmentationMasksPacket {
|
||||||
NSInteger timestampInMilliseconds =
|
NSInteger timestampInMilliseconds =
|
||||||
(NSInteger)(landmarksPacket.Timestamp().Value() / kMicroSecondsPerMilliSecond);
|
(NSInteger)(landmarksPacket.Timestamp().Value() / kMicrosecondsPerMillisecond);
|
||||||
|
|
||||||
if (landmarksPacket.IsEmpty()) {
|
if (landmarksPacket.IsEmpty()) {
|
||||||
return [MPPPoseLandmarkerResult
|
return [MPPPoseLandmarkerResult
|
||||||
|
@ -118,7 +121,7 @@ static const int kMicroSecondsPerMilliSecond = 1000;
|
||||||
worldLandmarksProto:worldLandmarksPacket
|
worldLandmarksProto:worldLandmarksPacket
|
||||||
.Get<std::vector<LandmarkListProto>>()
|
.Get<std::vector<LandmarkListProto>>()
|
||||||
segmentationMasks:segmentationMasks
|
segmentationMasks:segmentationMasks
|
||||||
timestampInMilliSeconds:timestampInMilliseconds];
|
timestampInMilliseconds:timestampInMilliseconds];
|
||||||
}
|
}
|
||||||
|
|
||||||
@end
|
@end
|
||||||
|
|
Loading…
Reference in New Issue
Block a user