Internal change

PiperOrigin-RevId: 535751178
2023-05-26 17:24:03 -07:00 · 2023-05-26 17:24:03 -07:00 · d4c7ed2217
commit d4c7ed2217
parent fddc3facf0
6 changed files with 338 additions and 32 deletions
--- a/mediapipe/tasks/cc/vision/image_segmenter/calculators/BUILD
+++ b/mediapipe/tasks/cc/vision/image_segmenter/calculators/BUILD
@ -50,7 +50,12 @@ cc_library(
        "@com_google_absl//absl/status",
        "@com_google_absl//absl/strings:str_format",
        "@com_google_absl//absl/types:span",
+    ] + select({
+        "//conditions:default": [],
+        "//mediapipe:android": [
+            ":segmentation_postprocessor_gl",
        ],
+    }),
    alwayslink = 1,
 )

@ -72,6 +77,29 @@ cc_library(
        "//mediapipe/tasks/cc/vision/utils:image_utils",
        "@com_google_absl//absl/status",
        "@com_google_absl//absl/strings:str_format",
+    ] + select({
+        "//conditions:default": [],
+        "//mediapipe:android": [
+            "ssbo_to_texture_converter",
+        ],
+    }),
+)
+
+cc_library(
+    name = "ssbo_to_texture_converter",
+    srcs = ["ssbo_to_texture_converter.cc"],
+    hdrs = ["ssbo_to_texture_converter.h"],
+    tags = [
+        "nomac",
+        "notap",
+    ],
+    deps = [
+        "//mediapipe/framework/formats:tensor",
+        "//mediapipe/gpu:gl_base",
+        "@org_tensorflow//tensorflow/lite/delegates/gpu/gl:gl_program",
+        "@org_tensorflow//tensorflow/lite/delegates/gpu/gl:gl_shader",
+        "@org_tensorflow//tensorflow/lite/delegates/gpu/gl:gl_texture",
+        "@org_tensorflow//tensorflow/lite/delegates/gpu/gl/converters:util",
    ],
 )

--- a/mediapipe/tasks/cc/vision/image_segmenter/calculators/segmentation_postprocessor_gl.cc
+++ b/mediapipe/tasks/cc/vision/image_segmenter/calculators/segmentation_postprocessor_gl.cc
@ -16,6 +16,14 @@ namespace mediapipe {
 namespace tasks {
 namespace {

+// On most platforms, glGetUniformLocation returns -1 for an error status, but
+// on web we'll see 0 instead.
+#ifdef __EMSCRIPTEN__
+const GLint kUniformErrorStatus = 0;
+#else
+const GLint kUniformErrorStatus = -1;
+#endif  // __EMSCRIPTEN__
+
 using mediapipe::kBasicSquareVertices;
 using mediapipe::kBasicTextureVertices;
 using mediapipe::kBasicVertexShader;
@ -341,7 +349,7 @@ absl::Status SegmentationPostprocessorGl::CreateBasicFragmentShaderProgram(
  for (const auto& uniform_name : uniform_names) {
    shader_struct_ptr->uniforms[uniform_name] =
        glGetUniformLocation(shader_struct_ptr->program, uniform_name.c_str());
-    RET_CHECK(shader_struct_ptr->uniforms[uniform_name] > 0)
+    RET_CHECK(shader_struct_ptr->uniforms[uniform_name] > kUniformErrorStatus)
        << uniform_name << " uniform not found for " << program_name
        << " program";
  }
@ -427,10 +435,10 @@ absl::Status SegmentationPostprocessorGl::GlInit(
    // Get split program uniform locations.
    split_texture_uniform_ =
        glGetUniformLocation(split_program_, "input_texture");
-    RET_CHECK(split_texture_uniform_ > 0)
+    RET_CHECK(split_texture_uniform_ > kUniformErrorStatus)
        << "split input_texture uniform not found.";
    split_x_offset_uniform_ = glGetUniformLocation(split_program_, "x_offset");
-    RET_CHECK(split_x_offset_uniform_ > 0)
+    RET_CHECK(split_x_offset_uniform_ > kUniformErrorStatus)
        << "split x_offset uniform not found.";

    // TODO: If ES3.0+ only, switch to VAO for handling attributes.
@ -445,10 +453,24 @@ absl::Status SegmentationPostprocessorGl::GlInit(
                 kBasicTextureVertices, GL_STATIC_DRAW);

    glBindBuffer(GL_ARRAY_BUFFER, 0);
+
+#ifdef TASK_SEGMENTATION_USE_GLES_31_POSTPROCESSING
+    MP_RETURN_IF_ERROR(ssbo_to_texture_converter_.Init());
+#endif  // TASK_SEGMENTATION_USE_GLES_31_POSTPROCESSING
+
    return absl::OkStatus();
  });
 }

+// On Android, the extensions are prefixed by GL_, whereas on web they are not.
+bool SegmentationPostprocessorGl::HasGlExtension(std::string const& extension) {
+#ifdef __EMSCRIPTEN__
+  return helper_.GetGlContext().HasGlExtension(extension);
+#else
+  return helper_.GetGlContext().HasGlExtension("GL_" + extension);
+#endif  // __EMSCRIPTEN__
+}
+
 std::vector<std::unique_ptr<Image>>
 SegmentationPostprocessorGl::GetSegmentationResultGpu(
    const Shape& input_shape, const Shape& output_shape, const Tensor& tensor,
@ -459,18 +481,35 @@ SegmentationPostprocessorGl::GetSegmentationResultGpu(
                                        produce_category_mask,
                                        &image_outputs]() -> absl::Status {
    // Get Tensor input and image output parameters
+    const int width = input_shape.width;           // Slice width from shape
+    const int height = input_shape.height;         // Slice height from chape
+    const int num_outputs = input_shape.channels;  // One output per channel
+    const int num_chunks = (input_shape.channels + 3) / 4;  // ceil(channels/4)
+    const int output_width = output_shape.width;    // Final output width
+    const int output_height = output_shape.height;  // Final output height
    int input_width, input_height;

-    if (!tensor.ready_as_opengl_texture_2d()) {
+    if (!tensor.ready_on_gpu()) {
      LOG(WARNING) << "Tensor wasn't ready on GPU; using slow workaround.";
      (void)tensor.GetCpuReadView();
    }

+#ifdef TASK_SEGMENTATION_USE_GLES_31_POSTPROCESSING
+    // If our Tensor is an SSBO, then it's also linearized, so we convert to a
+    // kAligned 2d texture using a special converter and then proceed as before.
+    GLuint ssbo_tex_id;
+    ASSIGN_OR_RETURN(ssbo_tex_id,
+                     ssbo_to_texture_converter_.ConvertTensorToGlTexture(
+                         tensor, width, height, num_outputs));
+    std::tie(input_width, input_height) =
+        ssbo_to_texture_converter_.GetTextureSize();
+#else
    const auto layout = tensor.GetOpenGlTexture2dReadView().GetLayoutDimensions(
        tensor.shape(), &input_width, &input_height);
    if (layout != Tensor::OpenGlTexture2dView::Layout::kAligned) {
      LOG(ERROR) << "Tensor layout not kAligned! Cannot handle.";
    }
+#endif  // TASK_SEGMENTATION_USE_GLES_31_POSTPROCESSING

    // Optimization: Only apply SOFTMAX when producing confidence masks, since
    // SOFTMAX errors out when num_classes = 1, so we don't have to worry about
@ -486,14 +525,12 @@ SegmentationPostprocessorGl::GetSegmentationResultGpu(
    // (3) blending
    // Otherwise, we just try for F16. See b/277656755 for more information.
    // TODO: In the future, separate these 3 different restrictions.
-    // TODO: Also, we should extend this logic to non-web platforms.
-    static bool can_use_f32 =
-        helper_.GetGlContext().HasGlExtension("EXT_color_buffer_float") &&
-        helper_.GetGlContext().HasGlExtension("OES_texture_float_linear") &&
-        helper_.GetGlContext().HasGlExtension("EXT_float_blend");
+    // TODO: Also, we should extend this logic to all platforms.
+    static bool can_use_f32 = HasGlExtension("EXT_color_buffer_float") &&
+                              HasGlExtension("OES_texture_float_linear") &&
+                              HasGlExtension("EXT_float_blend");
    static bool can_use_f16_backup =
-        helper_.GetGlContext().HasGlExtension("EXT_color_buffer_half_float");
-
+        HasGlExtension("EXT_color_buffer_half_float");
    RET_CHECK(can_use_f32 || can_use_f16_backup)
        << "Segmentation postprocessing error: GPU does not fully support "
        << "4-channel float32 or float16 formats.";
@ -510,15 +547,6 @@ SegmentationPostprocessorGl::GetSegmentationResultGpu(
    const GpuBufferFormat final_output_format =
        can_use_f32 ? GpuBufferFormat::kGrayFloat32
                    : GpuBufferFormat::kGrayHalf16;
-    const Tensor::OpenGlTexture2dView read_view =
-        tensor.GetOpenGlTexture2dReadView();
-
-    const int width = input_shape.width;           // Slice width from shape
-    const int height = input_shape.height;         // Slice height from chape
-    const int num_outputs = input_shape.channels;  // One output per channel
-    const int num_chunks = (input_shape.channels + 3) / 4;  // ceil(channels/4)
-    const int output_width = output_shape.width;    // Final output width
-    const int output_height = output_shape.height;  // Final output height

    // We disable blending or else our alpha channel may destroy our other
    // channels' data.
@ -540,9 +568,16 @@ SegmentationPostprocessorGl::GetSegmentationResultGpu(
        input_width, input_height, activation_output_format);
    helper_.BindFramebuffer(activated_texture);

-    // All our input source textures are just simple GL_TEXTURE_2D types.
+    // All our input source textures will be just simple GL_TEXTURE_2D types.
    glActiveTexture(GL_TEXTURE1);
+
+#ifdef TASK_SEGMENTATION_USE_GLES_31_POSTPROCESSING
+    glBindTexture(GL_TEXTURE_2D, ssbo_tex_id);
+#else
+    const Tensor::OpenGlTexture2dView read_view =
+        tensor.GetOpenGlTexture2dReadView();
    glBindTexture(GL_TEXTURE_2D, read_view.name());
+#endif  // TASK_SEGMENTATION_USE_GLES_31_POSTPROCESSING

    // Render
    glClear(GL_COLOR_BUFFER_BIT);
@ -841,6 +876,10 @@ SegmentationPostprocessorGl::~SegmentationPostprocessorGl() {
    glDeleteProgram(softmax_max_shader_.program);
    glDeleteProgram(softmax_transform_and_sum_shader_.program);
    glDeleteProgram(softmax_normalization_shader_.program);
+
+#ifdef TASK_SEGMENTATION_USE_GLES_31_POSTPROCESSING
+    ssbo_to_texture_converter_.Close();
+#endif  // TASK_SEGMENTATION_USE_GLES_31_POSTPROCESSING
  });
 }

--- a/mediapipe/tasks/cc/vision/image_segmenter/calculators/segmentation_postprocessor_gl.h
+++ b/mediapipe/tasks/cc/vision/image_segmenter/calculators/segmentation_postprocessor_gl.h
@ -21,6 +21,14 @@
 #include "mediapipe/tasks/cc/vision/image_segmenter/calculators/tensors_to_segmentation_calculator.pb.h"
 #include "mediapipe/tasks/cc/vision/utils/image_utils.h"

+// On Android with compute shaders we include the SSBO-to-texture converter
+#if MEDIAPIPE_OPENGL_ES_VERSION >= MEDIAPIPE_OPENGL_ES_31 && \
+    defined(__ANDROID__)
+#define TASK_SEGMENTATION_USE_GLES_31_POSTPROCESSING 1
+#include "mediapipe/tasks/cc/vision/image_segmenter/calculators/ssbo_to_texture_converter.h"
+#endif  // MEDIAPIPE_OPENGL_ES_VERSION >= MEDIAPIPE_OPENGL_ES_31 &&
+        // defined(__ANDROID__)
+
 namespace mediapipe {
 namespace tasks {

@ -45,6 +53,7 @@ class SegmentationPostprocessorGl {
  };

  absl::Status GlInit(const bool produce_confidence_masks);
+  bool HasGlExtension(std::string const& extension);
  absl::Status CreateBasicFragmentShaderProgram(
      std::string const& program_name,
      std::string const& fragment_shader_source,
@ -69,6 +78,10 @@ class SegmentationPostprocessorGl {
  GlShader softmax_max_shader_;
  GlShader softmax_transform_and_sum_shader_;
  GlShader softmax_normalization_shader_;
+
+#ifdef TASK_SEGMENTATION_USE_GLES_31_POSTPROCESSING
+  SsboToTextureConverter ssbo_to_texture_converter_;
+#endif
 };

 }  // namespace tasks
--- a/mediapipe/tasks/cc/vision/image_segmenter/calculators/ssbo_to_texture_converter.cc
+++ b/mediapipe/tasks/cc/vision/image_segmenter/calculators/ssbo_to_texture_converter.cc
@ -0,0 +1,162 @@
+#include "mediapipe/tasks/cc/vision/image_segmenter/calculators/ssbo_to_texture_converter.h"
+
+#include "tensorflow/lite/delegates/gpu/gl/converters/util.h"
+#include "tensorflow/lite/delegates/gpu/gl/gl_shader.h"
+
+// Quick compile-time warning to ensure usage on the proper platform.
+#if !(MEDIAPIPE_OPENGL_ES_VERSION >= MEDIAPIPE_OPENGL_ES_31)
+#warning "SsboToTextureConverter should be used with OpenGL ES 3.1 or above"
+#endif
+
+namespace mediapipe {
+namespace tasks {
+namespace {
+
+using ::tflite::gpu::gl::GlProgram;
+using ::tflite::gpu::gl::GlShader;
+
+constexpr int kWorkgroupSize = 8;  // Block size for GPU shader.
+const tflite::gpu::uint3 workgroup_size = {kWorkgroupSize, kWorkgroupSize, 1};
+
+// "Delinearization" shader:
+// Example data using n=5 channels: 0,1,2,3,4,5,6,7,8,9,10,11,12,13,14 -->
+// 0,1,2,3 | 4,X,X,X | 5,6,7,8 | 9,X,X,X | 10,11,12,13 | 14,X,X,X
+const char delinearization_shader_source[] = R"(
+precision highp float;
+layout(rgba32f, binding = 0) writeonly uniform highp image2D output_texture;
+
+uniform ivec2 out_size;
+uniform int num_channels;
+uniform int num_channels_padded;  // ^ rounded up to nearest multiple of 4
+
+layout(std430, binding = 2) readonly buffer B0 {
+  float elements[];
+} input_data;   // data tensor
+
+void main() {
+  int out_width = out_size.x;
+  int out_height = out_size.y;
+
+  ivec2 gid = ivec2(gl_GlobalInvocationID.xy);
+  if (gid.x >= out_width || gid.y >= out_height) { return; }
+  int linear_index_pixels = gid.y * out_width + gid.x;
+  int linear_index = linear_index_pixels * 4;
+
+  int num_completed_chunks = linear_index / num_channels_padded;
+  int offset = linear_index % num_channels_padded;
+  int data_index = num_completed_chunks * num_channels + offset;
+
+  // Early exit if fully outside buffer
+  int data_size = input_data.elements.length();
+  if (data_index >= data_size) return;
+
+  // We add some extra logic here just to ensure we don't overrun buffer and get
+  // undefined behavior.  TODO: Come up with nicer way around this if
+  // we end up needing this sort of patch more frequently.
+  float x = input_data.elements[data_index];
+  float y = 0.0;
+  float z = 0.0;
+  float w = 0.0;
+  if (data_index + 3 < data_size) {
+    w = input_data.elements[data_index + 3];
+    z = input_data.elements[data_index + 2];
+    y = input_data.elements[data_index + 1];
+  } else if (data_index + 2 < data_size) {
+    z = input_data.elements[data_index + 2];
+    y = input_data.elements[data_index + 1];
+  } else if (data_index + 1 < data_size) {
+    y = input_data.elements[data_index + 1];
+  }
+
+  ivec2 output_coordinate = ivec2(gid.x, gid.y);
+  vec4 out_value = vec4(x, y, z, w);
+  imageStore(output_texture, output_coordinate, out_value);
+})";
+
+// Commonly used to compute the number of blocks to launch in a kernel.
+int NumGroups(const int size, const int group_size) {  // NOLINT
+  return (size + group_size - 1) / group_size;
+}
+
+}  // namespace
+
+absl::Status SsboToTextureConverter::Init() {
+  GlShader delinearization_shader;
+  std::string delinearization_shader_source_with_headers =
+      absl::StrCat(tflite::gpu::gl::GetShaderHeader(workgroup_size),
+                   delinearization_shader_source);
+  MP_RETURN_IF_ERROR(GlShader::CompileShader(
+      GL_COMPUTE_SHADER, delinearization_shader_source_with_headers,
+      &delinearization_shader));
+  delinearization_program_ = absl::make_unique<GlProgram>();
+  MP_RETURN_IF_ERROR(GlProgram::CreateWithShader(
+      delinearization_shader, delinearization_program_.get()));
+  return absl::OkStatus();
+}
+
+void SsboToTextureConverter::Close() { delinearization_program_.reset(); }
+
+std::pair<const uint32_t, const uint32_t>
+SsboToTextureConverter::GetTextureSize() {
+  return std::make_pair(texture_width_, texture_height_);
+}
+
+absl::StatusOr<GLuint> SsboToTextureConverter::ConvertTensorToGlTexture(
+    const Tensor& tensor, const uint32_t width, const uint32_t height,
+    const uint32_t channels) {
+  // The tflite::gpu:: namespace looks like it's much simpler and older-- it
+  // doesn't tap into any memory pools, and doesn't allow linearF32 filtering
+  // where available, for example. The key difference is that it uses
+  // glTexStorage2D for allocation instead of glTexImage2D, which is necessary
+  // in order to create an immutable format (as required by glBindImageTexture).
+  // MP will automatically use this for RGBA16F but not RGBA32F textures
+  // currently, oddly enough.  So options are:
+  // (1) extend MP to similarly handle RGBA32F
+  // (2) just make our own texture here and keep reusing, recreating if the size
+  //     changes, which should generally not happen. (This is ok because we use
+  //     the texture immediately and never output it from the calculator).
+  // (3) Change glBindImageTexture call to alternative so we can just use
+  //     existing MP glTexImage2D storage creation?  This seems less than
+  //     ideal since it's rather nice to keep the above program in compute
+  //     shader format.
+  // TODO: To be safe for this initial implementation, we go with
+  // option #2, as it's simplest/easiest, but this should be cleaned up later.
+  const uint32_t num_pixels_per_element = ((channels + 3) / 4);
+  const uint32_t padded_channels = 4 * num_pixels_per_element;
+  const uint32_t texture_width = width * num_pixels_per_element;
+  const uint32_t texture_height = height;
+  if (texture_width != texture_width_ || texture_height != texture_height_) {
+    // tflite::gpu::gl::GlTexture autoreleases, so we don't have to worry about
+    // freeing memory.
+    MP_RETURN_IF_ERROR(CreateReadWriteRgbaImageTexture(
+        tflite::gpu::DataType::FLOAT32, {texture_width, texture_height},
+        &out_texture_));
+    texture_width_ = texture_width;
+    texture_height_ = texture_height;
+  }
+
+  glBindImageTexture(0 /* output index */, out_texture_.id(), 0, GL_FALSE, 0,
+                     GL_WRITE_ONLY, GL_RGBA32F);
+  auto read_view = tensor.GetOpenGlBufferReadView();
+  glBindBufferBase(GL_SHADER_STORAGE_BUFFER, 2 /* input index */,
+                   read_view.name());
+
+  glUseProgram(delinearization_program_->id());
+  glUniform2i(glGetUniformLocation(delinearization_program_->id(), "out_size"),
+              texture_width, texture_height);
+  glUniform1i(
+      glGetUniformLocation(delinearization_program_->id(), "num_channels"),
+      channels);
+  glUniform1i(glGetUniformLocation(delinearization_program_->id(),
+                                   "num_channels_padded"),
+              padded_channels);
+
+  const tflite::gpu::uint3 workgroups = {
+      NumGroups(texture_width, kWorkgroupSize),
+      NumGroups(texture_height, kWorkgroupSize), 1};
+  MP_RETURN_IF_ERROR(delinearization_program_->Dispatch(workgroups));
+  return out_texture_.id();
+}
+
+}  // namespace tasks
+}  // namespace mediapipe
--- a/mediapipe/tasks/cc/vision/image_segmenter/calculators/ssbo_to_texture_converter.h
+++ b/mediapipe/tasks/cc/vision/image_segmenter/calculators/ssbo_to_texture_converter.h
@ -0,0 +1,55 @@
+// Copyright 2023 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef MEDIAPIPE_TASKS_CC_VISION_IMAGE_SEGMENTER_CALCULATORS_SSBO_TO_TEXTURE_CONVERTER_H_
+#define MEDIAPIPE_TASKS_CC_VISION_IMAGE_SEGMENTER_CALCULATORS_SSBO_TO_TEXTURE_CONVERTER_H_
+
+#include <utility>
+
+#include "mediapipe/framework/formats/tensor.h"
+#include "mediapipe/gpu/gl_base.h"
+#include "tensorflow/lite/delegates/gpu/gl/gl_program.h"
+#include "tensorflow/lite/delegates/gpu/gl/gl_texture.h"
+
+namespace mediapipe {
+namespace tasks {
+
+// Helper class for converting Android and Linux Tensors from OpenGL ES >=3.1
+// SSBO objects into OpenGL ES <=3.0 2D textures. Cannot be used with other
+// Tensor backends.
+class SsboToTextureConverter {
+ public:
+  SsboToTextureConverter() = default;
+  ~SsboToTextureConverter() = default;
+  absl::Status Init();
+  void Close();
+  absl::StatusOr<GLuint> ConvertTensorToGlTexture(const Tensor& tensor,
+                                                  const uint32_t width,
+                                                  const uint32_t height,
+                                                  const uint32_t channels);
+
+  // Should only be called after ConvertTensorToGlTexture
+  std::pair<const uint32_t, const uint32_t> GetTextureSize();
+
+ private:
+  uint32_t texture_width_;
+  uint32_t texture_height_;
+  tflite::gpu::gl::GlTexture out_texture_;
+  std::unique_ptr<tflite::gpu::gl::GlProgram> delinearization_program_;
+};
+
+}  // namespace tasks
+}  // namespace mediapipe
+
+#endif  // MEDIAPIPE_TASKS_CC_VISION_IMAGE_SEGMENTER_CALCULATORS_SSBO_TO_TEXTURE_CONVERTER_H_
--- a/mediapipe/tasks/cc/vision/image_segmenter/calculators/tensors_to_segmentation_calculator.cc
+++ b/mediapipe/tasks/cc/vision/image_segmenter/calculators/tensors_to_segmentation_calculator.cc
@ -43,9 +43,18 @@ limitations under the License.
 #include "mediapipe/util/label_map.pb.h"

 #ifdef __EMSCRIPTEN__
-#include "mediapipe/tasks/cc/vision/image_segmenter/calculators/segmentation_postprocessor_gl.h"
+#define TASK_SEGMENTATION_USE_GL_POSTPROCESSING 1
+#elif MEDIAPIPE_OPENGL_ES_VERSION >= MEDIAPIPE_OPENGL_ES_31 && \
+    !MEDIAPIPE_USING_SWIFTSHADER && defined(MEDIAPIPE_ANDROID)
+#define TASK_SEGMENTATION_USE_GL_POSTPROCESSING 1
+#else
+#undef TASK_SEGMENTATION_USE_GL_POSTPROCESSING
 #endif  // __EMSCRIPTEN__

+#ifdef TASK_SEGMENTATION_USE_GL_POSTPROCESSING
+#include "mediapipe/tasks/cc/vision/image_segmenter/calculators/segmentation_postprocessor_gl.h"
+#endif  // TASK_SEGMENTATION_USE_GL_POSTPROCESSING
+
 // TODO: consolidate TensorToSegmentationCalculator.
 namespace mediapipe {
 namespace tasks {
@ -308,19 +317,19 @@ class TensorsToSegmentationCalculator : public Node {
                                              const float* tensors_buffer);
  TensorsToSegmentationCalculatorOptions options_;

-#ifdef __EMSCRIPTEN__
+#ifdef TASK_SEGMENTATION_USE_GL_POSTPROCESSING
  SegmentationPostprocessorGl postprocessor_;
-#endif  // __EMSCRIPTEN__
+#endif  // TASK_SEGMENTATION_USE_GL_POSTPROCESSING
 };

 // static
 absl::Status TensorsToSegmentationCalculator::UpdateContract(
    CalculatorContract* cc) {
-#ifdef __EMSCRIPTEN__
+#ifdef TASK_SEGMENTATION_USE_GL_POSTPROCESSING
  return SegmentationPostprocessorGl::UpdateContract(cc);
 #else
  return absl::OkStatus();
-#endif  // __EMSCRIPTEN__
+#endif  // TASK_SEGMENTATION_USE_GL_POSTPROCESSING
 }

 absl::Status TensorsToSegmentationCalculator::Open(
@ -340,9 +349,9 @@ absl::Status TensorsToSegmentationCalculator::Open(
          "connected.");
    }
  }
-#ifdef __EMSCRIPTEN__
+#ifdef TASK_SEGMENTATION_USE_GL_POSTPROCESSING
  MP_RETURN_IF_ERROR(postprocessor_.Initialize(cc, options_));
-#endif  // __EMSCRIPTEN__
+#endif  // TASK_SEGMENTATION_USE_GL_POSTPROCESSING
  return absl::OkStatus();
 }

@ -390,11 +399,11 @@ absl::Status TensorsToSegmentationCalculator::Process(
  }

  // Use GPU postprocessing on web when Tensor is there already.
-#ifdef __EMSCRIPTEN__
+#ifdef TASK_SEGMENTATION_USE_GL_POSTPROCESSING
  Shape output_shape = {/* height= */ output_height,
                        /* width= */ output_width,
                        /* channels= */ input_shape.channels};
-  if (input_tensor.ready_as_opengl_texture_2d()) {
+  if (input_tensor.ready_on_gpu()) {
    bool produce_category_mask = options_.segmenter_options().output_type() ==
                                     SegmenterOptions::CATEGORY_MASK ||
                                 cc->Outputs().HasTag("CATEGORY_MASK");
@ -428,7 +437,7 @@ absl::Status TensorsToSegmentationCalculator::Process(
    }
    return absl::OkStatus();
  }
-#endif  // __EMSCRIPTEN__
+#endif  // TASK_SEGMENTATION_USE_GL_POSTPROCESSING

  // Otherwise, use CPU postprocessing.
  const float* tensors_buffer = input_tensor.GetCpuReadView().buffer<float>();