diff --git a/.gitignore b/.gitignore
index 5bcaac023..aa1bde53e 100644
--- a/.gitignore
+++ b/.gitignore
@@ -1,8 +1,4 @@
-mediapipe/provisioning_profile.mobileprovision
-bazel-bin
-bazel-genfiles
-bazel-mediapipe-ioss
-bazel-out
-bazel-testlogs
+bazel-*
 mediapipe/MediaPipe.xcodeproj
 mediapipe/MediaPipe.tulsiproj/*.tulsiconf-user
+mediapipe/provisioning_profile.mobileprovision
diff --git a/README.md b/README.md
index 2d136d932..5992bd82e 100644
--- a/README.md
+++ b/README.md
@@ -1,84 +1,141 @@
-![MediaPipe](mediapipe/docs/images/mediapipe_small.png?raw=true "MediaPipe logo")
-=======================================================================
+---
+layout: default
+title: Home
+nav_order: 1
+---
 
-[MediaPipe](http://mediapipe.dev) is the simplest way for researchers and developers to build world-class ML solutions and applications for mobile, edge, cloud and the web.
+![MediaPipe](docs/images/mediapipe_small.png)
 
-## ML Solutions in MediaPipe
+--------------------------------------------------------------------------------
 
-* [Face Detection](mediapipe/docs/face_detection_mobile_gpu.md) [(web demo)](https://viz.mediapipe.dev/runner/demos/face_detection/face_detection.html)
-* [Face Mesh](mediapipe/docs/face_mesh_mobile_gpu.md)
-* [Hand Detection](mediapipe/docs/hand_detection_mobile_gpu.md)
-* [Hand Tracking](mediapipe/docs/hand_tracking_mobile_gpu.md) [(web demo)](https://viz.mediapipe.dev/runner/demos/hand_tracking/hand_tracking.html)
-* [Multi-hand Tracking](mediapipe/docs/multi_hand_tracking_mobile_gpu.md)
-* [Hair Segmentation](mediapipe/docs/hair_segmentation_mobile_gpu.md) [(web demo)](https://viz.mediapipe.dev/runner/demos/hair_segmentation/hair_segmentation.html)
-* [Object Detection](mediapipe/docs/object_detection_mobile_gpu.md)
-* [Object Detection and Tracking](mediapipe/docs/object_tracking_mobile_gpu.md)
-* [Objectron: 3D Object Detection and Tracking](mediapipe/docs/objectron_mobile_gpu.md)
-* [AutoFlip: Intelligent Video Reframing](mediapipe/docs/autoflip.md)
-* [KNIFT: Template Matching with Neural Image Features](mediapipe/docs/template_matching_mobile_cpu.md)
+## Cross-platform ML solutions made simple
 
-![face_detection](mediapipe/docs/images/mobile/face_detection_android_gpu_small.gif)
-![face_mesh](mediapipe/docs/images/mobile/face_mesh_android_gpu_small.gif)
-![hand_tracking](mediapipe/docs/images/mobile/hand_tracking_android_gpu_small.gif)
-![multi-hand_tracking](mediapipe/docs/images/mobile/multi_hand_tracking_3d_android_gpu_small.gif)
-![hair_segmentation](mediapipe/docs/images/mobile/hair_segmentation_android_gpu_small.gif)
-![object_detection](mediapipe/docs/images/mobile/object_detection_android_gpu_small.gif)
-![object_tracking](mediapipe/docs/images/mobile/object_tracking_android_gpu_small.gif)
-![objectron_shoes](mediapipe/docs/images/mobile/objectron_shoe_android_gpu_small.gif)
-![objectron_chair](mediapipe/docs/images/mobile/objectron_chair_android_gpu_small.gif)
-![template_matching](mediapipe/docs/images/mobile/template_matching_android_cpu_small.gif)
+[MediaPipe](https://google.github.io/mediapipe/) is the simplest way for researchers
+and developers to build world-class ML solutions and applications for mobile,
+desktop/cloud, web and IoT devices.
 
-## Installation
-Follow these [instructions](mediapipe/docs/install.md).
+![accelerated.png](docs/images/accelerated_small.png)                                                               | ![cross_platform.png](docs/images/cross_platform_small.png)
+:------------------------------------------------------------------------------------------------------------: | :----------------------------------------------------:
+***End-to-End acceleration***: *built-in fast ML inference and processing accelerated even on common hardware* | ***Build once, deploy anywhere***: *Unified solution works across Android, iOS, desktop/cloud, web and IoT*
+![ready_to_use.png](docs/images/ready_to_use_small.png)                                                             | ![open_source.png](docs/images/open_source_small.png)
+***Ready-to-use solutions***: *Cutting-edge ML solutions demonstrating full power of the framework*            | ***Free and open source***: *Framework and solutions both under Apache 2.0, fully extensible and customizable*
+
+## ML solutions in MediaPipe
+
+Face Detection                                                                                                                 | Face Mesh                                                                                                       | Hand                                                                                                      | Hair Segmentation
+:----------------------------------------------------------------------------------------------------------------------------: | :-------------------------------------------------------------------------------------------------------------: | :-------------------------------------------------------------------------------------------------------: | :---------------:
+[![face_detection](docs/images/mobile/face_detection_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/face_detection) | [![face_mesh](docs/images/mobile/face_mesh_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/face_mesh) | [![hand](docs/images/mobile/hand_tracking_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/hand) | [![hair_segmentation](docs/images/mobile/hair_segmentation_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/hair_segmentation)
+
+Object Detection                                                                                                                     | Box Tracking                                                                                                                | Objectron                                                                                                             | KNIFT
+:----------------------------------------------------------------------------------------------------------------------------------: | :-------------------------------------------------------------------------------------------------------------------------: | :-------------------------------------------------------------------------------------------------------------------: | :---:
+[![object_detection](docs/images/mobile/object_detection_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/object_detection) | [![box_tracking](docs/images/mobile/object_tracking_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/box_tracking) | [![objectron](docs/images/mobile/objectron_chair_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/objectron) | [![knift](docs/images/mobile/template_matching_android_cpu_small.gif)](https://google.github.io/mediapipe/solutions/knift)
+
+<!-- []() in the first cell is needed to preserve table formatting in GitHub Pages. -->
+<!-- Whenever this table is updated, paste a copy to solutions/solutions.md. -->
+
+[]()                                                                          | Android | iOS | Desktop | Web | Coral
+:---------------------------------------------------------------------------- | :-----: | :-: | :-----: | :-: | :---:
+[Face Detection](https://google.github.io/mediapipe/solutions/face_detection)       | ✅       | ✅   | ✅       | ✅   | ✅
+[Face Mesh](https://google.github.io/mediapipe/solutions/face_mesh)                 | ✅       | ✅   | ✅       |     |
+[Hand](https://google.github.io/mediapipe/solutions/hand)                           | ✅       | ✅   | ✅       | ✅   |
+[Hair Segmentation](https://google.github.io/mediapipe/solutions/hair_segmentation) | ✅       |     | ✅       | ✅   |
+[Object Detection](https://google.github.io/mediapipe/solutions/object_detection)   | ✅       | ✅   | ✅       |     | ✅
+[Box Tracking](https://google.github.io/mediapipe/solutions/box_tracking)           | ✅       | ✅   | ✅       |     |
+[Objectron](https://google.github.io/mediapipe/solutions/objectron)                 | ✅       |     |         |     |
+[KNIFT](https://google.github.io/mediapipe/solutions/knift)                         | ✅       |     |         |     |
+[AutoFlip](https://google.github.io/mediapipe/solutions/autoflip)                   |         |     | ✅       |     |
+[MediaSequence](https://google.github.io/mediapipe/solutions/media_sequence)        |         |     | ✅       |     |
+[YouTube 8M](https://google.github.io/mediapipe/solutions/youtube_8m)               |         |     | ✅       |     |
+
+## MediaPipe on the Web
+
+MediaPipe on the Web is an effort to run the same ML solutions built for mobile
+and desktop also in web browsers. The official API is under construction, but
+the core technology has been proven effective. Please see
+[MediaPipe on the Web](https://developers.googleblog.com/2020/01/mediapipe-on-web.html)
+in Google Developers Blog for details.
+
+You can use the following links to load a demo in the MediaPipe Visualizer, and
+then click the "Runner" icon in the top bar as shown below. The demos use your
+webcam video as input, which is processed entirely locally in real time and
+never leaves your device.
+
+![visualizer_runner](docs/images/visualizer_runner.png)
+
+*   [MediaPipe Face Detection](https://viz.mediapipe.dev/demo/face_detection)
+*   [MediaPipe Hand](https://viz.mediapipe.dev/demo/hand_tracking)
+*   [MediaPipe Hand (palm/hand detection only)](https://viz.mediapipe.dev/demo/hand_detection)
+*   [MediaPipe Hair Segmentation](https://viz.mediapipe.dev/demo/hair_segmentation)
 
 ## Getting started
-See mobile, desktop, web and Google Coral [examples](mediapipe/docs/examples.md).
 
-## Documentation
-[MediaPipe Read-the-Docs](https://mediapipe.readthedocs.io/) or [docs.mediapipe.dev](https://docs.mediapipe.dev)
+Learn how to [install](https://google.github.io/mediapipe/getting_started/install)
+MediaPipe and
+[build example applications](https://google.github.io/mediapipe/getting_started/building_examples),
+and start exploring our ready-to-use
+[solutions](https://google.github.io/mediapipe/solutions/solutions) that you can
+further extend and customize.
 
-Check out the [Examples page](https://mediapipe.readthedocs.io/en/latest/examples.html) for tutorials on how to use MediaPipe. [Concepts page](https://mediapipe.readthedocs.io/en/latest/concepts.html) for basic definitions
-
-## Visualizing MediaPipe graphs
-A web-based visualizer is hosted on [viz.mediapipe.dev](https://viz.mediapipe.dev/). Please also see instructions [here](mediapipe/docs/visualizer.md).
-
-## Google Open Source Code search
-Search MediaPipe Github repository using [Google Open Source code search](https://t.co/LSZnbMUUnT?amp=1)
-
-## Videos
-*  [YouTube Channel](https://www.youtube.com/channel/UCObqmpuSMx-usADtL_qdMAw)
+The source code is hosted in the
+[MediaPipe Github repository](https://github.com/google/mediapipe), and you can
+run code search using
+[Google Open Source Code Search](https://cs.opensource.google/mediapipe/mediapipe).
 
 ## Publications
-* [MediaPipe KNIFT: Template-based Feature Matching](https://mediapipe.page.link/knift-blog)
-* [Alfred Camera: Smart camera features using MediaPipe](https://developers.googleblog.com/2020/03/alfred-camera-smart-camera-features-using-mediapipe.html)
-* [MediaPipe Objectron: Real-time 3D Object Detection on Mobile Devices](https://mediapipe.page.link/objectron-aiblog)
-* [AutoFlip: An Open Source Framework for Intelligent Video Reframing](https://mediapipe.page.link/autoflip)
-* [Google Developer Blog: MediaPipe on the Web](https://mediapipe.page.link/webdevblog)
-* [Google Developer Blog: Object Detection and Tracking using MediaPipe](https://mediapipe.page.link/objecttrackingblog)
-* [On-Device, Real-Time Hand Tracking with MediaPipe](https://ai.googleblog.com/2019/08/on-device-real-time-hand-tracking-with.html)
-* [MediaPipe: A Framework for Building Perception Pipelines](https://arxiv.org/abs/1906.08172)
+
+*   [MediaPipe KNIFT: Template-based feature matching](https://developers.googleblog.com/2020/04/mediapipe-knift-template-based-feature-matching.html)
+    in Google Developers Blog
+*   [Alfred Camera: Smart camera features using MediaPipe](https://developers.googleblog.com/2020/03/alfred-camera-smart-camera-features-using-mediapipe.html)
+    in Google Developers Blog
+*   [Real-Time 3D Object Detection on Mobile Devices with MediaPipe](https://ai.googleblog.com/2020/03/real-time-3d-object-detection-on-mobile.html)
+    in Google AI Blog
+*   [AutoFlip: An Open Source Framework for Intelligent Video Reframing](https://ai.googleblog.com/2020/02/autoflip-open-source-framework-for.html)
+    in Google AI Blog
+*   [MediaPipe on the Web](https://developers.googleblog.com/2020/01/mediapipe-on-web.html)
+    in Google Developers Blog
+*   [Object Detection and Tracking using MediaPipe](https://developers.googleblog.com/2019/12/object-detection-and-tracking-using-mediapipe.html)
+    in Google Developers Blog
+*   [On-Device, Real-Time Hand Tracking with MediaPipe](https://ai.googleblog.com/2019/08/on-device-real-time-hand-tracking-with.html)
+    in Google AI Blog
+*   [MediaPipe: A Framework for Building Perception Pipelines](https://arxiv.org/abs/1906.08172)
+
+## Videos
+
+*   [YouTube Channel](https://www.youtube.com/channel/UCObqmpuSMx-usADtL_qdMAw)
 
 ## Events
-* [MediaPipe Seattle Meetup, Google Building Waterside, 13 Feb 2020](https://mediapipe.page.link/seattle2020)
-* [AI Nextcon 2020, 12-16 Feb 2020, Seattle](http://aisea20.xnextcon.com/)
-* [MediaPipe Madrid Meetup, 16 Dec 2019](https://www.meetup.com/Madrid-AI-Developers-Group/events/266329088/)
-* [MediaPipe London Meetup, Google 123 Building, 12 Dec 2019](https://www.meetup.com/London-AI-Tech-Talk/events/266329038)
-* [ML Conference, Berlin, 11 Dec 2019](https://mlconference.ai/machine-learning-advanced-development/mediapipe-building-real-time-cross-platform-mobile-web-edge-desktop-video-audio-ml-pipelines/)
-* [MediaPipe Berlin Meetup, Google Berlin, 11 Dec 2019](https://www.meetup.com/Berlin-AI-Tech-Talk/events/266328794/)
-* [The 3rd Workshop on YouTube-8M Large Scale Video Understanding Workshop](https://research.google.com/youtube8m/workshop2019/index.html) Seoul, Korea ICCV 2019
-* [AI DevWorld 2019](https://aidevworld.com) on Oct 10 in San Jose, California
-* [Google Industry Workshop at ICIP 2019](http://2019.ieeeicip.org/?action=page4&id=14#Google) [Presentation](https://docs.google.com/presentation/d/e/2PACX-1vRIBBbO_LO9v2YmvbHHEt1cwyqH6EjDxiILjuT0foXy1E7g6uyh4CesB2DkkEwlRDO9_lWfuKMZx98T/pub?start=false&loop=false&delayms=3000&slide=id.g556cc1a659_0_5) on Sept 24 in Taipei, Taiwan
-* [Open sourced at CVPR 2019](https://sites.google.com/corp/view/perception-cv4arvr/mediapipe) on June 17~20 in Long Beach, CA
+
+*   [MediaPipe Seattle Meetup, Google Building Waterside, 13 Feb 2020](https://mediapipe.page.link/seattle2020)
+*   [AI Nextcon 2020, 12-16 Feb 2020, Seattle](http://aisea20.xnextcon.com/)
+*   [MediaPipe Madrid Meetup, 16 Dec 2019](https://www.meetup.com/Madrid-AI-Developers-Group/events/266329088/)
+*   [MediaPipe London Meetup, Google 123 Building, 12 Dec 2019](https://www.meetup.com/London-AI-Tech-Talk/events/266329038)
+*   [ML Conference, Berlin, 11 Dec 2019](https://mlconference.ai/machine-learning-advanced-development/mediapipe-building-real-time-cross-platform-mobile-web-edge-desktop-video-audio-ml-pipelines/)
+*   [MediaPipe Berlin Meetup, Google Berlin, 11 Dec 2019](https://www.meetup.com/Berlin-AI-Tech-Talk/events/266328794/)
+*   [The 3rd Workshop on YouTube-8M Large Scale Video Understanding Workshop,
+    Seoul, Korea ICCV
+    2019](https://research.google.com/youtube8m/workshop2019/index.html)
+*   [AI DevWorld 2019, 10 Oct 2019, San Jose, CA](https://aidevworld.com)
+*   [Google Industry Workshop at ICIP 2019, 24 Sept 2019, Taipei, Taiwan](http://2019.ieeeicip.org/?action=page4&id=14#Google)
+    ([presentation](https://docs.google.com/presentation/d/e/2PACX-1vRIBBbO_LO9v2YmvbHHEt1cwyqH6EjDxiILjuT0foXy1E7g6uyh4CesB2DkkEwlRDO9_lWfuKMZx98T/pub?start=false&loop=false&delayms=3000&slide=id.g556cc1a659_0_5))
+*   [Open sourced at CVPR 2019, 17~20 June, Long Beach, CA](https://sites.google.com/corp/view/perception-cv4arvr/mediapipe)
 
 ## Community
-*  [Awesome MediaPipe: curation of code related to MediaPipe](https://mediapipe.org)
-*  [Slack community for MediaPipe users](https://mediapipe.slack.com)
-*  [Discuss](https://groups.google.com/forum/#!forum/mediapipe) - General community discussion around MediaPipe
+
+*   [Awesome MediaPipe](https://mediapipe.org) - A curated list of awesome
+    MediaPipe related frameworks, libraries and software
+*   [Slack community](https://mediapipe.slack.com) for MediaPipe users
+*   [Discuss](https://groups.google.com/forum/#!forum/mediapipe) - General
+    community discussion around MediaPipe
 
 ## Alpha Disclaimer
-MediaPipe is currently in alpha for v0.7. We are still making breaking API changes and expect to get to stable API by v1.0.
+
+MediaPipe is currently in alpha at v0.7. We may still be making breaking API
+changes and expect to get to stable APIs by v1.0.
 
 ## Contributing
-We welcome contributions. Please follow these [guidelines](./CONTRIBUTING.md).
 
-We use GitHub issues for tracking requests and bugs. Please post questions to the MediaPipe Stack Overflow with a 'mediapipe' tag.
+We welcome contributions. Please follow these
+[guidelines](https://github.com/google/mediapipe/blob/master/CONTRIBUTING.md).
+
+We use GitHub issues for tracking requests and bugs. Please post questions to
+the MediaPipe Stack Overflow with a `mediapipe` tag.
diff --git a/mediapipe/docs/Makefile b/docs/Makefile
similarity index 100%
rename from mediapipe/docs/Makefile
rename to docs/Makefile
diff --git a/docs/_config.yml b/docs/_config.yml
new file mode 100644
index 000000000..4da202e75
--- /dev/null
+++ b/docs/_config.yml
@@ -0,0 +1,29 @@
+# Configuration for GitHub Pages
+
+remote_theme: pmarsceill/just-the-docs
+
+# Set a path/url to a logo that will be displayed instead of the title
+logo: "images/logo_horizontal_color.png"
+
+# Enable or disable the site search
+search_enabled: true
+
+# Set the search token separator for hyphenated-word search:
+search_tokenizer_separator: /[\s/]+/
+
+# Enable or disable heading anchors
+heading_anchors: true
+
+# Aux links for the upper right navigation
+aux_links:
+  "MediaPipe on GitHub":
+    - "//github.com/google/mediapipe"
+
+# Footer content appears at the bottom of every page's main content
+footer_content: "&copy; 2020 GOOGLE LLC | <a href=\"https://policies.google.com/privacy\">PRIVACY POLICY</a> | <a href=\"https://policies.google.com/terms\">TERMS OF SERVICE</a>"
+
+# Color scheme currently only supports "dark" or nil (default)
+color_scheme: nil
+
+# Google Analytics Tracking (optional)
+ga_tracking: UA-140696581-2
diff --git a/mediapipe/docs/conf.py b/docs/conf.py
similarity index 100%
rename from mediapipe/docs/conf.py
rename to docs/conf.py
diff --git a/mediapipe/docs/data/visualizer/sample_trace.binarypb b/docs/data/visualizer/sample_trace.binarypb
similarity index 100%
rename from mediapipe/docs/data/visualizer/sample_trace.binarypb
rename to docs/data/visualizer/sample_trace.binarypb
diff --git a/docs/examples.md b/docs/examples.md
new file mode 100644
index 000000000..b45a2ee39
--- /dev/null
+++ b/docs/examples.md
@@ -0,0 +1,96 @@
+---
+nav_exclude: true
+---
+
+# Examples
+
+Below are code samples on how to run MediaPipe on both mobile and desktop. We
+currently support MediaPipe APIs on mobile for Android only but will add support
+for Objective-C shortly.
+
+## Mobile
+
+### [Hello World! on Android](./getting_started/hello_world_android.md)
+
+This should be the first mobile Android example users go through in detail. It
+teaches the following:
+
+*   Introduction of a simple MediaPipe graph running on mobile GPUs for
+    [Sobel edge detection](https://en.wikipedia.org/wiki/Sobel_operator).
+*   Building a simple baseline Android application that displays "Hello World!".
+*   Adding camera preview support into the baseline application using the
+    Android [CameraX] API.
+*   Incorporating the Sobel edge detection graph to process the live camera
+    preview and display the processed video in real-time.
+
+[Sobel edge detection]:https://en.wikipedia.org/wiki/Sobel_operator
+[CameraX]:https://developer.android.com/training/camerax
+
+### [Hello World! on iOS](./getting_started/hello_world_ios.md)
+
+This is the iOS version of Sobel edge detection example.
+
+### [Face Detection](./solutions/face_detection.md)
+
+### [Face Mesh](./solutions/face_mesh.md)
+
+### [Hand](./solutions/hand.md)
+
+### [Hair Segmentation](./solutions/hair_segmentation.md)
+
+### [Object Detection](./solutions/object_detection.md)
+
+### [Box Tracking](./solutions/box_tracking.md)
+
+### [Objectron: 3D Object Detection](./solutions/objectron.md)
+
+### [KNIFT: Template-based Feature Matching](./solutions/knift.md)
+
+## Desktop
+
+### [Hello World for C++](./getting_started/hello_world_desktop.md)
+
+This shows how to run a simple graph using the MediaPipe C++ APIs.
+
+### [Face Detection](./solutions/face_detection.md)
+
+### [Face Mesh](./solutions/face_mesh.md)
+
+### [Hand](./solutions/hand.md)
+
+### [Hair Segmentation](./solutions/hair_segmentation.md)
+
+### [Object Detection](./solutions/object_detection.md)
+
+### [Box Tracking](./solutions/box_tracking.md)
+
+### [AutoFlip - Semantic-aware Video Cropping](./solutions/autoflip.md)
+
+### [Preparing Data Sets with MediaSequence](./solutions/media_sequence.md)
+
+This shows how to use MediaPipe for media processing to prepare video data sets
+for training a TensorFlow model.
+
+### [Feature Extraction and Model Inference for YouTube-8M Challenge](./solutions/youtube_8m.md)
+
+This shows how to use MediaPipe to prepare training data for the YouTube-8M
+Challenge and do the model inference with the baseline model.
+
+## Google Coral (ML acceleration with Google EdgeTPU)
+
+### [Face Detection](./solutions/face_detection.md)
+
+### [Object Detection](./solutions/object_detection.md)
+
+## Web Browser
+
+See more details [here](./getting_started/web.md) and
+[Google Developer blog post](https://mediapipe.page.link/webdevblog).
+
+### [Face Detection in Browser](https://viz.mediapipe.dev/demo/face_detection)
+
+### [Hand Detection in Browser](https://viz.mediapipe.dev/demo/hand_detection)
+
+### [Hand Tracking in Browser](https://viz.mediapipe.dev/demo/hand_tracking)
+
+### [Hair Segmentation in Browser](https://viz.mediapipe.dev/demo/hair_segmentation)
diff --git a/docs/framework_concepts/calculators.md b/docs/framework_concepts/calculators.md
new file mode 100644
index 000000000..66aefb7b1
--- /dev/null
+++ b/docs/framework_concepts/calculators.md
@@ -0,0 +1,412 @@
+---
+layout: default
+title: Calculators
+parent: Framework Concepts
+nav_order: 1
+---
+
+# Calculators
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+Each calculator is a node of a graph. We describe how to create a new
+calculator, how to initialize a calculator, how to perform its calculations,
+input and output streams, timestamps, and options. Each node in the graph is
+implemented as a `Calculator`. The bulk of graph execution happens inside its
+calculators. A calculator may receive zero or more input streams and/or side
+packets and produces zero or more output streams and/or side packets.
+
+## CalculatorBase
+
+A calculator is created by defining a new sub-class of the
+[`CalculatorBase`](https://github.com/google/mediapipe/tree/master/mediapipe/framework/calculator_base.cc)
+class, implementing a number of methods, and registering the new sub-class with
+MediaPipe. At a minimum, a new calculator must implement the four methods below:
+
+*   `GetContract()`
+    *   Calculator authors can specify the expected types of inputs and outputs
+        of a calculator in GetContract(). When a graph is initialized, the
+        framework calls a static method to verify if the packet types of the
+        connected inputs and outputs match the information in this
+        specification.
+*   `Open()`
+    *   After a graph starts, the framework calls `Open()`. The input side
+        packets are available to the calculator at this point. `Open()`
+        interprets the node configuration operations (see [Graphs](graphs.md))
+        and prepares the calculator's per-graph-run state. This function may
+        also write packets to calculator outputs. An error during `Open()` can
+        terminate the graph run.
+*   `Process()`
+    *   For a calculator with inputs, the framework calls `Process()` repeatedly
+        whenever at least one input stream has a packet available. The framework
+        by default guarantees that all inputs have the same timestamp (see
+        [Synchronization](synchronization.md) for more information). Multiple
+        `Process()` calls can be invoked simultaneously when parallel execution
+        is enabled. If an error occurs during `Process()`, the framework calls
+        `Close()` and the graph run terminates.
+*   `Close()`
+    *   After all calls to `Process()` finish or when all input streams close,
+        the framework calls `Close()`. This function is always called if
+        `Open()` was called and succeeded and even if the graph run terminated
+        because of an error. No inputs are available via any input streams
+        during `Close()`, but it still has access to input side packets and
+        therefore may write outputs. After `Close()` returns, the calculator
+        should be considered a dead node. The calculator object is destroyed as
+        soon as the graph finishes running.
+
+The following are code snippets from
+[calculator_base.h](https://github.com/google/mediapipe/tree/master/mediapipe/framework/calculator_base.h).
+
+```c++
+class CalculatorBase {
+ public:
+  ...
+
+  // The subclasses of CalculatorBase must implement GetContract.
+  // ...
+  static ::mediapipe::Status GetContract(CalculatorContract* cc);
+
+  // Open is called before any Process() calls, on a freshly constructed
+  // calculator.  Subclasses may override this method to perform necessary
+  // setup, and possibly output Packets and/or set output streams' headers.
+  // ...
+  virtual ::mediapipe::Status Open(CalculatorContext* cc) {
+    return ::mediapipe::OkStatus();
+  }
+
+  // Processes the incoming inputs. May call the methods on cc to access
+  // inputs and produce outputs.
+  // ...
+  virtual ::mediapipe::Status Process(CalculatorContext* cc) = 0;
+
+  // Is called if Open() was called and succeeded.  Is called either
+  // immediately after processing is complete or after a graph run has ended
+  // (if an error occurred in the graph).  ...
+  virtual ::mediapipe::Status Close(CalculatorContext* cc) {
+    return ::mediapipe::OkStatus();
+  }
+
+  ...
+};
+```
+
+## Life of a calculator
+
+During initialization of a MediaPipe graph, the framework calls a
+`GetContract()` static method to determine what kinds of packets are expected.
+
+The framework constructs and destroys the entire calculator for each graph run
+(e.g. once per video or once per image). Expensive or large objects that remain
+constant across graph runs should be supplied as input side packets so the
+calculations are not repeated on subsequent runs.
+
+After initialization, for each run of the graph, the following sequence occurs:
+
+*   `Open()`
+*   `Process()` (repeatedly)
+*   `Close()`
+
+The framework calls `Open()` to initialize the calculator. `Open()` should
+interpret any options and set up the calculator's per-graph-run state. `Open()`
+may obtain input side packets and write packets to calculator outputs. If
+appropriate, it should call `SetOffset()` to reduce potential packet buffering
+of input streams.
+
+If an error occurs during `Open()` or `Process()` (as indicated by one of them
+returning a non-`Ok` status), the graph run is terminated with no further calls
+to the calculator's methods, and the calculator is destroyed.
+
+For a calculator with inputs, the framework calls `Process()` whenever at least
+one input has a packet available. The framework guarantees that inputs all have
+the same timestamp, that timestamps increase with each call to `Process()` and
+that all packets are delivered. As a consequence, some inputs may not have any
+packets when `Process()` is called. An input whose packet is missing appears to
+produce an empty packet (with no timestamp).
+
+The framework calls `Close()` after all calls to `Process()`. All inputs will
+have been exhausted, but `Close()` has access to input side packets and may
+write outputs. After `Close()` returns, the calculator is destroyed.
+
+Calculators with no inputs are referred to as sources. A source calculator
+continues to have `Process()` called as long as it returns an `Ok` status. A
+source calculator indicates that it is exhausted by returning a stop status
+(i.e. `mediapipe::tool::StatusStop()`).
+
+## Identifying inputs and outputs
+
+The public interface to a calculator consists of a set of input streams and
+output streams. In a CalculatorGraphConfiguration, the outputs from some
+calculators are connected to the inputs of other calculators using named
+streams. Stream names are normally lowercase, while input and output tags are
+normally UPPERCASE. In the example below, the output with tag name `VIDEO` is
+connected to the input with tag name `VIDEO_IN` using the stream named
+`video_stream`.
+
+```proto
+# Graph describing calculator SomeAudioVideoCalculator
+node {
+  calculator: "SomeAudioVideoCalculator"
+  input_stream: "INPUT:combined_input"
+  output_stream: "VIDEO:video_stream"
+}
+node {
+  calculator: "SomeVideoCalculator"
+  input_stream: "VIDEO_IN:video_stream"
+  output_stream: "VIDEO_OUT:processed_video"
+}
+```
+
+Input and output streams can be identified by index number, by tag name, or by a
+combination of tag name and index number. You can see some examples of input and
+output identifiers in the example below. `SomeAudioVideoCalculator` identifies
+its video output by tag and its audio outputs by the combination of tag and
+index. The output with tag `VIDEO` is connected to the stream named
+`video_stream`. The outputs with tag `AUDIO` and indices `0` and `1` are
+connected to the streams named `audio_left` and `audio_right`.
+`SomeAudioCalculator` identifies its audio inputs by index only (no tag needed).
+
+```proto
+# Graph describing calculator SomeAudioVideoCalculator
+node {
+  calculator: "SomeAudioVideoCalculator"
+  input_stream: "combined_input"
+  output_stream: "VIDEO:video_stream"
+  output_stream: "AUDIO:0:audio_left"
+  output_stream: "AUDIO:1:audio_right"
+}
+
+node {
+  calculator: "SomeAudioCalculator"
+  input_stream: "audio_left"
+  input_stream: "audio_right"
+  output_stream: "audio_energy"
+}
+```
+
+In the calculator implementation, inputs and outputs are also identified by tag
+name and index number. In the function below, inputs and outputs are identified:
+
+*   By index number: The combined input stream is identified simply by index
+    `0`.
+*   By tag name: The video output stream is identified by tag name "VIDEO".
+*   By tag name and index number: The output audio streams are identified by the
+    combination of the tag name `AUDIO` and the index numbers `0` and `1`.
+
+```c++
+// c++ Code snippet describing the SomeAudioVideoCalculator GetContract() method
+class SomeAudioVideoCalculator : public CalculatorBase {
+ public:
+  static ::mediapipe::Status GetContract(CalculatorContract* cc) {
+    cc->Inputs().Index(0).SetAny();
+    // SetAny() is used to specify that whatever the type of the
+    // stream is, it's acceptable.  This does not mean that any
+    // packet is acceptable.  Packets in the stream still have a
+    // particular type.  SetAny() has the same effect as explicitly
+    // setting the type to be the stream's type.
+    cc->Outputs().Tag("VIDEO").Set<ImageFrame>();
+    cc->Outputs().Get("AUDIO", 0).Set<Matrix>();
+    cc->Outputs().Get("AUDIO", 1).Set<Matrix>();
+    return ::mediapipe::OkStatus();
+  }
+```
+
+## Processing
+
+`Process()` called on a non-source node must return `::mediapipe::OkStatus()` to
+indicate that all went well, or any other status code to signal an error.
+
+If a non-source calculator returns `tool::StatusStop()`, then this signals the
+graph is being cancelled early. In this case, all source calculators and graph
+input streams will be closed (and remaining Packets will propagate through the
+graph).
+
+A source node in a graph will continue to have `Process()` called on it as long
+as it returns `::mediapipe::OkStatus()`. To indicate that there is no more data
+to be generated return `tool::StatusStop()`. Any other status indicates an error
+has occurred.
+
+`Close()` returns `::mediapipe::OkStatus()` to indicate success. Any other
+status indicates a failure.
+
+Here is the basic `Process()` function. It uses the `Input()` method (which can
+be used only if the calculator has a single input) to request its input data. It
+then uses `std::unique_ptr` to allocate the memory needed for the output packet,
+and does the calculations. When done it releases the pointer when adding it to
+the output stream.
+
+```c++
+::util::Status MyCalculator::Process() {
+  const Matrix& input = Input()->Get<Matrix>();
+  std::unique_ptr<Matrix> output(new Matrix(input.rows(), input.cols()));
+  // do your magic here....
+  //    output->row(n) =  ...
+  Output()->Add(output.release(), InputTimestamp());
+  return ::mediapipe::OkStatus();
+}
+```
+
+## Example calculator
+
+This section discusses the implementation of `PacketClonerCalculator`, which
+does a relatively simple job, and is used in many calculator graphs.
+`PacketClonerCalculator` simply produces a copy of its most recent input
+packets on demand.
+
+`PacketClonerCalculator` is useful when the timestamps of arriving data packets
+are not aligned perfectly. Suppose we have a room with a microphone, light
+sensor and a video camera that is collecting sensory data. Each of the sensors
+operates independently and collects data intermittently. Suppose that the output
+of each sensor is:
+
+*   microphone = loudness in decibels of sound in the room (Integer)
+*   light sensor = brightness of room (Integer)
+*   video camera = RGB image frame of room (ImageFrame)
+
+Our simple perception pipeline is designed to process sensory data from these 3
+sensors such that whenever we have image frame data from the camera, it is
+synchronized with the last collected microphone loudness data and light sensor
+brightness data. To do this with MediaPipe, our perception pipeline has 3
+input streams:
+
+*   room_mic_signal - Each packet of data in this input stream is integer data
+    representing how loud audio is in a room with timestamp.
+*   room_lighting_sensor - Each packet of data in this input stream is integer
+    data representing how brightly the room is illuminated with timestamp.
+*   room_video_tick_signal - Each packet of data in this input stream is
+    imageframe of video data representing video collected from camera in the
+    room with timestamp.
+
+Below is the implementation of the `PacketClonerCalculator`.  You can see
+the `GetContract()`, `Open()`, and `Process()` methods as well as the instance
+variable `current_` which holds the most recent input packets.
+
+```c++
+// This takes packets from N+1 streams, A_1, A_2, ..., A_N, B.
+// For every packet that appears in B, outputs the most recent packet from each
+// of the A_i on a separate stream.
+
+#include <vector>
+
+#include "absl/strings/str_cat.h"
+#include "mediapipe/framework/calculator_framework.h"
+
+namespace mediapipe {
+
+// For every packet received on the last stream, output the latest packet
+// obtained on all other streams. Therefore, if the last stream outputs at a
+// higher rate than the others, this effectively clones the packets from the
+// other streams to match the last.
+//
+// Example config:
+// node {
+//   calculator: "PacketClonerCalculator"
+//   input_stream: "first_base_signal"
+//   input_stream: "second_base_signal"
+//   input_stream: "tick_signal"
+//   output_stream: "cloned_first_base_signal"
+//   output_stream: "cloned_second_base_signal"
+// }
+//
+class PacketClonerCalculator : public CalculatorBase {
+ public:
+  static ::mediapipe::Status GetContract(CalculatorContract* cc) {
+    const int tick_signal_index = cc->Inputs().NumEntries() - 1;
+    // cc->Inputs().NumEntries() returns the number of input streams
+    // for the PacketClonerCalculator
+    for (int i = 0; i < tick_signal_index; ++i) {
+      cc->Inputs().Index(i).SetAny();
+      // cc->Inputs().Index(i) returns the input stream pointer by index
+      cc->Outputs().Index(i).SetSameAs(&cc->Inputs().Index(i));
+    }
+    cc->Inputs().Index(tick_signal_index).SetAny();
+    return ::mediapipe::OkStatus();
+  }
+
+  ::mediapipe::Status Open(CalculatorContext* cc) final {
+    tick_signal_index_ = cc->Inputs().NumEntries() - 1;
+    current_.resize(tick_signal_index_);
+    // Pass along the header for each stream if present.
+    for (int i = 0; i < tick_signal_index_; ++i) {
+      if (!cc->Inputs().Index(i).Header().IsEmpty()) {
+        cc->Outputs().Index(i).SetHeader(cc->Inputs().Index(i).Header());
+        // Sets the output stream of index i header to be the same as
+        // the header for the input stream of index i
+      }
+    }
+    return ::mediapipe::OkStatus();
+  }
+
+  ::mediapipe::Status Process(CalculatorContext* cc) final {
+    // Store input signals.
+    for (int i = 0; i < tick_signal_index_; ++i) {
+      if (!cc->Inputs().Index(i).Value().IsEmpty()) {
+        current_[i] = cc->Inputs().Index(i).Value();
+      }
+    }
+
+    // Output if the tick signal is non-empty.
+    if (!cc->Inputs().Index(tick_signal_index_).Value().IsEmpty()) {
+      for (int i = 0; i < tick_signal_index_; ++i) {
+        if (!current_[i].IsEmpty()) {
+          cc->Outputs().Index(i).AddPacket(
+              current_[i].At(cc->InputTimestamp()));
+          // Add a packet to output stream of index i a packet from inputstream i
+          // with timestamp common to all present inputs
+          //
+        } else {
+          cc->Outputs().Index(i).SetNextTimestampBound(
+              cc->InputTimestamp().NextAllowedInStream());
+          // if current_[i], 1 packet buffer for input stream i is empty, we will set
+          // next allowed timestamp for output stream i to be current timestamp + 1
+        }
+      }
+    }
+    return ::mediapipe::OkStatus();
+  }
+
+ private:
+  std::vector<Packet> current_;
+  int tick_signal_index_;
+};
+
+REGISTER_CALCULATOR(PacketClonerCalculator);
+}  // namespace mediapipe
+```
+
+Typically, a calculator has only a .cc file. No .h is required, because
+mediapipe uses registration to make calculators known to it. After you have
+defined your calculator class, register it with a macro invocation
+REGISTER_CALCULATOR(calculator_class_name).
+
+Below is a trivial MediaPipe graph that has 3 input streams, 1 node
+(PacketClonerCalculator) and 2 output streams.
+
+```proto
+input_stream: "room_mic_signal"
+input_stream: "room_lighting_sensor"
+input_stream: "room_video_tick_signal"
+
+node {
+   calculator: "PacketClonerCalculator"
+   input_stream: "room_mic_signal"
+   input_stream: "room_lighting_sensor"
+   input_stream: "room_video_tick_signal"
+   output_stream: "cloned_room_mic_signal"
+   output_stream: "cloned_lighting_sensor"
+ }
+```
+
+The diagram below shows how the `PacketClonerCalculator` defines its output
+packets based on its series of input packets.
+
+| ![Graph using                                                                |
+: PacketClonerCalculator](../images/packet_cloner_calculator.png)              :
+| :--------------------------------------------------------------------------: |
+| *Each time it receives a packet on its TICK input stream, the                |
+: PacketClonerCalculator outputs the most recent packet from each of its input :
+: streams. The sequence of output packets is determined by the sequence of     :
+: input packets and their timestamps. The timestamps are shown along the right :
+: side of the diagram.*                                                        :
diff --git a/mediapipe/docs/concepts.md b/docs/framework_concepts/framework_concepts.md
similarity index 62%
rename from mediapipe/docs/concepts.md
rename to docs/framework_concepts/framework_concepts.md
index 37d988e6d..b39adf154 100644
--- a/mediapipe/docs/concepts.md
+++ b/docs/framework_concepts/framework_concepts.md
@@ -1,24 +1,42 @@
-# MediaPipe Concepts
+---
+layout: default
+title: Framework Concepts
+nav_order: 5
+has_children: true
+has_toc: false
+---
+
+# Framework Concepts
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 ## The basics
 
 ### Packet
 
-The basic data flow unit. A packet consists of a numeric timestamp and a shared pointer to an **immutable** payload. The payload can be of any C++ type, and the payload's type is also referred to as the type of the packet. Packets are value classes and can be copied cheaply. Each copy shares ownership of the payload, with reference-counting semantics. Each copy has its own timestamp. [Details](packets.md).
+The basic data flow unit. A packet consists of a numeric timestamp and a shared
+pointer to an **immutable** payload. The payload can be of any C++ type, and the
+payload's type is also referred to as the type of the packet. Packets are value
+classes and can be copied cheaply. Each copy shares ownership of the payload,
+with reference-counting semantics. Each copy has its own timestamp. See also
+[Packet](packets.md).
 
 ### Graph
 
 MediaPipe processing takes place inside a graph, which defines packet flow paths
 between **nodes**. A graph can have any number of inputs and outputs, and data
-flow can branch and merge. Generally data flows forward, but
-[backward loops](cycles.md) are possible.
+flow can branch and merge. Generally data flows forward, but backward loops are
+possible. See [Graphs](graphs.md) for details.
 
 ### Nodes
 
 Nodes produce and/or consume packets, and they are where the bulk of the graph’s
 work takes place. They are also known as “calculators”, for historical reasons.
-Each node’s interface defines a number of input and output **ports**, identified by
-a tag and/or an index.
+Each node’s interface defines a number of input and output **ports**, identified
+by a tag and/or an index. See [Calculators](calculators.md) for details.
 
 ### Streams
 
@@ -34,21 +52,23 @@ whereas a stream represents a flow of data that changes over time.
 ### Packet Ports
 
 A port has an associated type; packets transiting through the port must be of
-that type. An output stream port can be connected to any number of
-input stream ports of the same type; each consumer receives a separate copy of
-the output packets, and has its own queue, so it can consume them at its own
-pace. Similarly, a side packet output port can be connected to as many side
-packet input ports as desired.
+that type. An output stream port can be connected to any number of input stream
+ports of the same type; each consumer receives a separate copy of the output
+packets, and has its own queue, so it can consume them at its own pace.
+Similarly, a side packet output port can be connected to as many side packet
+input ports as desired.
 
 A port can be required, meaning that a connection must be made for the graph to
 be valid, or optional, meaning it may remain unconnected.
 
-Note: even if a stream connection is required, the stream may not carry a packet for all timestamps.
+Note: even if a stream connection is required, the stream may not carry a packet
+for all timestamps.
 
 ## Input and output
 
 Data flow can originate from **source nodes**, which have no input streams and
-produce packets spontaneously (e.g. by reading from a file); or from **graph input streams**, which let an application feed packets into a graph.
+produce packets spontaneously (e.g. by reading from a file); or from **graph
+input streams**, which let an application feed packets into a graph.
 
 Similarly, there are **sink nodes** that receive data and write it to various
 destinations (e.g. a file, a memory buffer, etc.), and an application can also
@@ -78,15 +98,15 @@ processed data.
 
 ### Input policies
 
-The default input policy is deterministic collation of packets by timestamp. A node receives
-all inputs for the same timestamp at the same time, in an invocation of its
-Process method; and successive input sets are received in their timestamp order. This can
-require delaying the processing of some packets until a packet with the same
-timestamp is received on all input streams, or until it can be guaranteed that a
-packet with that timestamp will not be arriving on the streams that have not
-received it.
+The default input policy is deterministic collation of packets by timestamp. A
+node receives all inputs for the same timestamp at the same time, in an
+invocation of its Process method; and successive input sets are received in
+their timestamp order. This can require delaying the processing of some packets
+until a packet with the same timestamp is received on all input streams, or
+until it can be guaranteed that a packet with that timestamp will not be
+arriving on the streams that have not received it.
 
 Other policies are also available, implemented using a separate kind of
 component known as an InputStreamHandler.
 
-See [scheduling](scheduling_sync.md) for more details.
+See [Synchronization](synchronization.md) for more details.
diff --git a/mediapipe/docs/gpu.md b/docs/framework_concepts/gpu.md
similarity index 52%
rename from mediapipe/docs/gpu.md
rename to docs/framework_concepts/gpu.md
index e2d2be983..06355ac44 100644
--- a/mediapipe/docs/gpu.md
+++ b/docs/framework_concepts/gpu.md
@@ -1,14 +1,18 @@
-## Running on GPUs
+---
+layout: default
+title: GPU
+parent: Framework Concepts
+nav_order: 5
+---
 
--   [Overview](#overview)
--   [OpenGL ES Support](#opengl-es-support)
--   [Disable OpenGL ES Support](#disable-opengl-es-support)
--   [OpenGL ES Setup on Linux Desktop](#opengl-es-setup-on-linux-desktop)
--   [TensorFlow CUDA Support and Setup on Linux Desktop](#tensorflow-cuda-support-and-setup-on-linux-desktop)
--   [Life of a GPU Calculator](#life-of-a-gpu-calculator)
--   [GpuBuffer to ImageFrame Converters](#gpubuffer-to-imageframe-converters)
+# GPU
+{: .no_toc }
 
-### Overview
+1. TOC
+{:toc}
+---
+
+## Overview
 
 MediaPipe supports calculator nodes for GPU compute and rendering, and allows combining multiple GPU nodes, as well as mixing them with CPU based calculator nodes. There exist several GPU APIs on mobile platforms (eg, OpenGL ES, Metal and Vulkan). MediaPipe does not attempt to offer a single cross-API GPU abstraction. Individual nodes can be written using different APIs, allowing them to take advantage of platform specific features when needed.
 
@@ -25,7 +29,7 @@ Below are the design principles for GPU support in MediaPipe
    * Because different platforms may require different techniques for best performance, the API should allow flexibility in the way things are implemented behind the scenes.
    * A calculator should be allowed maximum flexibility in using the GPU for all or part of its operation, combining it with the CPU if necessary.
 
-### OpenGL ES Support
+## OpenGL ES Support
 
 MediaPipe supports OpenGL ES up to version 3.2 on Android/Linux and up to ES 3.0
 on iOS. In addition, MediaPipe also supports Metal on iOS.
@@ -50,172 +54,7 @@ some Android devices. Therefore, our approach is to have one dedicated thread
 per context. Each thread issues GL commands, building up a serial command queue
 on its context, which is then executed by the GPU asynchronously.
 
-### Disable OpenGL ES Support
-
-By default, building MediaPipe (with no special bazel flags) attempts to compile
-and link against OpenGL ES (and for iOS also Metal) libraries.
-
-On platforms where OpenGL ES is not available (see also
-[OpenGL ES Setup on Linux Desktop](#opengl-es-setup-on-linux-desktop)), you
-should disable OpenGL ES support with:
-
-```
-$ bazel build --define MEDIAPIPE_DISABLE_GPU=1 <my-target>
-```
-
-Note: On Android and iOS, OpenGL ES is required by MediaPipe framework and the
-support should never be disabled.
-
-### OpenGL ES Setup on Linux Desktop
-
-On Linux desktop with video cards that support OpenGL ES 3.1+, MediaPipe can run
-GPU compute and rendering and perform TFLite inference on GPU.
-
-To check if your Linux desktop GPU can run MediaPipe with OpenGL ES:
-
-```bash
-$ sudo apt-get install mesa-common-dev libegl1-mesa-dev libgles2-mesa-dev
-$ sudo apt-get install mesa-utils
-$ glxinfo | grep -i opengl
-```
-
-For example, it may print:
-
-```bash
-$ glxinfo | grep -i opengl
-...
-OpenGL ES profile version string: OpenGL ES 3.2 NVIDIA 430.50
-OpenGL ES profile shading language version string: OpenGL ES GLSL ES 3.20
-OpenGL ES profile extensions:
-```
-
-*Notice the ES 3.20 text above.*
-
-You need to see ES 3.1 or greater printed in order to perform TFLite inference
-on GPU in MediaPipe. With this setup, build with:
-
-```
-$ bazel build --copt -DMESA_EGL_NO_X11_HEADERS --copt -DEGL_NO_X11 <my-target>
-```
-
-If only ES 3.0 or below is supported, you can still build MediaPipe targets that
-don't require TFLite inference on GPU with:
-
-```
-$ bazel build --copt -DMESA_EGL_NO_X11_HEADERS --copt -DEGL_NO_X11 --copt -DMEDIAPIPE_DISABLE_GL_COMPUTE <my-target>
-```
-
-Note: MEDIAPIPE_DISABLE_GL_COMPUTE is already defined automatically on all Apple
-systems (Apple doesn't support OpenGL ES 3.1+).
-
-### TensorFlow CUDA Support and Setup on Linux Desktop
-
-MediaPipe framework doesn't require CUDA for GPU compute and rendering. However,
-MediaPipe can work with TensorFlow to perform GPU inference on video cards that
-support CUDA.
-
-To enable TensorFlow GPU inference with MediaPipe, the first step is to follow
-the
-[TensorFlow GPU documentation](https://www.tensorflow.org/install/gpu#software_requirements)
-to install the required NVIDIA software on your Linux desktop.
-
-After installation, update `$PATH` and `$LD_LIBRARY_PATH` and run `ldconfig`
-with:
-
-```
-$ export PATH=/usr/local/cuda-10.1/bin${PATH:+:${PATH}}
-$ export LD_LIBRARY_PATH=/usr/local/cuda/extras/CUPTI/lib64,/usr/local/cuda-10.1/lib64${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}
-$ sudo ldconfig
-```
-
-It's recommended to verify the installation of CUPTI, CUDA, CuDNN, and NVCC:
-
-```
-$ ls /usr/local/cuda/extras/CUPTI
-/lib64
-libcupti.so       libcupti.so.10.1.208  libnvperf_host.so        libnvperf_target.so
-libcupti.so.10.1  libcupti_static.a     libnvperf_host_static.a
-
-$ ls /usr/local/cuda-10.1
-LICENSE  bin  extras   lib64      libnvvp           nvml  samples  src      tools
-README   doc  include  libnsight  nsightee_plugins  nvvm  share    targets  version.txt
-
-$ nvcc -V
-nvcc: NVIDIA (R) Cuda compiler driver
-Copyright (c) 2005-2019 NVIDIA Corporation
-Built on Sun_Jul_28_19:07:16_PDT_2019
-Cuda compilation tools, release 10.1, V10.1.243
-
-$ ls /usr/lib/x86_64-linux-gnu/ | grep libcudnn.so
-libcudnn.so
-libcudnn.so.7
-libcudnn.so.7.6.4
-```
-
-Setting `$TF_CUDA_PATHS` is the way to declare where the CUDA library is. Note
-that the following code snippet also adds `/usr/lib/x86_64-linux-gnu` and
-`/usr/include` into `$TF_CUDA_PATHS` for cudablas and libcudnn.
-
-```
-$ export TF_CUDA_PATHS=/usr/local/cuda-10.1,/usr/lib/x86_64-linux-gnu,/usr/include
-```
-
-To make MediaPipe get TensorFlow's CUDA settings, find TensorFlow's
-[.bazelrc](https://github.com/tensorflow/tensorflow/blob/master/.bazelrc) and
-copy the `build:using_cuda` and `build:cuda` section into MediaPipe's .bazelrc
-file. For example, as of April 23, 2020, TensorFlow's CUDA setting is the
-following:
-
-```
-# This config refers to building with CUDA available. It does not necessarily
-# mean that we build CUDA op kernels.
-build:using_cuda --define=using_cuda=true
-build:using_cuda --action_env TF_NEED_CUDA=1
-build:using_cuda --crosstool_top=@local_config_cuda//crosstool:toolchain
-
-# This config refers to building CUDA op kernels with nvcc.
-build:cuda --config=using_cuda
-build:cuda --define=using_cuda_nvcc=true
-```
-
-Finally, build MediaPipe with TensorFlow GPU with two more flags `--config=cuda`
-and `--spawn_strategy=local`. For example:
-
-```
-$ bazel build -c opt --config=cuda --spawn_strategy=local \
-    --define no_aws_support=true --copt -DMESA_EGL_NO_X11_HEADERS \
-    mediapipe/examples/desktop/object_detection:object_detection_tensorflow
-```
-
-While the binary is running, it prints out the GPU device info:
-
-```
-I external/org_tensorflow/tensorflow/stream_executor/platform/default/dso_loader.cc:44] Successfully opened dynamic library libcuda.so.1
-I external/org_tensorflow/tensorflow/core/common_runtime/gpu/gpu_device.cc:1544] Found device 0 with properties: pciBusID: 0000:00:04.0 name: Tesla T4 computeCapability: 7.5 coreClock: 1.59GHz coreCount: 40 deviceMemorySize: 14.75GiB deviceMemoryBandwidth: 298.08GiB/s
-I external/org_tensorflow/tensorflow/core/common_runtime/gpu/gpu_device.cc:1686] Adding visible gpu devices: 0
-```
-
-You can monitor the GPU usage to verify whether the GPU is used for model
-inference.
-
-```
-$ nvidia-smi --query-gpu=utilization.gpu --format=csv --loop=1
-
-0 %
-0 %
-4 %
-5 %
-83 %
-21 %
-22 %
-27 %
-29 %
-100 %
-0 %
-0%
-```
-
-### Life of a GPU Calculator
+## Life of a GPU Calculator
 
 This section presents the basic structure of the Process method of a GPU
 calculator derived from base class GlSimpleCalculator. The GPU calculator
@@ -302,7 +141,7 @@ choices for MediaPipe GPU support:
    * Data that needs to be shared between all GPU-based calculators is provided as a external input that is implemented as a graph service and is managed by the `GlCalculatorHelper` class.
    * The combination of calculator-specific helpers and a shared graph service allows us great flexibility in managing the GPU resource: we can have a separate context per calculator, share a single context, share a lock or other synchronization primitives, etc. -- and all of this is managed by the helper and hidden from the individual calculators.
 
-### GpuBuffer to ImageFrame Converters
+## GpuBuffer to ImageFrame Converters
 
 We provide two calculators called `GpuBufferToImageFrameCalculator` and `ImageFrameToGpuBufferCalculator`. These calculators convert between `ImageFrame` and `GpuBuffer`, allowing the construction of graphs that combine GPU and CPU calculators. They are supported on both iOS and Android
 
@@ -310,6 +149,15 @@ When possible, these calculators use platform-specific functionality to share da
 
 The below diagram shows the data flow in a mobile application that captures video from the camera, runs it through a MediaPipe graph, and renders the output on the screen in real time. The dashed line indicates which parts are inside the MediaPipe graph proper. This application runs a Canny edge-detection filter on the CPU using OpenCV, and overlays it on top of the original video using the GPU.
 
-| ![How GPU calculators interact](images/gpu_example_graph.png) |
-|:--:|
-| *Video frames from the camera are fed into the graph as `GpuBuffer` packets. The input stream is accessed by two calculators in parallel. `GpuBufferToImageFrameCalculator` converts the buffer into an `ImageFrame`, which is then sent through a grayscale converter and a canny filter (both based on OpenCV and running on the CPU), whose output is then converted into a `GpuBuffer` again. A multi-input GPU calculator, GlOverlayCalculator, takes as input both the original `GpuBuffer` and the one coming out of the edge detector, and overlays them using a shader. The output is then sent back to the application using a callback calculator, and the application renders the image to the screen using OpenGL.* |
+| ![How GPU calculators interact](../images/gpu_example_graph.png)             |
+| :--------------------------------------------------------------------------: |
+| *Video frames from the camera are fed into the graph as `GpuBuffer` packets. |
+: The input stream is accessed by two calculators in parallel.                 :
+: `GpuBufferToImageFrameCalculator` converts the buffer into an `ImageFrame`,  :
+: which is then sent through a grayscale converter and a canny filter (both    :
+: based on OpenCV and running on the CPU), whose output is then converted into :
+: a `GpuBuffer` again. A multi-input GPU calculator, GlOverlayCalculator,      :
+: takes as input both the original `GpuBuffer` and the one coming out of the   :
+: edge detector, and overlays them using a shader. The output is then sent     :
+: back to the application using a callback calculator, and the application     :
+: renders the image to the screen using OpenGL.*                               :
diff --git a/docs/framework_concepts/graphs.md b/docs/framework_concepts/graphs.md
new file mode 100644
index 000000000..83f95e5bb
--- /dev/null
+++ b/docs/framework_concepts/graphs.md
@@ -0,0 +1,271 @@
+---
+layout: default
+title: Graphs
+parent: Framework Concepts
+nav_order: 2
+---
+
+# Graphs
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+## GraphConfig
+
+A `GraphConfig` is a specification that describes the topology and functionality
+of a MediaPipe graph. In the specification, a node in the graph represents an
+instance of a particular calculator. All the necessary configurations of the
+node, such as its type, inputs and outputs, must be described in the
+specification. The description of the node can also include several optional
+fields, such as node-specific options, input policy and executor, discussed in
+[Synchronization](synchronization.md).
+
+`GraphConfig` has several other fields to configure the global graph-level
+settings, e.g., graph executor configs, number of threads, and maximum queue
+size of input streams. Several graph-level settings are useful for tuning the
+performance of the graph on different platforms (e.g., desktop vs. mobile). For
+instance, on mobile, attaching a heavy model-inference calculator to a separate
+executor can improve the performance of a real-time application since this
+enables thread locality.
+
+Below is a trivial `GraphConfig` example where we have a series of passthrough
+calculators:
+
+```proto
+# This graph named main_pass_throughcals_nosubgraph.pbtxt contains 4
+# passthrough calculators.
+input_stream: "in"
+node {
+    calculator: "PassThroughCalculator"
+    input_stream: "in"
+    output_stream: "out1"
+}
+node {
+    calculator: "PassThroughCalculator"
+    input_stream: "out1"
+    output_stream: "out2"
+}
+node {
+    calculator: "PassThroughCalculator"
+    input_stream: "out2"
+    output_stream: "out3"
+}
+node {
+    calculator: "PassThroughCalculator"
+    input_stream: "out3"
+    output_stream: "out4"
+}
+```
+
+## Subgraph
+
+To modularize a `CalculatorGraphConfig` into sub-modules and assist with re-use
+of perception solutions, a MediaPipe graph can be defined as a `Subgraph`. The
+public interface of a subgraph consists of a set of input and output streams
+similar to a calculator's public interface. The subgraph can then be included in
+a `CalculatorGraphConfig` as if it were a calculator. When a MediaPipe graph is
+loaded from a `CalculatorGraphConfig`, each subgraph node is replaced by the
+corresponding graph of calculators. As a result, the semantics and performance
+of the subgraph are identical to the corresponding graph of calculators.
+
+Below is an example of how to create a subgraph named `TwoPassThroughSubgraph`.
+
+1.  Defining the subgraph.
+
+    ```proto
+    # This subgraph is defined in twopassthrough_subgraph.pbtxt
+    # and is registered as "TwoPassThroughSubgraph"
+
+    type: "TwoPassThroughSubgraph"
+    input_stream: "out1"
+    output_stream: "out3"
+
+    node {
+        calculator: "PassThroughCalculator"
+        input_stream: "out1"
+        output_stream: "out2"
+    }
+    node {
+        calculator: "PassThroughCalculator"
+        input_stream: "out2"
+        output_stream: "out3"
+    }
+    ```
+
+    The public interface to the subgraph consists of:
+
+    *   Graph input streams
+    *   Graph output streams
+    *   Graph input side packets
+    *   Graph output side packets
+
+2.  Register the subgraph using BUILD rule `mediapipe_simple_subgraph`. The
+    parameter `register_as` defines the component name for the new subgraph.
+
+    ```proto
+    # Small section of BUILD file for registering the "TwoPassThroughSubgraph"
+    # subgraph for use by main graph main_pass_throughcals.pbtxt
+
+    mediapipe_simple_subgraph(
+        name = "twopassthrough_subgraph",
+        graph = "twopassthrough_subgraph.pbtxt",
+        register_as = "TwoPassThroughSubgraph",
+        deps = [
+                "//mediapipe/calculators/core:pass_through_calculator",
+                "//mediapipe/framework:calculator_graph",
+        ],
+    )
+    ```
+
+3.  Use the subgraph in the main graph.
+
+    ```proto
+    # This main graph is defined in main_pass_throughcals.pbtxt
+    # using subgraph called "TwoPassThroughSubgraph"
+
+    input_stream: "in"
+    node {
+        calculator: "PassThroughCalculator"
+        input_stream: "in"
+        output_stream: "out1"
+    }
+    node {
+        calculator: "TwoPassThroughSubgraph"
+        input_stream: "out1"
+        output_stream: "out3"
+    }
+    node {
+        calculator: "PassThroughCalculator"
+        input_stream: "out3"
+        output_stream: "out4"
+    }
+    ```
+
+## Cycles
+
+<!-- TODO: add discussion of PreviousLoopbackCalculator -->
+
+By default, MediaPipe requires calculator graphs to be acyclic and treats cycles
+in a graph as errors. If a graph is intended to have cycles, the cycles need to
+be annotated in the graph config. This section describes how to do that.
+
+NOTE: The current approach is experimental and subject to change. We welcome
+your feedback.
+
+Please use the `CalculatorGraphTest.Cycle` unit test in
+`mediapipe/framework/calculator_graph_test.cc` as sample code. Shown
+below is the cyclic graph in the test. The `sum` output of the adder is the sum
+of the integers generated by the integer source calculator.
+
+![a cyclic graph that adds a stream of integers](../images/cyclic_integer_sum_graph.svg "A cyclic graph")
+
+This simple graph illustrates all the issues in supporting cyclic graphs.
+
+### Back Edge Annotation
+
+We require that an edge in each cycle be annotated as a back edge. This allows
+MediaPipe’s topological sort to work, after removing all the back edges.
+
+There are usually multiple ways to select the back edges. Which edges are marked
+as back edges affects which nodes are considered as upstream and which nodes are
+considered as downstream, which in turn affects the priorities MediaPipe assigns
+to the nodes.
+
+For example, the `CalculatorGraphTest.Cycle` test marks the `old_sum` edge as a
+back edge, so the Delay node is considered as a downstream node of the adder
+node and is given a higher priority. Alternatively, we could mark the `sum`
+input to the delay node as the back edge, in which case the delay node would be
+considered as an upstream node of the adder node and is given a lower priority.
+
+### Initial Packet
+
+For the adder calculator to be runnable when the first integer from the integer
+source arrives, we need an initial packet, with value 0 and with the same
+timestamp, on the `old_sum` input stream to the adder. This initial packet
+should be output by the delay calculator in the `Open()` method.
+
+### Delay in a Loop
+
+Each loop should incur a delay to align the previous `sum` output with the next
+integer input. This is also done by the delay node. So the delay node needs to
+know the following about the timestamps of the integer source calculator:
+
+*   The timestamp of the first output.
+
+*   The timestamp delta between successive outputs.
+
+We plan to add an alternative scheduling policy that only cares about packet
+ordering and ignores packet timestamps, which will eliminate this inconvenience.
+
+### Early Termination of a Calculator When One Input Stream is Done
+
+By default, MediaPipe calls the `Close()` method of a non-source calculator when
+all of its input streams are done. In the example graph, we want to stop the
+adder node as soon as the integer source is done. This is accomplished by
+configuring the adder node with an alternative input stream handler,
+`EarlyCloseInputStreamHandler`.
+
+### Relevant Source Code
+
+#### Delay Calculator
+
+Note the code in `Open()` that outputs the initial packet and the code in
+`Process()` that adds a (unit) delay to input packets. As noted above, this
+delay node assumes that its output stream is used alongside an input stream with
+packet timestamps 0, 1, 2, 3, ...
+
+```c++
+class UnitDelayCalculator : public Calculator {
+ public:
+  static ::util::Status FillExpectations(
+      const CalculatorOptions& extendable_options, PacketTypeSet* inputs,
+      PacketTypeSet* outputs, PacketTypeSet* input_side_packets) {
+    inputs->Index(0)->Set<int>("An integer.");
+    outputs->Index(0)->Set<int>("The input delayed by one time unit.");
+    return ::mediapipe::OkStatus();
+  }
+
+  ::util::Status Open() final {
+    Output()->Add(new int(0), Timestamp(0));
+    return ::mediapipe::OkStatus();
+  }
+
+  ::util::Status Process() final {
+    const Packet& packet = Input()->Value();
+    Output()->AddPacket(packet.At(packet.Timestamp().NextAllowedInStream()));
+    return ::mediapipe::OkStatus();
+  }
+};
+```
+
+#### Graph Config
+
+Note the `back_edge` annotation and the alternative `input_stream_handler`.
+
+```proto
+node {
+  calculator: 'GlobalCountSourceCalculator'
+  input_side_packet: 'global_counter'
+  output_stream: 'integers'
+}
+node {
+  calculator: 'IntAdderCalculator'
+  input_stream: 'integers'
+  input_stream: 'old_sum'
+  input_stream_info: {
+    tag_index: ':1'  # 'old_sum'
+    back_edge: true
+  }
+  output_stream: 'sum'
+  input_stream_handler {
+    input_stream_handler: 'EarlyCloseInputStreamHandler'
+  }
+}
+node {
+  calculator: 'UnitDelayCalculator'
+  input_stream: 'sum'
+  output_stream: 'old_sum'
+}
+```
diff --git a/mediapipe/docs/packets.md b/docs/framework_concepts/packets.md
similarity index 81%
rename from mediapipe/docs/packets.md
rename to docs/framework_concepts/packets.md
index 2e52ae956..bb0b61d6a 100644
--- a/mediapipe/docs/packets.md
+++ b/docs/framework_concepts/packets.md
@@ -1,10 +1,21 @@
-### Packets
+---
+layout: default
+title: Packets
+parent: Framework Concepts
+nav_order: 3
+---
 
-- [Creating a packet](#creating-a-packet)
+# Packets
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 Each calculator is a node of of a graph. We describe how to create a new calculator, how to initialize a calculator, how to perform its calculations, input and output streams, timestamps, and options
 
-#### Creating a packet
+## Creating a packet
+
 Packets are generally created with `MediaPipe::Adopt()` (from packet.h).
 
 ```c++
diff --git a/mediapipe/docs/scheduling_sync.md b/docs/framework_concepts/synchronization.md
similarity index 98%
rename from mediapipe/docs/scheduling_sync.md
rename to docs/framework_concepts/synchronization.md
index 7f77a989c..5482aeb76 100644
--- a/mediapipe/docs/scheduling_sync.md
+++ b/docs/framework_concepts/synchronization.md
@@ -1,4 +1,16 @@
-# Framework Architecture
+---
+layout: default
+title: Synchronization
+parent: Framework Concepts
+nav_order: 4
+---
+
+# Synchronization
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 ## Scheduling mechanics
 
diff --git a/mediapipe/docs/android_archive_library.md b/docs/getting_started/android_archive_library.md
similarity index 88%
rename from mediapipe/docs/android_archive_library.md
rename to docs/getting_started/android_archive_library.md
index f0fef4113..0b2c6181b 100644
--- a/mediapipe/docs/android_archive_library.md
+++ b/docs/getting_started/android_archive_library.md
@@ -1,4 +1,16 @@
-## MediaPipe Android Archive Library
+---
+layout: default
+title: MediaPipe Android Archive
+parent: Getting Started
+nav_order: 7
+---
+
+# MediaPipe Android Archive
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 ***Experimental Only***
 
@@ -9,15 +21,15 @@ target to generate a custom AAR file for their own projects. This is necessary
 in order to include specific resources such as MediaPipe calculators needed for
 each project.
 
-### Steps to build a MediaPipe AAR
+## Steps to build a MediaPipe AAR
 
 1.  Create a mediapipe_aar() target.
 
     In the MediaPipe directory, create a new mediapipe_aar() target in a BUILD
     file. You need to figure out what calculators are used in the graph and
     provide the calculator dependencies to the mediapipe_aar(). For example, to
-    build an AAR for [face detection gpu](./face_detection_mobile_gpu.md), you
-    can put the following code into
+    build an AAR for [MediaPipe Face Detection](../solutions/face_detection.md),
+    you can put the following code into
     mediapipe/examples/android/src/java/com/google/mediapipe/apps/aar_example/BUILD.
 
     ```
@@ -54,7 +66,7 @@ each project.
     /absolute/path/to/your/preferred/location
     ```
 
-### Steps to use a MediaPipe AAR in Android Studio with Gradle
+## Steps to use a MediaPipe AAR in Android Studio with Gradle
 
 1.  Start Android Studio and go to your project.
 
@@ -65,7 +77,7 @@ each project.
     /path/to/your/app/libs/
     ```
 
-    ![Screenshot](images/mobile/aar_location.png)
+    ![Screenshot](../images/mobile/aar_location.png)
 
 3.  Make app/src/main/assets and copy assets (graph, model, and etc) into
     app/src/main/assets.
@@ -85,7 +97,7 @@ each project.
     cp mediapipe/models/face_detection_front_labelmap.txt /path/to/your/app/src/main/assets/
     ```
 
-    ![Screenshot](images/mobile/assets_location.png)
+    ![Screenshot](../images/mobile/assets_location.png)
 
 4.  Make app/src/main/jniLibs and copy OpenCV JNI libraries into
     app/src/main/jniLibs.
@@ -100,7 +112,7 @@ each project.
     cp -R ~/Downloads/OpenCV-android-sdk/sdk/native/libs/arm* /path/to/your/app/src/main/jniLibs/
     ```
 
-    ![Screenshot](images/mobile/android_studio_opencv_location.png)
+    ![Screenshot](../images/mobile/android_studio_opencv_location.png)
 
 5.  Modify app/build.gradle to add MediaPipe dependencies and MediaPipe AAR.
 
@@ -127,6 +139,8 @@ each project.
     ```
 
 6.  Follow our Android app examples to use MediaPipe in Android Studio for your
-    use case. If you are looking for an example, a face detection
-    example can be found
-    [here](https://github.com/jiuqiant/mediapipe_face_detection_aar_example) and a multi-hand tracking example can be found [here](https://github.com/jiuqiant/mediapipe_multi_hands_tracking_aar_example).
+    use case. If you are looking for an example, a face detection example can be
+    found
+    [here](https://github.com/jiuqiant/mediapipe_face_detection_aar_example) and
+    a multi-hand tracking example can be found
+    [here](https://github.com/jiuqiant/mediapipe_multi_hands_tracking_aar_example).
diff --git a/mediapipe/docs/building_examples.md b/docs/getting_started/building_examples.md
similarity index 85%
rename from mediapipe/docs/building_examples.md
rename to docs/getting_started/building_examples.md
index 73c139fea..c69355456 100644
--- a/mediapipe/docs/building_examples.md
+++ b/docs/getting_started/building_examples.md
@@ -1,8 +1,16 @@
-# Building MediaPipe Examples
+---
+layout: default
+title: Building MediaPipe Examples
+parent: Getting Started
+nav_order: 2
+---
 
-*   [Android](#android)
-*   [iOS](#ios)
-*   [Desktop](#desktop)
+# Building MediaPipe Examples
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 ## Android
 
@@ -29,8 +37,9 @@ export ANDROID_NDK_HOME=<path to the Android NDK>
 
 In order to use MediaPipe on earlier Android versions, MediaPipe needs to switch
 to a lower Android API level. You can achieve this by specifying `api_level =
-<api level integer>` in android_ndk_repository() and/or android_sdk_repository()
-in the [`WORKSPACE`](https://github.com/google/mediapipe/tree/master/WORKSPACE) file.
+$YOUR_INTENDED_API_LEVEL` in android_ndk_repository() and/or
+android_sdk_repository() in the
+[`WORKSPACE`](https://github.com/google/mediapipe/tree/master/WORKSPACE) file.
 
 Please verify all the necessary packages are installed.
 
@@ -42,16 +51,19 @@ Please verify all the necessary packages are installed.
 
 ### Option 1: Build with Bazel in Command Line
 
-1.  To build an Android example app, for instance, for MediaPipe Hand, run:
+1.  To build an Android example app, build against the corresponding
+    `android_binary` build target. For instance, for
+    [MediaPipe Hand](../solutions/hand.md) the target is `handtrackinggpu` in
+    the
+    [BUILD](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handtrackinggpu/BUILD)
+    file:
 
     Note: To reduce the binary size, consider appending `--linkopt="-s"` to the
     command below to strip symbols.
 
-    ~~~
-      ```bash
-    bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/handtrackinggpu
+    ```bash
+    bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/handtrackinggpu:handtrackinggpu
     ```
-    ~~~
 
 1.  Install it on a device with:
 
@@ -74,13 +86,13 @@ app:
 
 1.  Install and launch Android Studio 3.5.
 
-2.  Select `Configure` | `SDK Manager` | `SDK Platforms`.
+2.  Select `Configure` -> `SDK Manager` -> `SDK Platforms`.
 
     *   Verify that Android SDK Platform API Level 28 or 29 is installed.
     *   Take note of the Android SDK Location, e.g.,
         `/usr/local/home/Android/Sdk`.
 
-3.  Select `Configure` | `SDK Manager` | `SDK Tools`.
+3.  Select `Configure` -> `SDK Manager` -> `SDK Tools`.
 
     *   Verify that Android SDK Build-Tools 28 or 29 is installed.
     *   Verify that Android SDK Platform-Tools 28 or 29 is installed.
@@ -102,10 +114,10 @@ app:
     export ANDROID_NDK_HOME=/usr/local/home/Android/Sdk/ndk/<version number>
     ```
 
-5.  Select `Configure` | `Plugins` install `Bazel`.
+5.  Select `Configure` -> `Plugins` to install `Bazel`.
 
-6.  On Linux, select `File` | `Settings`| `Bazel settings`. On macos, select
-    `Android Studio` | `Preferences` | `Bazel settings`. Then, modify `Bazel
+6.  On Linux, select `File` -> `Settings` -> `Bazel settings`. On macOS, select
+    `Android Studio` -> `Preferences` -> `Bazel settings`. Then, modify `Bazel
     binary location` to be the same as the output of `$ which bazel`.
 
 7.  Select `Import Bazel Project`.
@@ -132,7 +144,7 @@ app:
       --host_crosstool_top=@bazel_tools//tools/cpp:toolchain
     ```
 
-8.  Select `Bazel` | `Sync` | `Sync project with Build files`.
+8.  Select `Bazel` -> `Sync` -> `Sync project with Build files`.
 
     Note: Even after doing step 4, if you still see the error: `"no such package
     '@androidsdk//': Either the path attribute of android_sdk_repository or the
@@ -154,11 +166,11 @@ app:
 
 9.  Connect an Android device to the workstation.
 
-10. Select `Run...` | `Edit Configurations...`.
+10. Select `Run...` -> `Edit Configurations...`.
 
-    *   Select `Templates` | `Bazel Command`.
+    *   Select `Templates` -> `Bazel Command`.
     *   Enter Target Expression:
-        `//mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectioncpu`
+        `//mediapipe/examples/android/src/java/com/google/mediapipe/apps/handtrackinggpu:handtrackinggpu`
     *   Enter Bazel command: `mobile-install`.
     *   Enter Bazel flags: `-c opt --config=android_arm64`.
     *   Press the `[+]` button to add the new configuration.
@@ -215,15 +227,14 @@ app:
 
 ### Option 1: Build with Bazel in Command Line
 
-1.  Modify the `bundle_id` field of the app's `ios_application` target to use
-    your own identifier. For instance, for
-    [MediaPipe Hand](./hand_tracking_mobile_gpu.md), the `bundle_id` is in the
+1.  Modify the `bundle_id` field of the app's `ios_application` build target to
+    use your own identifier. For instance, for
+    [MediaPipe Hand](../solutions/hand.md), the `bundle_id` is in the
     `HandTrackingGpuApp` target in the
     [BUILD](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/handtrackinggpu/BUILD)
     file.
 
-2.  Again using [MediaPipe Hand](./hand_tracking_mobile_gpu.md) for example,
-    run:
+2.  Again using [MediaPipe Hand](../solutions/hand.md) for example, run:
 
     ```bash
     bazel build -c opt --config=ios_arm64 mediapipe/examples/ios/handtrackinggpu:HandTrackingGpuApp
@@ -287,7 +298,7 @@ the previous section.
 
 ### Option 1: Running on CPU
 
-1.  To build, for example, [MediaPipe Hand](./hand_tracking_mobile_gpu.md), run:
+1.  To build, for example, [MediaPipe Hand](../solutions/hand.md), run:
 
     ```bash
     bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 mediapipe/examples/desktop/hand_tracking:hand_tracking_cpu
@@ -306,9 +317,9 @@ the previous section.
 ### Option 2: Running on GPU
 
 Note: This currently works only on Linux, and please first follow
-[OpenGL ES Setup on Linux Desktop](./gpu.md#opengl-es-setup-on-linux-desktop).
+[OpenGL ES Setup on Linux Desktop](./gpu_support.md#opengl-es-setup-on-linux-desktop).
 
-1.  To build, for example, [MediaPipe Hand](./hand_tracking_mobile_gpu.md), run:
+1.  To build, for example, [MediaPipe Hand](../solutions/hand.md), run:
 
     ```bash
     bazel build -c opt --copt -DMESA_EGL_NO_X11_HEADERS --copt -DEGL_NO_X11 \
diff --git a/mediapipe/docs/how_to_questions.md b/docs/getting_started/faq.md
similarity index 92%
rename from mediapipe/docs/how_to_questions.md
rename to docs/getting_started/faq.md
index 321a21b6f..75bf8ad97 100644
--- a/mediapipe/docs/how_to_questions.md
+++ b/docs/getting_started/faq.md
@@ -1,12 +1,16 @@
-## Questions and Answers
+---
+layout: default
+title: FAQ
+parent: Getting Started
+nav_order: 9
+---
 
--   [How to convert ImageFrames and GpuBuffers](#how-to-convert-imageframes-and-gpubuffers)
--   [How to visualize perceived results](#how-to-visualize-perception-results)
--   [How to run calculators in parallel](#how-to-run-calculators-in-parallel)
--   [Output timestamps when using ImmediateInputStreamHandler](#output-timestamps-when-using-immediateinputstreamhandler)
--   [How to change settings at runtime](#how-to-change-settings-at-runtime)
--   [How to process real-time input streams](#how-to-process-real-time-input-streams)
--   [Can I run MediaPipe on MS Windows?](#can-i-run-mediapipe-on-ms-windows)
+# FAQ
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 ### How to convert ImageFrames and GpuBuffers
 
diff --git a/docs/getting_started/getting_started.md b/docs/getting_started/getting_started.md
new file mode 100644
index 000000000..be7150543
--- /dev/null
+++ b/docs/getting_started/getting_started.md
@@ -0,0 +1,13 @@
+---
+layout: default
+title: Getting Started
+nav_order: 2
+has_children: true
+---
+
+# Getting Started
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
diff --git a/docs/getting_started/gpu_support.md b/docs/getting_started/gpu_support.md
new file mode 100644
index 000000000..2aae63a2e
--- /dev/null
+++ b/docs/getting_started/gpu_support.md
@@ -0,0 +1,186 @@
+---
+layout: default
+title: GPU Support
+parent: Getting Started
+nav_order: 6
+---
+
+# GPU Support
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+## OpenGL ES Support
+
+MediaPipe supports OpenGL ES up to version 3.2 on Android/Linux and up to ES 3.0
+on iOS. In addition, MediaPipe also supports Metal on iOS.
+
+OpenGL ES 3.1 or greater is required (on Android/Linux systems) for running
+machine learning inference calculators and graphs.
+
+## Disable OpenGL ES Support
+
+By default, building MediaPipe (with no special bazel flags) attempts to compile
+and link against OpenGL ES (and for iOS also Metal) libraries.
+
+On platforms where OpenGL ES is not available (see also
+[OpenGL ES Setup on Linux Desktop](#opengl-es-setup-on-linux-desktop)), you
+should disable OpenGL ES support with:
+
+```
+$ bazel build --define MEDIAPIPE_DISABLE_GPU=1 <my-target>
+```
+
+Note: On Android and iOS, OpenGL ES is required by MediaPipe framework and the
+support should never be disabled.
+
+## OpenGL ES Setup on Linux Desktop
+
+On Linux desktop with video cards that support OpenGL ES 3.1+, MediaPipe can run
+GPU compute and rendering and perform TFLite inference on GPU.
+
+To check if your Linux desktop GPU can run MediaPipe with OpenGL ES:
+
+```bash
+$ sudo apt-get install mesa-common-dev libegl1-mesa-dev libgles2-mesa-dev
+$ sudo apt-get install mesa-utils
+$ glxinfo | grep -i opengl
+```
+
+For example, it may print:
+
+```bash
+$ glxinfo | grep -i opengl
+...
+OpenGL ES profile version string: OpenGL ES 3.2 NVIDIA 430.50
+OpenGL ES profile shading language version string: OpenGL ES GLSL ES 3.20
+OpenGL ES profile extensions:
+```
+
+*Notice the ES 3.20 text above.*
+
+You need to see ES 3.1 or greater printed in order to perform TFLite inference
+on GPU in MediaPipe. With this setup, build with:
+
+```
+$ bazel build --copt -DMESA_EGL_NO_X11_HEADERS --copt -DEGL_NO_X11 <my-target>
+```
+
+If only ES 3.0 or below is supported, you can still build MediaPipe targets that
+don't require TFLite inference on GPU with:
+
+```
+$ bazel build --copt -DMESA_EGL_NO_X11_HEADERS --copt -DEGL_NO_X11 --copt -DMEDIAPIPE_DISABLE_GL_COMPUTE <my-target>
+```
+
+Note: MEDIAPIPE_DISABLE_GL_COMPUTE is already defined automatically on all Apple
+systems (Apple doesn't support OpenGL ES 3.1+).
+
+## TensorFlow CUDA Support and Setup on Linux Desktop
+
+MediaPipe framework doesn't require CUDA for GPU compute and rendering. However,
+MediaPipe can work with TensorFlow to perform GPU inference on video cards that
+support CUDA.
+
+To enable TensorFlow GPU inference with MediaPipe, the first step is to follow
+the
+[TensorFlow GPU documentation](https://www.tensorflow.org/install/gpu#software_requirements)
+to install the required NVIDIA software on your Linux desktop.
+
+After installation, update `$PATH` and `$LD_LIBRARY_PATH` and run `ldconfig`
+with:
+
+```
+$ export PATH=/usr/local/cuda-10.1/bin${PATH:+:${PATH}}
+$ export LD_LIBRARY_PATH=/usr/local/cuda/extras/CUPTI/lib64:/usr/local/cuda-10.1/lib64${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}
+$ sudo ldconfig
+```
+
+It's recommended to verify the installation of CUPTI, CUDA, CuDNN, and NVCC:
+
+```
+$ ls /usr/local/cuda/extras/CUPTI
+/lib64
+libcupti.so       libcupti.so.10.1.208  libnvperf_host.so        libnvperf_target.so
+libcupti.so.10.1  libcupti_static.a     libnvperf_host_static.a
+
+$ ls /usr/local/cuda-10.1
+LICENSE  bin  extras   lib64      libnvvp           nvml  samples  src      tools
+README   doc  include  libnsight  nsightee_plugins  nvvm  share    targets  version.txt
+
+$ nvcc -V
+nvcc: NVIDIA (R) Cuda compiler driver
+Copyright (c) 2005-2019 NVIDIA Corporation
+Built on Sun_Jul_28_19:07:16_PDT_2019
+Cuda compilation tools, release 10.1, V10.1.243
+
+$ ls /usr/lib/x86_64-linux-gnu/ | grep libcudnn.so
+libcudnn.so
+libcudnn.so.7
+libcudnn.so.7.6.4
+```
+
+Setting `$TF_CUDA_PATHS` is the way to declare where the CUDA library is. Note
+that the following code snippet also adds `/usr/lib/x86_64-linux-gnu` and
+`/usr/include` into `$TF_CUDA_PATHS` for cuBLAS and libcudnn.
+
+```
+$ export TF_CUDA_PATHS=/usr/local/cuda-10.1,/usr/lib/x86_64-linux-gnu,/usr/include
+```
+
+To make MediaPipe get TensorFlow's CUDA settings, find TensorFlow's
+[.bazelrc](https://github.com/tensorflow/tensorflow/blob/master/.bazelrc) and
+copy the `build:using_cuda` and `build:cuda` sections into MediaPipe's .bazelrc
+file. For example, as of April 23, 2020, TensorFlow's CUDA setting is the
+following:
+
+```
+# This config refers to building with CUDA available. It does not necessarily
+# mean that we build CUDA op kernels.
+build:using_cuda --define=using_cuda=true
+build:using_cuda --action_env TF_NEED_CUDA=1
+build:using_cuda --crosstool_top=@local_config_cuda//crosstool:toolchain
+
+# This config refers to building CUDA op kernels with nvcc.
+build:cuda --config=using_cuda
+build:cuda --define=using_cuda_nvcc=true
+```
+
+Finally, build MediaPipe with TensorFlow GPU with two more flags `--config=cuda`
+and `--spawn_strategy=local`. For example:
+
+```
+$ bazel build -c opt --config=cuda --spawn_strategy=local \
+    --define no_aws_support=true --copt -DMESA_EGL_NO_X11_HEADERS \
+    mediapipe/examples/desktop/object_detection:object_detection_tensorflow
+```
+
+While the binary is running, it prints out the GPU device info:
+
+```
+I external/org_tensorflow/tensorflow/stream_executor/platform/default/dso_loader.cc:44] Successfully opened dynamic library libcuda.so.1
+I external/org_tensorflow/tensorflow/core/common_runtime/gpu/gpu_device.cc:1544] Found device 0 with properties: pciBusID: 0000:00:04.0 name: Tesla T4 computeCapability: 7.5 coreClock: 1.59GHz coreCount: 40 deviceMemorySize: 14.75GiB deviceMemoryBandwidth: 298.08GiB/s
+I external/org_tensorflow/tensorflow/core/common_runtime/gpu/gpu_device.cc:1686] Adding visible gpu devices: 0
+```
+
+You can monitor the GPU usage to verify whether the GPU is used for model
+inference.
+
+```
+$ nvidia-smi --query-gpu=utilization.gpu --format=csv --loop=1
+
+0 %
+0 %
+4 %
+5 %
+83 %
+21 %
+22 %
+27 %
+29 %
+100 %
+0 %
+0 %
+```
diff --git a/mediapipe/docs/hello_world_android.md b/docs/getting_started/hello_world_android.md
similarity index 97%
rename from mediapipe/docs/hello_world_android.md
rename to docs/getting_started/hello_world_android.md
index a83b39a47..2794ea4f8 100644
--- a/mediapipe/docs/hello_world_android.md
+++ b/docs/getting_started/hello_world_android.md
@@ -1,4 +1,16 @@
-# Hello World! in MediaPipe on Android
+---
+layout: default
+title: Hello World! on Android
+parent: Getting Started
+nav_order: 3
+---
+
+# Hello World! on Android
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 ## Introduction
 
@@ -14,7 +26,7 @@ graph on Android.
 A simple camera app for real-time Sobel edge detection applied to a live video
 stream on an Android device.
 
-![edge_detection_android_gpu_gif](images/mobile/edge_detection_android_gpu.gif)
+![edge_detection_android_gpu_gif](../images/mobile/edge_detection_android_gpu.gif)
 
 ## Setup
 
@@ -56,7 +68,7 @@ node: {
 
 A visualization of the graph is shown below:
 
-![edge_detection_mobile_gpu](images/mobile/edge_detection_mobile_gpu.png)
+![edge_detection_mobile_gpu](../images/mobile/edge_detection_mobile_gpu.png)
 
 This graph has a single input stream named `input_video` for all incoming frames
 that will be provided by your device's camera.
@@ -247,7 +259,7 @@ adb install bazel-bin/$APPLICATION_PATH/helloworld.apk
 Open the application on your device. It should display a screen with the text
 `Hello World!`.
 
-![bazel_hello_world_android](images/mobile/bazel_hello_world_android.png)
+![bazel_hello_world_android](../images/mobile/bazel_hello_world_android.png)
 
 ## Using the camera via `CameraX`
 
@@ -364,7 +376,7 @@ Add the following line in the `$APPLICATION_PATH/res/values/strings.xml` file:
 When the user doesn't grant camera permission, the screen will now look like
 this:
 
-![missing_camera_permission_android](images/mobile/missing_camera_permission_android.png)
+![missing_camera_permission_android](../images/mobile/missing_camera_permission_android.png)
 
 Now, we will add the [`SurfaceTexture`] and [`SurfaceView`] objects to
 `MainActivity`:
@@ -740,7 +752,7 @@ And that's it! You should now be able to successfully build and run the
 application on the device and see Sobel edge detection running on a live camera
 feed! Congrats!
 
-![edge_detection_android_gpu_gif](images/mobile/edge_detection_android_gpu.gif)
+![edge_detection_android_gpu_gif](../images/mobile/edge_detection_android_gpu.gif)
 
 If you ran into any issues, please see the full code of the tutorial
 [here](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic).
diff --git a/mediapipe/docs/hello_world_desktop.md b/docs/getting_started/hello_world_desktop.md
similarity index 93%
rename from mediapipe/docs/hello_world_desktop.md
rename to docs/getting_started/hello_world_desktop.md
index 236b8675e..28a9aea8f 100644
--- a/mediapipe/docs/hello_world_desktop.md
+++ b/docs/getting_started/hello_world_desktop.md
@@ -1,4 +1,16 @@
-## Hello World for C++
+---
+layout: default
+title: Hello World! on Desktop (C++)
+parent: Getting Started
+nav_order: 5
+---
+
+# Hello World! on Desktop (C++)
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 1.  Ensure you have a working version of MediaPipe. See
     [installation instructions](./install.md).
@@ -52,7 +64,7 @@
     You can visualize this graph using
     [MediaPipe Visualizer](https://viz.mediapipe.dev) by pasting the
     CalculatorGraphConfig content below into the visualizer. See
-    [here](./visualizer.md) for help on the visualizer.
+    [here](../tools/visualizer.md) for help on the visualizer.
 
     ```bash
         input_stream: "in"
@@ -72,7 +84,7 @@
     This graph consists of 1 graph input stream (`in`) and 1 graph output stream
     (`out`), and 2 [`PassThroughCalculator`]s connected serially.
 
-    ![hello_world graph](./images/hello_world.png)
+    ![hello_world graph](../images/hello_world.png)
 
 4.  Before running the graph, an `OutputStreamPoller` object is connected to the
     output stream in order to later retrieve the graph output, and a graph run
diff --git a/mediapipe/docs/hello_world_ios.md b/docs/getting_started/hello_world_ios.md
similarity index 97%
rename from mediapipe/docs/hello_world_ios.md
rename to docs/getting_started/hello_world_ios.md
index ac9f76885..1c6c44961 100644
--- a/mediapipe/docs/hello_world_ios.md
+++ b/docs/getting_started/hello_world_ios.md
@@ -1,4 +1,16 @@
-# Hello World! in MediaPipe on iOS
+---
+layout: default
+title: Hello World! on iOS
+parent: Getting Started
+nav_order: 4
+---
+
+# Hello World! on iOS
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 ## Introduction
 
@@ -14,7 +26,7 @@ graph on iOS.
 A simple camera app for real-time Sobel edge detection applied to a live video
 stream on an iOS device.
 
-![edge_detection_ios_gpu_gif](images/mobile/edge_detection_ios_gpu.gif)
+![edge_detection_ios_gpu_gif](../images/mobile/edge_detection_ios_gpu.gif)
 
 ## Setup
 
@@ -54,7 +66,7 @@ node: {
 
 A visualization of the graph is shown below:
 
-![edge_detection_mobile_gpu](images/mobile/edge_detection_mobile_gpu.png)
+![edge_detection_mobile_gpu](../images/mobile/edge_detection_mobile_gpu.png)
 
 This graph has a single input stream named `input_video` for all incoming frames
 that will be provided by your device's camera.
@@ -538,7 +550,7 @@ method to receive packets on this output stream and display them on the screen:
 And that is all! Build and run the app on your iOS device. You should see the
 results of running the edge detection graph on a live video feed. Congrats!
 
-![edge_detection_ios_gpu_gif](images/mobile/edge_detection_ios_gpu.gif)
+![edge_detection_ios_gpu_gif](../images/mobile/edge_detection_ios_gpu.gif)
 
 If you ran into any issues, please see the full code of the tutorial
 [here](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/edgedetectiongpu).
diff --git a/mediapipe/docs/help.md b/docs/getting_started/help.md
similarity index 89%
rename from mediapipe/docs/help.md
rename to docs/getting_started/help.md
index 6667afb78..a9d2ba7b9 100644
--- a/mediapipe/docs/help.md
+++ b/docs/getting_started/help.md
@@ -1,17 +1,24 @@
-## Getting Help
+---
+layout: default
+title: Getting Help
+parent: Getting Started
+nav_order: 8
+---
 
--   [Technical questions](#technical-questions)
--   [Bugs and feature requests](#bugs-and-feature-requests)
+# Getting Help
+{: .no_toc }
 
-Below are the various ways to get help:
+1. TOC
+{:toc}
+---
 
-### Technical questions
+## Technical questions
 
 For help with technical or algorithmic questions, visit
 [Stack Overflow](https://stackoverflow.com/questions/tagged/mediapipe) to find
 answers and support from the MediaPipe community.
 
-### Bugs and feature requests
+## Bugs and feature requests
 
 To report bugs or make feature requests,
 [file an issue on GitHub](https://github.com/google/mediapipe/issues).
diff --git a/mediapipe/docs/install.md b/docs/getting_started/install.md
similarity index 96%
rename from mediapipe/docs/install.md
rename to docs/getting_started/install.md
index f842b60a6..3fa83e95e 100644
--- a/mediapipe/docs/install.md
+++ b/docs/getting_started/install.md
@@ -1,4 +1,16 @@
-## Installing MediaPipe
+---
+layout: default
+title: Installation
+parent: Getting Started
+nav_order: 1
+---
+
+# Installation
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 Note: To interoperate with OpenCV, OpenCV 3.x and above are preferred. OpenCV
 2.x currently works but interoperability support may be deprecated in the
@@ -11,22 +23,11 @@ Note: To make Mediapipe work with TensorFlow, please set Python 3.7 as the
 default Python version and install the Python "six" library by running `pip3
 install --user six`.
 
-Choose your operating system:
+Note: To build and run Android example apps, see these
+[instructions](./building_examples.md#android). To build and run iOS example
+apps, see these [instructions](./building_examples.md#ios).
 
--   [Installing on Debian and Ubuntu](#installing-on-debian-and-ubuntu)
--   [Installing on CentOS](#installing-on-centos)
--   [Installing on macOS](#installing-on-macos)
--   [Installing on Windows](#installing-on-windows)
--   [Installing on Windows Subsystem for Linux (WSL)](#installing-on-windows-subsystem-for-linux-wsl)
--   [Installing using Docker](#installing-using-docker)
-
-To build and run Android example apps, see these
-[instuctions](./building_examples.md#android).
-
-To build and run iOS example apps, see these
-[instuctions](./building_examples.md#ios).
-
-### Installing on Debian and Ubuntu
+## Installing on Debian and Ubuntu
 
 1.  Checkout MediaPipe repository.
 
@@ -137,7 +138,7 @@ To build and run iOS example apps, see these
     # Hello World!
     ```
 
-### Installing on CentOS
+## Installing on CentOS
 
 1.  Checkout MediaPipe repository.
 
@@ -220,7 +221,7 @@ To build and run iOS example apps, see these
     # Hello World!
     ```
 
-### Installing on macOS
+## Installing on macOS
 
 1.  Prework:
 
@@ -352,7 +353,7 @@ To build and run iOS example apps, see these
     # Hello World!
     ```
 
-### Installing on Windows
+## Installing on Windows
 
 **Disclaimer**: Running MediaPipe on Windows is experimental.
 
@@ -457,7 +458,7 @@ next section.
 
     ```
 
-### Installing on Windows Subsystem for Linux (WSL)
+## Installing on Windows Subsystem for Linux (WSL)
 
 Note: The pre-built OpenCV packages don't support cameras in WSL. Unless you
 [compile](https://funvision.blogspot.com/2019/12/opencv-web-camera-and-video-streams-in.html)
@@ -580,7 +581,7 @@ cameras. Alternatively, you use a video file as input.
     # Hello World!
     ```
 
-### Installing using Docker
+## Installing using Docker
 
 This will use a Docker image that will isolate mediapipe's installation from the rest of the system.
 
@@ -630,7 +631,7 @@ This will use a Docker image that will isolate mediapipe's installation from the
     # Hello World!
     ```
 
-4.  Build Mediapipe [Android demos](./examples.md).
+4.  Build a MediaPipe Android example.
 
     ```bash
     $ docker run -it --name mediapipe mediapipe:latest
diff --git a/mediapipe/docs/troubleshooting.md b/docs/getting_started/troubleshooting.md
similarity index 91%
rename from mediapipe/docs/troubleshooting.md
rename to docs/getting_started/troubleshooting.md
index e407f6198..9d1bedac4 100644
--- a/mediapipe/docs/troubleshooting.md
+++ b/docs/getting_started/troubleshooting.md
@@ -1,12 +1,16 @@
-# Troubleshooting
+---
+layout: default
+title: Troubleshooting
+parent: Getting Started
+nav_order: 10
+---
 
--   [Native method not found](#native-method-not-found)
--   [No registered calculator found](#no-registered-calculator-found)
--   [Out Of Memory error](#out-of-memory-error)
--   [Graph hangs](#graph-hangs)
--   [Calculator is scheduled infrequently](#calculator-is-scheduled-infrequently)
--   [Output timing is uneven](#output-timing-is-uneven)
--   [CalculatorGraph lags behind inputs](#calculatorgraph-lags-behind-inputs)
+# Troubleshooting
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 ## Native method not found
 
@@ -55,7 +59,7 @@ running MediaPipe graph. This can occur for a number of reasons, such as:
 
 For problem (1), it may be necessary to drop some old packets in older to
 process the more recent packets. For some hints, see:
-[How to process realtime input streams](how_to_questions.md).
+[`How to process realtime input streams`].
 
 For problem (2), it could be that one input stream is lacking packets for some
 reason. A device or a calculator may be misconfigured or may produce packets
@@ -63,7 +67,7 @@ only sporadically. This can cause downstream calculators to wait for many
 packets that will never arrive, which in turn causes packets to accumulate on
 some of their input streams. MediaPipe addresses this sort of problem using
 "timestamp bounds". For some hints see:
-[How to process realtime input streams](how_to_questions.md).
+[`How to process realtime input streams`].
 
 The MediaPipe setting [`CalculatorGraphConfig::max_queue_size`] limits the
 number of packets enqueued on any input stream by throttling inputs to the
@@ -122,14 +126,14 @@ each packet as early as possible. Normally the lowest possible latency is the
 total time required by each calculator along a "critical path" of successive
 calculators. The latency of the a MediaPipe graph could be worse than the ideal
 due to delays introduced to display frames a even intervals as described in
-[Output timing is uneven](troubleshooting.md?cl=252235797#output-timing-is-uneven).
+[Output timing is uneven](#output-timing-is-uneven).
 
 If some of the calculators in the graph cannot keep pace with the realtime input
 streams, then latency will continue to increase, and it becomes necessary to
 drop some input packets. The recommended technique is to use the MediaPipe
 calculators designed specifically for this purpose such as
 [`FlowLimiterCalculator`] as described in
-[How to process realtime input streams](how_to_questions.md).
+[`How to process realtime input streams`].
 
 [`CalculatorGraphConfig`]: https://github.com/google/mediapipe/tree/master/mediapipe/framework/calculator.proto
 [`CalculatorGraphConfig::max_queue_size`]: https://github.com/google/mediapipe/tree/master/mediapipe/framework/calculator.proto
@@ -142,3 +146,4 @@ calculators designed specifically for this purpose such as
 [`Timestamp::Done`]: https://github.com/google/mediapipe/tree/master/mediapipe/framework/timestamp.h
 [`CalculatorBase::Close`]: https://github.com/google/mediapipe/tree/master/mediapipe/framework/calculator_base.h
 [`FlowLimiterCalculator`]: https://github.com/google/mediapipe/tree/master/mediapipe/calculators/core/flow_limiter_calculator.cc
+[`How to process realtime input streams`]: faq.md#how-to-process-realtime-input-streams
diff --git a/docs/images/accelerated.png b/docs/images/accelerated.png
new file mode 100644
index 000000000..8c9d241ca
Binary files /dev/null and b/docs/images/accelerated.png differ
diff --git a/docs/images/accelerated_small.png b/docs/images/accelerated_small.png
new file mode 100644
index 000000000..759542dc4
Binary files /dev/null and b/docs/images/accelerated_small.png differ
diff --git a/mediapipe/docs/images/add_ipa.png b/docs/images/add_ipa.png
similarity index 100%
rename from mediapipe/docs/images/add_ipa.png
rename to docs/images/add_ipa.png
diff --git a/mediapipe/docs/images/app_ipa.png b/docs/images/app_ipa.png
similarity index 100%
rename from mediapipe/docs/images/app_ipa.png
rename to docs/images/app_ipa.png
diff --git a/mediapipe/docs/images/app_ipa_added.png b/docs/images/app_ipa_added.png
similarity index 100%
rename from mediapipe/docs/images/app_ipa_added.png
rename to docs/images/app_ipa_added.png
diff --git a/mediapipe/docs/images/autoflip_edited_example.gif b/docs/images/autoflip_edited_example.gif
similarity index 100%
rename from mediapipe/docs/images/autoflip_edited_example.gif
rename to docs/images/autoflip_edited_example.gif
diff --git a/mediapipe/docs/images/autoflip_graph.png b/docs/images/autoflip_graph.png
similarity index 100%
rename from mediapipe/docs/images/autoflip_graph.png
rename to docs/images/autoflip_graph.png
diff --git a/mediapipe/docs/images/autoflip_is_required.gif b/docs/images/autoflip_is_required.gif
similarity index 100%
rename from mediapipe/docs/images/autoflip_is_required.gif
rename to docs/images/autoflip_is_required.gif
diff --git a/mediapipe/docs/images/bazel_permission.png b/docs/images/bazel_permission.png
similarity index 100%
rename from mediapipe/docs/images/bazel_permission.png
rename to docs/images/bazel_permission.png
diff --git a/mediapipe/docs/images/click_subgraph_handdetection.png b/docs/images/click_subgraph_handdetection.png
similarity index 100%
rename from mediapipe/docs/images/click_subgraph_handdetection.png
rename to docs/images/click_subgraph_handdetection.png
diff --git a/mediapipe/docs/images/console_error.png b/docs/images/console_error.png
similarity index 100%
rename from mediapipe/docs/images/console_error.png
rename to docs/images/console_error.png
diff --git a/docs/images/cross_platform.png b/docs/images/cross_platform.png
new file mode 100644
index 000000000..09dedc96a
Binary files /dev/null and b/docs/images/cross_platform.png differ
diff --git a/docs/images/cross_platform_small.png b/docs/images/cross_platform_small.png
new file mode 100644
index 000000000..7476327b2
Binary files /dev/null and b/docs/images/cross_platform_small.png differ
diff --git a/mediapipe/docs/images/cyclic_integer_sum_graph.svg b/docs/images/cyclic_integer_sum_graph.svg
similarity index 100%
rename from mediapipe/docs/images/cyclic_integer_sum_graph.svg
rename to docs/images/cyclic_integer_sum_graph.svg
diff --git a/mediapipe/docs/images/device.png b/docs/images/device.png
similarity index 100%
rename from mediapipe/docs/images/device.png
rename to docs/images/device.png
diff --git a/mediapipe/docs/images/editor_view.png b/docs/images/editor_view.png
similarity index 100%
rename from mediapipe/docs/images/editor_view.png
rename to docs/images/editor_view.png
diff --git a/mediapipe/docs/images/face_detection_desktop.png b/docs/images/face_detection_desktop.png
similarity index 100%
rename from mediapipe/docs/images/face_detection_desktop.png
rename to docs/images/face_detection_desktop.png
diff --git a/docs/images/face_mesh_ar_effects.gif b/docs/images/face_mesh_ar_effects.gif
new file mode 100644
index 000000000..868a40c4d
Binary files /dev/null and b/docs/images/face_mesh_ar_effects.gif differ
diff --git a/mediapipe/docs/images/favicon.ico b/docs/images/favicon.ico
similarity index 100%
rename from mediapipe/docs/images/favicon.ico
rename to docs/images/favicon.ico
diff --git a/mediapipe/docs/images/faviconv2.ico b/docs/images/faviconv2.ico
similarity index 100%
rename from mediapipe/docs/images/faviconv2.ico
rename to docs/images/faviconv2.ico
diff --git a/mediapipe/docs/images/gpu_example_graph.png b/docs/images/gpu_example_graph.png
similarity index 100%
rename from mediapipe/docs/images/gpu_example_graph.png
rename to docs/images/gpu_example_graph.png
diff --git a/mediapipe/docs/images/graph_visual.png b/docs/images/graph_visual.png
similarity index 100%
rename from mediapipe/docs/images/graph_visual.png
rename to docs/images/graph_visual.png
diff --git a/mediapipe/docs/images/hand_tracking_desktop.png b/docs/images/hand_tracking_desktop.png
similarity index 100%
rename from mediapipe/docs/images/hand_tracking_desktop.png
rename to docs/images/hand_tracking_desktop.png
diff --git a/mediapipe/docs/images/hello_world.png b/docs/images/hello_world.png
similarity index 100%
rename from mediapipe/docs/images/hello_world.png
rename to docs/images/hello_world.png
diff --git a/mediapipe/docs/images/iconv2.png b/docs/images/iconv2.png
similarity index 100%
rename from mediapipe/docs/images/iconv2.png
rename to docs/images/iconv2.png
diff --git a/docs/images/knift_stop_sign.gif b/docs/images/knift_stop_sign.gif
new file mode 100644
index 000000000..a84b4aa19
Binary files /dev/null and b/docs/images/knift_stop_sign.gif differ
diff --git a/mediapipe/docs/images/logo.png b/docs/images/logo.png
similarity index 100%
rename from mediapipe/docs/images/logo.png
rename to docs/images/logo.png
diff --git a/mediapipe/docs/images/logo_horizontal_black.png b/docs/images/logo_horizontal_black.png
similarity index 100%
rename from mediapipe/docs/images/logo_horizontal_black.png
rename to docs/images/logo_horizontal_black.png
diff --git a/docs/images/logo_horizontal_color.png b/docs/images/logo_horizontal_color.png
new file mode 100644
index 000000000..6779a0d2a
Binary files /dev/null and b/docs/images/logo_horizontal_color.png differ
diff --git a/mediapipe/docs/images/logo_horizontal_white.png b/docs/images/logo_horizontal_white.png
similarity index 100%
rename from mediapipe/docs/images/logo_horizontal_white.png
rename to docs/images/logo_horizontal_white.png
diff --git a/mediapipe/docs/images/logov2.png b/docs/images/logov2.png
similarity index 100%
rename from mediapipe/docs/images/logov2.png
rename to docs/images/logov2.png
diff --git a/mediapipe/docs/images/maingraph_visualizer.png b/docs/images/maingraph_visualizer.png
similarity index 100%
rename from mediapipe/docs/images/maingraph_visualizer.png
rename to docs/images/maingraph_visualizer.png
diff --git a/mediapipe/docs/images/mediapipe_small.png b/docs/images/mediapipe_small.png
similarity index 100%
rename from mediapipe/docs/images/mediapipe_small.png
rename to docs/images/mediapipe_small.png
diff --git a/mediapipe/docs/images/mobile/aar_location.png b/docs/images/mobile/aar_location.png
similarity index 100%
rename from mediapipe/docs/images/mobile/aar_location.png
rename to docs/images/mobile/aar_location.png
diff --git a/mediapipe/docs/images/mobile/android_studio_opencv_location.png b/docs/images/mobile/android_studio_opencv_location.png
similarity index 100%
rename from mediapipe/docs/images/mobile/android_studio_opencv_location.png
rename to docs/images/mobile/android_studio_opencv_location.png
diff --git a/mediapipe/docs/images/mobile/assets_location.png b/docs/images/mobile/assets_location.png
similarity index 100%
rename from mediapipe/docs/images/mobile/assets_location.png
rename to docs/images/mobile/assets_location.png
diff --git a/mediapipe/docs/images/mobile/bazel_hello_world_android.png b/docs/images/mobile/bazel_hello_world_android.png
similarity index 100%
rename from mediapipe/docs/images/mobile/bazel_hello_world_android.png
rename to docs/images/mobile/bazel_hello_world_android.png
diff --git a/mediapipe/docs/images/mobile/box_tracking_subgraph.png b/docs/images/mobile/box_tracking_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/box_tracking_subgraph.png
rename to docs/images/mobile/box_tracking_subgraph.png
diff --git a/mediapipe/docs/images/mobile/edge_detection_android_gpu.gif b/docs/images/mobile/edge_detection_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/edge_detection_android_gpu.gif
rename to docs/images/mobile/edge_detection_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/edge_detection_ios_gpu.gif b/docs/images/mobile/edge_detection_ios_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/edge_detection_ios_gpu.gif
rename to docs/images/mobile/edge_detection_ios_gpu.gif
diff --git a/mediapipe/docs/images/mobile/edge_detection_mobile_gpu.png b/docs/images/mobile/edge_detection_mobile_gpu.png
similarity index 100%
rename from mediapipe/docs/images/mobile/edge_detection_mobile_gpu.png
rename to docs/images/mobile/edge_detection_mobile_gpu.png
diff --git a/mediapipe/docs/images/mobile/face_detection_android_gpu.gif b/docs/images/mobile/face_detection_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/face_detection_android_gpu.gif
rename to docs/images/mobile/face_detection_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/face_detection_android_gpu_small.gif b/docs/images/mobile/face_detection_android_gpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/face_detection_android_gpu_small.gif
rename to docs/images/mobile/face_detection_android_gpu_small.gif
diff --git a/mediapipe/docs/images/mobile/face_detection_mobile_cpu.png b/docs/images/mobile/face_detection_mobile_cpu.png
similarity index 100%
rename from mediapipe/docs/images/mobile/face_detection_mobile_cpu.png
rename to docs/images/mobile/face_detection_mobile_cpu.png
diff --git a/mediapipe/docs/images/mobile/face_detection_mobile_gpu.png b/docs/images/mobile/face_detection_mobile_gpu.png
similarity index 100%
rename from mediapipe/docs/images/mobile/face_detection_mobile_gpu.png
rename to docs/images/mobile/face_detection_mobile_gpu.png
diff --git a/mediapipe/docs/images/mobile/face_landmark_front_gpu_subgraph.png b/docs/images/mobile/face_landmark_front_gpu_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/face_landmark_front_gpu_subgraph.png
rename to docs/images/mobile/face_landmark_front_gpu_subgraph.png
diff --git a/mediapipe/docs/images/mobile/face_mesh_android_gpu.gif b/docs/images/mobile/face_mesh_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/face_mesh_android_gpu.gif
rename to docs/images/mobile/face_mesh_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/face_mesh_android_gpu_small.gif b/docs/images/mobile/face_mesh_android_gpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/face_mesh_android_gpu_small.gif
rename to docs/images/mobile/face_mesh_android_gpu_small.gif
diff --git a/mediapipe/docs/images/mobile/face_mesh_mobile.png b/docs/images/mobile/face_mesh_mobile.png
similarity index 100%
rename from mediapipe/docs/images/mobile/face_mesh_mobile.png
rename to docs/images/mobile/face_mesh_mobile.png
diff --git a/mediapipe/docs/images/mobile/face_renderer_gpu_subgraph.png b/docs/images/mobile/face_renderer_gpu_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/face_renderer_gpu_subgraph.png
rename to docs/images/mobile/face_renderer_gpu_subgraph.png
diff --git a/mediapipe/docs/images/mobile/hair_segmentation_android_gpu.gif b/docs/images/mobile/hair_segmentation_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/hair_segmentation_android_gpu.gif
rename to docs/images/mobile/hair_segmentation_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/hair_segmentation_android_gpu_small.gif b/docs/images/mobile/hair_segmentation_android_gpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/hair_segmentation_android_gpu_small.gif
rename to docs/images/mobile/hair_segmentation_android_gpu_small.gif
diff --git a/mediapipe/docs/images/mobile/hair_segmentation_mobile_gpu.png b/docs/images/mobile/hair_segmentation_mobile_gpu.png
similarity index 100%
rename from mediapipe/docs/images/mobile/hair_segmentation_mobile_gpu.png
rename to docs/images/mobile/hair_segmentation_mobile_gpu.png
diff --git a/mediapipe/docs/images/mobile/hand_crops.png b/docs/images/mobile/hand_crops.png
similarity index 100%
rename from mediapipe/docs/images/mobile/hand_crops.png
rename to docs/images/mobile/hand_crops.png
diff --git a/mediapipe/docs/images/mobile/hand_detection_android_gpu.gif b/docs/images/mobile/hand_detection_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/hand_detection_android_gpu.gif
rename to docs/images/mobile/hand_detection_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/hand_detection_android_gpu_small.gif b/docs/images/mobile/hand_detection_android_gpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/hand_detection_android_gpu_small.gif
rename to docs/images/mobile/hand_detection_android_gpu_small.gif
diff --git a/mediapipe/docs/images/mobile/hand_detection_gpu_subgraph.png b/docs/images/mobile/hand_detection_gpu_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/hand_detection_gpu_subgraph.png
rename to docs/images/mobile/hand_detection_gpu_subgraph.png
diff --git a/mediapipe/docs/images/mobile/hand_detection_mobile.png b/docs/images/mobile/hand_detection_mobile.png
similarity index 100%
rename from mediapipe/docs/images/mobile/hand_detection_mobile.png
rename to docs/images/mobile/hand_detection_mobile.png
diff --git a/mediapipe/docs/images/mobile/hand_landmark_gpu_subgraph.png b/docs/images/mobile/hand_landmark_gpu_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/hand_landmark_gpu_subgraph.png
rename to docs/images/mobile/hand_landmark_gpu_subgraph.png
diff --git a/mediapipe/docs/images/mobile/hand_renderer_gpu_subgraph.png b/docs/images/mobile/hand_renderer_gpu_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/hand_renderer_gpu_subgraph.png
rename to docs/images/mobile/hand_renderer_gpu_subgraph.png
diff --git a/mediapipe/docs/images/mobile/hand_tracking_3d_android_gpu.gif b/docs/images/mobile/hand_tracking_3d_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/hand_tracking_3d_android_gpu.gif
rename to docs/images/mobile/hand_tracking_3d_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/hand_tracking_android_gpu.gif b/docs/images/mobile/hand_tracking_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/hand_tracking_android_gpu.gif
rename to docs/images/mobile/hand_tracking_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/hand_tracking_android_gpu_small.gif b/docs/images/mobile/hand_tracking_android_gpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/hand_tracking_android_gpu_small.gif
rename to docs/images/mobile/hand_tracking_android_gpu_small.gif
diff --git a/mediapipe/docs/images/mobile/hand_tracking_mobile.png b/docs/images/mobile/hand_tracking_mobile.png
similarity index 100%
rename from mediapipe/docs/images/mobile/hand_tracking_mobile.png
rename to docs/images/mobile/hand_tracking_mobile.png
diff --git a/mediapipe/docs/images/mobile/missing_camera_permission_android.png b/docs/images/mobile/missing_camera_permission_android.png
similarity index 100%
rename from mediapipe/docs/images/mobile/missing_camera_permission_android.png
rename to docs/images/mobile/missing_camera_permission_android.png
diff --git a/mediapipe/docs/images/mobile/multi_hand_detection_gpu_subgraph.png b/docs/images/mobile/multi_hand_detection_gpu_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/multi_hand_detection_gpu_subgraph.png
rename to docs/images/mobile/multi_hand_detection_gpu_subgraph.png
diff --git a/mediapipe/docs/images/mobile/multi_hand_landmark_subgraph.png b/docs/images/mobile/multi_hand_landmark_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/multi_hand_landmark_subgraph.png
rename to docs/images/mobile/multi_hand_landmark_subgraph.png
diff --git a/mediapipe/docs/images/mobile/multi_hand_renderer_gpu_subgraph.png b/docs/images/mobile/multi_hand_renderer_gpu_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/multi_hand_renderer_gpu_subgraph.png
rename to docs/images/mobile/multi_hand_renderer_gpu_subgraph.png
diff --git a/mediapipe/docs/images/mobile/multi_hand_tracking_3d_android_gpu.gif b/docs/images/mobile/multi_hand_tracking_3d_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/multi_hand_tracking_3d_android_gpu.gif
rename to docs/images/mobile/multi_hand_tracking_3d_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/multi_hand_tracking_3d_android_gpu_small.gif b/docs/images/mobile/multi_hand_tracking_3d_android_gpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/multi_hand_tracking_3d_android_gpu_small.gif
rename to docs/images/mobile/multi_hand_tracking_3d_android_gpu_small.gif
diff --git a/mediapipe/docs/images/mobile/multi_hand_tracking_android_gpu.gif b/docs/images/mobile/multi_hand_tracking_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/multi_hand_tracking_android_gpu.gif
rename to docs/images/mobile/multi_hand_tracking_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/multi_hand_tracking_mobile.png b/docs/images/mobile/multi_hand_tracking_mobile.png
similarity index 100%
rename from mediapipe/docs/images/mobile/multi_hand_tracking_mobile.png
rename to docs/images/mobile/multi_hand_tracking_mobile.png
diff --git a/mediapipe/docs/images/mobile/object_detection_3d_android_gpu.png b/docs/images/mobile/object_detection_3d_android_gpu.png
similarity index 100%
rename from mediapipe/docs/images/mobile/object_detection_3d_android_gpu.png
rename to docs/images/mobile/object_detection_3d_android_gpu.png
diff --git a/mediapipe/docs/images/mobile/object_detection_android_cpu.gif b/docs/images/mobile/object_detection_android_cpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/object_detection_android_cpu.gif
rename to docs/images/mobile/object_detection_android_cpu.gif
diff --git a/mediapipe/docs/images/mobile/object_detection_android_gpu.gif b/docs/images/mobile/object_detection_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/object_detection_android_gpu.gif
rename to docs/images/mobile/object_detection_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/object_detection_android_gpu_small.gif b/docs/images/mobile/object_detection_android_gpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/object_detection_android_gpu_small.gif
rename to docs/images/mobile/object_detection_android_gpu_small.gif
diff --git a/mediapipe/docs/images/mobile/object_detection_gpu_subgraph.png b/docs/images/mobile/object_detection_gpu_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/object_detection_gpu_subgraph.png
rename to docs/images/mobile/object_detection_gpu_subgraph.png
diff --git a/mediapipe/docs/images/mobile/object_detection_mobile_cpu.png b/docs/images/mobile/object_detection_mobile_cpu.png
similarity index 100%
rename from mediapipe/docs/images/mobile/object_detection_mobile_cpu.png
rename to docs/images/mobile/object_detection_mobile_cpu.png
diff --git a/mediapipe/docs/images/mobile/object_detection_mobile_gpu.png b/docs/images/mobile/object_detection_mobile_gpu.png
similarity index 100%
rename from mediapipe/docs/images/mobile/object_detection_mobile_gpu.png
rename to docs/images/mobile/object_detection_mobile_gpu.png
diff --git a/mediapipe/docs/images/mobile/object_tracking_android_gpu.gif b/docs/images/mobile/object_tracking_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/object_tracking_android_gpu.gif
rename to docs/images/mobile/object_tracking_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/object_tracking_android_gpu_detection_only.gif b/docs/images/mobile/object_tracking_android_gpu_detection_only.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/object_tracking_android_gpu_detection_only.gif
rename to docs/images/mobile/object_tracking_android_gpu_detection_only.gif
diff --git a/mediapipe/docs/images/mobile/object_tracking_android_gpu_small.gif b/docs/images/mobile/object_tracking_android_gpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/object_tracking_android_gpu_small.gif
rename to docs/images/mobile/object_tracking_android_gpu_small.gif
diff --git a/mediapipe/docs/images/mobile/object_tracking_mobile_gpu.png b/docs/images/mobile/object_tracking_mobile_gpu.png
similarity index 100%
rename from mediapipe/docs/images/mobile/object_tracking_mobile_gpu.png
rename to docs/images/mobile/object_tracking_mobile_gpu.png
diff --git a/mediapipe/docs/images/mobile/object_tracking_renderer_gpu_subgraph.png b/docs/images/mobile/object_tracking_renderer_gpu_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/object_tracking_renderer_gpu_subgraph.png
rename to docs/images/mobile/object_tracking_renderer_gpu_subgraph.png
diff --git a/mediapipe/docs/images/mobile/object_tracking_subgraph.png b/docs/images/mobile/object_tracking_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/object_tracking_subgraph.png
rename to docs/images/mobile/object_tracking_subgraph.png
diff --git a/mediapipe/docs/images/mobile/objectron_chair_android_gpu.gif b/docs/images/mobile/objectron_chair_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/objectron_chair_android_gpu.gif
rename to docs/images/mobile/objectron_chair_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/objectron_chair_android_gpu_small.gif b/docs/images/mobile/objectron_chair_android_gpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/objectron_chair_android_gpu_small.gif
rename to docs/images/mobile/objectron_chair_android_gpu_small.gif
diff --git a/mediapipe/docs/images/mobile/objectron_detection_subgraph.png b/docs/images/mobile/objectron_detection_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/objectron_detection_subgraph.png
rename to docs/images/mobile/objectron_detection_subgraph.png
diff --git a/mediapipe/docs/images/mobile/objectron_shoe_android_gpu.gif b/docs/images/mobile/objectron_shoe_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/objectron_shoe_android_gpu.gif
rename to docs/images/mobile/objectron_shoe_android_gpu.gif
diff --git a/mediapipe/docs/images/mobile/objectron_shoe_android_gpu_small.gif b/docs/images/mobile/objectron_shoe_android_gpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/objectron_shoe_android_gpu_small.gif
rename to docs/images/mobile/objectron_shoe_android_gpu_small.gif
diff --git a/mediapipe/docs/images/mobile/objectron_tracking_subgraph.png b/docs/images/mobile/objectron_tracking_subgraph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/objectron_tracking_subgraph.png
rename to docs/images/mobile/objectron_tracking_subgraph.png
diff --git a/mediapipe/docs/images/mobile/renderer_gpu.png b/docs/images/mobile/renderer_gpu.png
similarity index 100%
rename from mediapipe/docs/images/mobile/renderer_gpu.png
rename to docs/images/mobile/renderer_gpu.png
diff --git a/mediapipe/docs/images/mobile/template_matching_android_cpu.gif b/docs/images/mobile/template_matching_android_cpu.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/template_matching_android_cpu.gif
rename to docs/images/mobile/template_matching_android_cpu.gif
diff --git a/mediapipe/docs/images/mobile/template_matching_android_cpu_small.gif b/docs/images/mobile/template_matching_android_cpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/mobile/template_matching_android_cpu_small.gif
rename to docs/images/mobile/template_matching_android_cpu_small.gif
diff --git a/mediapipe/docs/images/mobile/template_matching_mobile_graph.png b/docs/images/mobile/template_matching_mobile_graph.png
similarity index 100%
rename from mediapipe/docs/images/mobile/template_matching_mobile_graph.png
rename to docs/images/mobile/template_matching_mobile_graph.png
diff --git a/mediapipe/docs/images/mobile/template_matching_mobile_template.jpg b/docs/images/mobile/template_matching_mobile_template.jpg
similarity index 100%
rename from mediapipe/docs/images/mobile/template_matching_mobile_template.jpg
rename to docs/images/mobile/template_matching_mobile_template.jpg
diff --git a/mediapipe/docs/images/multi_hand_tracking_android_gpu.gif b/docs/images/multi_hand_tracking_android_gpu.gif
similarity index 100%
rename from mediapipe/docs/images/multi_hand_tracking_android_gpu.gif
rename to docs/images/multi_hand_tracking_android_gpu.gif
diff --git a/mediapipe/docs/images/multi_hand_tracking_android_gpu_small.gif b/docs/images/multi_hand_tracking_android_gpu_small.gif
similarity index 100%
rename from mediapipe/docs/images/multi_hand_tracking_android_gpu_small.gif
rename to docs/images/multi_hand_tracking_android_gpu_small.gif
diff --git a/mediapipe/docs/images/multi_hand_tracking_desktop.png b/docs/images/multi_hand_tracking_desktop.png
similarity index 100%
rename from mediapipe/docs/images/multi_hand_tracking_desktop.png
rename to docs/images/multi_hand_tracking_desktop.png
diff --git a/mediapipe/docs/images/object_detection_desktop_tensorflow.png b/docs/images/object_detection_desktop_tensorflow.png
similarity index 100%
rename from mediapipe/docs/images/object_detection_desktop_tensorflow.png
rename to docs/images/object_detection_desktop_tensorflow.png
diff --git a/mediapipe/docs/images/object_detection_desktop_tflite.png b/docs/images/object_detection_desktop_tflite.png
similarity index 100%
rename from mediapipe/docs/images/object_detection_desktop_tflite.png
rename to docs/images/object_detection_desktop_tflite.png
diff --git a/docs/images/objectron_data_annotation.gif b/docs/images/objectron_data_annotation.gif
new file mode 100644
index 000000000..6466f7735
Binary files /dev/null and b/docs/images/objectron_data_annotation.gif differ
diff --git a/docs/images/objectron_example_results.png b/docs/images/objectron_example_results.png
new file mode 100644
index 000000000..977da33cc
Binary files /dev/null and b/docs/images/objectron_example_results.png differ
diff --git a/docs/images/objectron_network_architecture.png b/docs/images/objectron_network_architecture.png
new file mode 100644
index 000000000..2f0b6d9b2
Binary files /dev/null and b/docs/images/objectron_network_architecture.png differ
diff --git a/docs/images/objectron_sample_network_results.png b/docs/images/objectron_sample_network_results.png
new file mode 100644
index 000000000..e3ae90f8a
Binary files /dev/null and b/docs/images/objectron_sample_network_results.png differ
diff --git a/docs/images/objectron_synthetic_data_generation.gif b/docs/images/objectron_synthetic_data_generation.gif
new file mode 100644
index 000000000..77705cca3
Binary files /dev/null and b/docs/images/objectron_synthetic_data_generation.gif differ
diff --git a/docs/images/open_source.png b/docs/images/open_source.png
new file mode 100644
index 000000000..f337c8748
Binary files /dev/null and b/docs/images/open_source.png differ
diff --git a/docs/images/open_source_small.png b/docs/images/open_source_small.png
new file mode 100644
index 000000000..c64ca50d3
Binary files /dev/null and b/docs/images/open_source_small.png differ
diff --git a/mediapipe/docs/images/packet_cloner_calculator.png b/docs/images/packet_cloner_calculator.png
similarity index 100%
rename from mediapipe/docs/images/packet_cloner_calculator.png
rename to docs/images/packet_cloner_calculator.png
diff --git a/docs/images/ready_to_use.png b/docs/images/ready_to_use.png
new file mode 100644
index 000000000..fbccbe830
Binary files /dev/null and b/docs/images/ready_to_use.png differ
diff --git a/docs/images/ready_to_use_small.png b/docs/images/ready_to_use_small.png
new file mode 100644
index 000000000..5091faaf6
Binary files /dev/null and b/docs/images/ready_to_use_small.png differ
diff --git a/mediapipe/docs/images/realtime_face_detection.gif b/docs/images/realtime_face_detection.gif
similarity index 100%
rename from mediapipe/docs/images/realtime_face_detection.gif
rename to docs/images/realtime_face_detection.gif
diff --git a/mediapipe/docs/images/side_packet.png b/docs/images/side_packet.png
similarity index 100%
rename from mediapipe/docs/images/side_packet.png
rename to docs/images/side_packet.png
diff --git a/mediapipe/docs/images/side_packet_code.png b/docs/images/side_packet_code.png
similarity index 100%
rename from mediapipe/docs/images/side_packet_code.png
rename to docs/images/side_packet_code.png
diff --git a/mediapipe/docs/images/special_nodes.png b/docs/images/special_nodes.png
similarity index 100%
rename from mediapipe/docs/images/special_nodes.png
rename to docs/images/special_nodes.png
diff --git a/mediapipe/docs/images/special_nodes_code.png b/docs/images/special_nodes_code.png
similarity index 100%
rename from mediapipe/docs/images/special_nodes_code.png
rename to docs/images/special_nodes_code.png
diff --git a/mediapipe/docs/images/startup_screen.png b/docs/images/startup_screen.png
similarity index 100%
rename from mediapipe/docs/images/startup_screen.png
rename to docs/images/startup_screen.png
diff --git a/mediapipe/docs/images/stream_code.png b/docs/images/stream_code.png
similarity index 100%
rename from mediapipe/docs/images/stream_code.png
rename to docs/images/stream_code.png
diff --git a/mediapipe/docs/images/stream_ui.png b/docs/images/stream_ui.png
similarity index 100%
rename from mediapipe/docs/images/stream_ui.png
rename to docs/images/stream_ui.png
diff --git a/mediapipe/docs/images/upload_2pbtxt.png b/docs/images/upload_2pbtxt.png
similarity index 100%
rename from mediapipe/docs/images/upload_2pbtxt.png
rename to docs/images/upload_2pbtxt.png
diff --git a/mediapipe/docs/images/upload_button.png b/docs/images/upload_button.png
similarity index 100%
rename from mediapipe/docs/images/upload_button.png
rename to docs/images/upload_button.png
diff --git a/mediapipe/docs/images/upload_graph_button.png b/docs/images/upload_graph_button.png
similarity index 100%
rename from mediapipe/docs/images/upload_graph_button.png
rename to docs/images/upload_graph_button.png
diff --git a/mediapipe/docs/images/visualizer/ios_download_container.png b/docs/images/visualizer/ios_download_container.png
similarity index 100%
rename from mediapipe/docs/images/visualizer/ios_download_container.png
rename to docs/images/visualizer/ios_download_container.png
diff --git a/mediapipe/docs/images/visualizer/ios_window_devices.png b/docs/images/visualizer/ios_window_devices.png
similarity index 100%
rename from mediapipe/docs/images/visualizer/ios_window_devices.png
rename to docs/images/visualizer/ios_window_devices.png
diff --git a/mediapipe/docs/images/visualizer/viz_chart_view.png b/docs/images/visualizer/viz_chart_view.png
similarity index 100%
rename from mediapipe/docs/images/visualizer/viz_chart_view.png
rename to docs/images/visualizer/viz_chart_view.png
diff --git a/mediapipe/docs/images/visualizer/viz_click_upload.png b/docs/images/visualizer/viz_click_upload.png
similarity index 100%
rename from mediapipe/docs/images/visualizer/viz_click_upload.png
rename to docs/images/visualizer/viz_click_upload.png
diff --git a/mediapipe/docs/images/visualizer/viz_click_upload_trace_file.png b/docs/images/visualizer/viz_click_upload_trace_file.png
similarity index 100%
rename from mediapipe/docs/images/visualizer/viz_click_upload_trace_file.png
rename to docs/images/visualizer/viz_click_upload_trace_file.png
diff --git a/docs/images/visualizer_runner.png b/docs/images/visualizer_runner.png
new file mode 100644
index 000000000..5224a0949
Binary files /dev/null and b/docs/images/visualizer_runner.png differ
diff --git a/mediapipe/docs/images/web_effect.gif b/docs/images/web_effect.gif
similarity index 100%
rename from mediapipe/docs/images/web_effect.gif
rename to docs/images/web_effect.gif
diff --git a/mediapipe/docs/images/web_segmentation.gif b/docs/images/web_segmentation.gif
similarity index 100%
rename from mediapipe/docs/images/web_segmentation.gif
rename to docs/images/web_segmentation.gif
diff --git a/docs/index.md b/docs/index.md
new file mode 100644
index 000000000..95a54cc1a
--- /dev/null
+++ b/docs/index.md
@@ -0,0 +1,141 @@
+---
+layout: default
+title: Home
+nav_order: 1
+---
+
+![MediaPipe](images/mediapipe_small.png)
+
+--------------------------------------------------------------------------------
+
+## Cross-platform ML solutions made simple
+
+[MediaPipe](https://google.github.io/mediapipe/) is the simplest way for researchers
+and developers to build world-class ML solutions and applications for mobile,
+desktop/cloud, web and IoT devices.
+
+![accelerated.png](images/accelerated_small.png)                                                               | ![cross_platform.png](images/cross_platform_small.png)
+:------------------------------------------------------------------------------------------------------------: | :----------------------------------------------------:
+***End-to-End acceleration***: *built-in fast ML inference and processing accelerated even on common hardware* | ***Build once, deploy anywhere***: *Unified solution works across Android, iOS, desktop/cloud, web and IoT*
+![ready_to_use.png](images/ready_to_use_small.png)                                                             | ![open_source.png](images/open_source_small.png)
+***Ready-to-use solutions***: *Cutting-edge ML solutions demonstrating full power of the framework*            | ***Free and open source***: *Framework and solutions both under Apache 2.0, fully extensible and customizable*
+
+## ML solutions in MediaPipe
+
+Face Detection                                                                                                                 | Face Mesh                                                                                                       | Hand                                                                                                      | Hair Segmentation
+:----------------------------------------------------------------------------------------------------------------------------: | :-------------------------------------------------------------------------------------------------------------: | :-------------------------------------------------------------------------------------------------------: | :---------------:
+[![face_detection](images/mobile/face_detection_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/face_detection) | [![face_mesh](images/mobile/face_mesh_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/face_mesh) | [![hand](images/mobile/hand_tracking_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/hand) | [![hair_segmentation](images/mobile/hair_segmentation_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/hair_segmentation)
+
+Object Detection                                                                                                                     | Box Tracking                                                                                                                | Objectron                                                                                                             | KNIFT
+:----------------------------------------------------------------------------------------------------------------------------------: | :-------------------------------------------------------------------------------------------------------------------------: | :-------------------------------------------------------------------------------------------------------------------: | :---:
+[![object_detection](images/mobile/object_detection_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/object_detection) | [![box_tracking](images/mobile/object_tracking_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/box_tracking) | [![objectron](images/mobile/objectron_chair_android_gpu_small.gif)](https://google.github.io/mediapipe/solutions/objectron) | [![knift](images/mobile/template_matching_android_cpu_small.gif)](https://google.github.io/mediapipe/solutions/knift)
+
+<!-- []() in the first cell is needed to preserve table formatting in GitHub Pages. -->
+<!-- Whenever this table is updated, paste a copy to solutions/solutions.md. -->
+
+[]()                                                                          | Android | iOS | Desktop | Web | Coral
+:---------------------------------------------------------------------------- | :-----: | :-: | :-----: | :-: | :---:
+[Face Detection](https://google.github.io/mediapipe/solutions/face_detection)       | ✅       | ✅   | ✅       | ✅   | ✅
+[Face Mesh](https://google.github.io/mediapipe/solutions/face_mesh)                 | ✅       | ✅   | ✅       |     |
+[Hand](https://google.github.io/mediapipe/solutions/hand)                           | ✅       | ✅   | ✅       | ✅   |
+[Hair Segmentation](https://google.github.io/mediapipe/solutions/hair_segmentation) | ✅       |     | ✅       | ✅   |
+[Object Detection](https://google.github.io/mediapipe/solutions/object_detection)   | ✅       | ✅   | ✅       |     | ✅
+[Box Tracking](https://google.github.io/mediapipe/solutions/box_tracking)           | ✅       | ✅   | ✅       |     |
+[Objectron](https://google.github.io/mediapipe/solutions/objectron)                 | ✅       |     |         |     |
+[KNIFT](https://google.github.io/mediapipe/solutions/knift)                         | ✅       |     |         |     |
+[AutoFlip](https://google.github.io/mediapipe/solutions/autoflip)                   |         |     | ✅       |     |
+[MediaSequence](https://google.github.io/mediapipe/solutions/media_sequence)        |         |     | ✅       |     |
+[YouTube 8M](https://google.github.io/mediapipe/solutions/youtube_8m)               |         |     | ✅       |     |
+
+## MediaPipe on the Web
+
+MediaPipe on the Web is an effort to run the same ML solutions built for mobile
+and desktop also in web browsers. The official API is under construction, but
+the core technology has been proven effective. Please see
+[MediaPipe on the Web](https://developers.googleblog.com/2020/01/mediapipe-on-web.html)
+in Google Developers Blog for details.
+
+You can use the following links to load a demo in the MediaPipe Visualizer, and
+there click the "Runner" icon in the top bar as shown below. The demos use
+your webcam video as input, which is processed locally in real time and
+never leaves your device.
+
+![visualizer_runner](images/visualizer_runner.png)
+
+*   [MediaPipe Face Detection](https://viz.mediapipe.dev/demo/face_detection)
+*   [MediaPipe Hand](https://viz.mediapipe.dev/demo/hand_tracking)
+*   [MediaPipe Hand (palm/hand detection only)](https://viz.mediapipe.dev/demo/hand_detection)
+*   [MediaPipe Hair Segmentation](https://viz.mediapipe.dev/demo/hair_segmentation)
+
+## Getting started
+
+Learn how to [install](https://google.github.io/mediapipe/getting_started/install)
+MediaPipe and
+[build example applications](https://google.github.io/mediapipe/getting_started/building_examples),
+and start exploring our ready-to-use
+[solutions](https://google.github.io/mediapipe/solutions/solutions) that you can
+further extend and customize.
+
+The source code is hosted in the
+[MediaPipe Github repository](https://github.com/google/mediapipe), and you can
+run code search using
+[Google Open Source Code Search](https://cs.opensource.google/mediapipe/mediapipe).
+
+## Publications
+
+*   [MediaPipe KNIFT: Template-based feature matching](https://developers.googleblog.com/2020/04/mediapipe-knift-template-based-feature-matching.html)
+    in Google Developers Blog
+*   [Alfred Camera: Smart camera features using MediaPipe](https://developers.googleblog.com/2020/03/alfred-camera-smart-camera-features-using-mediapipe.html)
+    in Google Developers Blog
+*   [Real-Time 3D Object Detection on Mobile Devices with MediaPipe](https://ai.googleblog.com/2020/03/real-time-3d-object-detection-on-mobile.html)
+    in Google AI Blog
+*   [AutoFlip: An Open Source Framework for Intelligent Video Reframing](https://ai.googleblog.com/2020/02/autoflip-open-source-framework-for.html)
+    in Google AI Blog
+*   [MediaPipe on the Web](https://developers.googleblog.com/2020/01/mediapipe-on-web.html)
+    in Google Developers Blog
+*   [Object Detection and Tracking using MediaPipe](https://developers.googleblog.com/2019/12/object-detection-and-tracking-using-mediapipe.html)
+    in Google Developers Blog
+*   [On-Device, Real-Time Hand Tracking with MediaPipe](https://ai.googleblog.com/2019/08/on-device-real-time-hand-tracking-with.html)
+    in Google AI Blog
+*   [MediaPipe: A Framework for Building Perception Pipelines](https://arxiv.org/abs/1906.08172)
+
+## Videos
+
+*   [YouTube Channel](https://www.youtube.com/channel/UCObqmpuSMx-usADtL_qdMAw)
+
+## Events
+
+*   [MediaPipe Seattle Meetup, Google Building Waterside, 13 Feb 2020](https://mediapipe.page.link/seattle2020)
+*   [AI Nextcon 2020, 12-16 Feb 2020, Seattle](http://aisea20.xnextcon.com/)
+*   [MediaPipe Madrid Meetup, 16 Dec 2019](https://www.meetup.com/Madrid-AI-Developers-Group/events/266329088/)
+*   [MediaPipe London Meetup, Google 123 Building, 12 Dec 2019](https://www.meetup.com/London-AI-Tech-Talk/events/266329038)
+*   [ML Conference, Berlin, 11 Dec 2019](https://mlconference.ai/machine-learning-advanced-development/mediapipe-building-real-time-cross-platform-mobile-web-edge-desktop-video-audio-ml-pipelines/)
+*   [MediaPipe Berlin Meetup, Google Berlin, 11 Dec 2019](https://www.meetup.com/Berlin-AI-Tech-Talk/events/266328794/)
+*   [The 3rd Workshop on YouTube-8M Large Scale Video Understanding,
+    Seoul, Korea ICCV
+    2019](https://research.google.com/youtube8m/workshop2019/index.html)
+*   [AI DevWorld 2019, 10 Oct 2019, San Jose, CA](https://aidevworld.com)
+*   [Google Industry Workshop at ICIP 2019, 24 Sept 2019, Taipei, Taiwan](http://2019.ieeeicip.org/?action=page4&id=14#Google)
+    ([presentation](https://docs.google.com/presentation/d/e/2PACX-1vRIBBbO_LO9v2YmvbHHEt1cwyqH6EjDxiILjuT0foXy1E7g6uyh4CesB2DkkEwlRDO9_lWfuKMZx98T/pub?start=false&loop=false&delayms=3000&slide=id.g556cc1a659_0_5))
+*   [Open sourced at CVPR 2019, 17~20 June, Long Beach, CA](https://sites.google.com/corp/view/perception-cv4arvr/mediapipe)
+
+## Community
+
+*   [Awesome MediaPipe](https://mediapipe.org) - A curated list of awesome
+    MediaPipe related frameworks, libraries and software
+*   [Slack community](https://mediapipe.slack.com) for MediaPipe users
+*   [Discuss](https://groups.google.com/forum/#!forum/mediapipe) - General
+    community discussion around MediaPipe
+
+## Alpha Disclaimer
+
+MediaPipe is currently in alpha at v0.7. We may still be making breaking API
+changes and expect to get to stable APIs by v1.0.
+
+## Contributing
+
+We welcome contributions. Please follow these
+[guidelines](https://github.com/google/mediapipe/blob/master/CONTRIBUTING.md).
+
+We use GitHub issues for tracking requests and bugs. Please post questions to
+the MediaPipe Stack Overflow with a `mediapipe` tag.
diff --git a/mediapipe/docs/index.rst b/docs/index.rst
similarity index 84%
rename from mediapipe/docs/index.rst
rename to docs/index.rst
index 870d02b2b..d112c3cda 100644
--- a/mediapipe/docs/index.rst
+++ b/docs/index.rst
@@ -41,18 +41,20 @@ User Documentation
 .. toctree::
    :maxdepth: 3
 
-   install
-   concepts
-   calculator
+   getting_started/install
    Examples <examples>
-   visualizer
-   measure_performance
-   how_to_questions
-   troubleshooting
-   help
-   framework_concepts
-   gpu
-   scheduling_sync
+   tools/visualizer
+   tools/tracing_and_profiling
+   tools/performance_benchmarking
+   getting_started/help
+   getting_started/faq
+   getting_started/troubleshooting
+   framework_concepts/framework_concepts
+   framework_concepts/calculators
+   framework_concepts/graphs
+   framework_concepts/packets
+   framework_concepts/synchronization
+   framework_concepts/gpu
    license
 
 Indices and tables
diff --git a/mediapipe/docs/license.md b/docs/license.md
similarity index 99%
rename from mediapipe/docs/license.md
rename to docs/license.md
index 9a98f8910..9787bc748 100644
--- a/mediapipe/docs/license.md
+++ b/docs/license.md
@@ -1,3 +1,7 @@
+---
+nav_exclude: true
+---
+
 License
 ===============
 Copyright 2019 The MediaPipe Authors.  All rights reserved.
diff --git a/docs/solutions/autoflip.md b/docs/solutions/autoflip.md
new file mode 100644
index 000000000..f78b4ae95
--- /dev/null
+++ b/docs/solutions/autoflip.md
@@ -0,0 +1,356 @@
+---
+layout: default
+title: AutoFlip (Saliency-aware Video Cropping)
+parent: Solutions
+nav_order: 9
+---
+
+# AutoFlip: Saliency-aware Video Cropping
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+## Overview
+
+AutoFlip is an automatic video cropping pipeline built on top of MediaPipe. This
+example focuses on demonstrating how to use AutoFlip to convert an input video
+to arbitrary aspect ratios.
+
+For overall context on AutoFlip, please read this
+[Google AI Blog](https://ai.googleblog.com/2020/02/autoflip-open-source-framework-for.html).
+
+![AutoFlip edited example](../images/autoflip_edited_example.gif)
+
+## Building
+
+Run the following command to build the AutoFlip pipeline:
+
+Note: AutoFlip currently only works with OpenCV 3. Please verify your OpenCV
+version beforehand.
+
+```bash
+bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 mediapipe/examples/desktop/autoflip:run_autoflip
+```
+
+## Running
+
+```bash
+GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/autoflip/run_autoflip \
+  --calculator_graph_config_file=mediapipe/examples/desktop/autoflip/autoflip_graph.pbtxt \
+  --input_side_packets=input_video_path=/absolute/path/to/the/local/video/file,output_video_path=/absolute/path/to/save/the/output/video/file,aspect_ratio=1:1
+```
+
+Use the `aspect_ratio` flag to provide the output aspect ratio. The format
+should be `width:height`, where the `width` and `height` are two positive
+integers. AutoFlip supports both landscape-to-portrait and portrait-to-landscape
+conversions. The pipeline internally compares the target aspect ratio against
+the original one, and determines the correct conversion automatically.
+
+We have put a couple of test videos under this
+[Google Drive folder](https://drive.google.com/corp/drive/u/0/folders/1KK9LV--Ey0UEVpxssVLhVl7dypgJSQgk).
+You could download the videos into your local file system, then modify the
+command above accordingly to run AutoFlip against the videos.
+
+## MediaPipe Graph
+
+![graph visualization](../images/autoflip_graph.png)
+
+To visualize the graph as shown above, copy the text specification of the graph
+below and paste it into [MediaPipe Visualizer](https://viz.mediapipe.dev).
+
+```bash
+# Autoflip graph that only renders the final cropped video. For use with
+# end user applications.
+max_queue_size: -1
+
+# VIDEO_PREP: Decodes an input video file into images and a video header.
+node {
+  calculator: "OpenCvVideoDecoderCalculator"
+  input_side_packet: "INPUT_FILE_PATH:input_video_path"
+  output_stream: "VIDEO:video_raw"
+  output_stream: "VIDEO_PRESTREAM:video_header"
+  output_side_packet: "SAVED_AUDIO_PATH:audio_path"
+}
+
+# VIDEO_PREP: Scale the input video before feature extraction.
+node {
+  calculator: "ScaleImageCalculator"
+  input_stream: "FRAMES:video_raw"
+  input_stream: "VIDEO_HEADER:video_header"
+  output_stream: "FRAMES:video_frames_scaled"
+  node_options: {
+    [type.googleapis.com/mediapipe.ScaleImageCalculatorOptions]: {
+      preserve_aspect_ratio: true
+      output_format: SRGB
+      target_width: 480
+      algorithm: DEFAULT_WITHOUT_UPSCALE
+    }
+  }
+}
+
+# VIDEO_PREP: Create a low frame rate stream for feature extraction.
+node {
+  calculator: "PacketThinnerCalculator"
+  input_stream: "video_frames_scaled"
+  output_stream: "video_frames_scaled_downsampled"
+  node_options: {
+    [type.googleapis.com/mediapipe.PacketThinnerCalculatorOptions]: {
+      thinner_type: ASYNC
+      period: 200000
+    }
+  }
+}
+
+# DETECTION: find borders around the video and major background color.
+node {
+  calculator: "BorderDetectionCalculator"
+  input_stream: "VIDEO:video_raw"
+  output_stream: "DETECTED_BORDERS:borders"
+}
+
+# DETECTION: find shot/scene boundaries on the full frame rate stream.
+node {
+  calculator: "ShotBoundaryCalculator"
+  input_stream: "VIDEO:video_frames_scaled"
+  output_stream: "IS_SHOT_CHANGE:shot_change"
+  options {
+    [type.googleapis.com/mediapipe.autoflip.ShotBoundaryCalculatorOptions] {
+      min_shot_span: 0.2
+      min_motion: 0.3
+      window_size: 15
+      min_shot_measure: 10
+      min_motion_with_shot_measure: 0.05
+    }
+  }
+}
+
+# DETECTION: find faces on the down sampled stream
+node {
+  calculator: "AutoFlipFaceDetectionSubgraph"
+  input_stream: "VIDEO:video_frames_scaled_downsampled"
+  output_stream: "DETECTIONS:face_detections"
+}
+node {
+  calculator: "FaceToRegionCalculator"
+  input_stream: "VIDEO:video_frames_scaled_downsampled"
+  input_stream: "FACES:face_detections"
+  output_stream: "REGIONS:face_regions"
+}
+
+# DETECTION: find objects on the down sampled stream
+node {
+  calculator: "AutoFlipObjectDetectionSubgraph"
+  input_stream: "VIDEO:video_frames_scaled_downsampled"
+  output_stream: "DETECTIONS:object_detections"
+}
+node {
+  calculator: "LocalizationToRegionCalculator"
+  input_stream: "DETECTIONS:object_detections"
+  output_stream: "REGIONS:object_regions"
+  options {
+    [type.googleapis.com/mediapipe.autoflip.LocalizationToRegionCalculatorOptions] {
+      output_all_signals: true
+    }
+  }
+}
+
+# SIGNAL FUSION: Combine detections (with weights) on each frame
+node {
+  calculator: "SignalFusingCalculator"
+  input_stream: "shot_change"
+  input_stream: "face_regions"
+  input_stream: "object_regions"
+  output_stream: "salient_regions"
+  options {
+    [type.googleapis.com/mediapipe.autoflip.SignalFusingCalculatorOptions] {
+      signal_settings {
+        type { standard: FACE_CORE_LANDMARKS }
+        min_score: 0.85
+        max_score: 0.9
+        is_required: false
+      }
+      signal_settings {
+        type { standard: FACE_ALL_LANDMARKS }
+        min_score: 0.8
+        max_score: 0.85
+        is_required: false
+      }
+      signal_settings {
+        type { standard: FACE_FULL }
+        min_score: 0.8
+        max_score: 0.85
+        is_required: false
+      }
+      signal_settings {
+        type: { standard: HUMAN }
+        min_score: 0.75
+        max_score: 0.8
+        is_required: false
+      }
+      signal_settings {
+        type: { standard: PET }
+        min_score: 0.7
+        max_score: 0.75
+        is_required: false
+      }
+      signal_settings {
+        type: { standard: CAR }
+        min_score: 0.7
+        max_score: 0.75
+        is_required: false
+      }
+      signal_settings {
+        type: { standard: OBJECT }
+        min_score: 0.1
+        max_score: 0.2
+        is_required: false
+      }
+    }
+  }
+}
+
+# CROPPING: make decisions about how to crop each frame.
+node {
+  calculator: "SceneCroppingCalculator"
+  input_side_packet: "EXTERNAL_ASPECT_RATIO:aspect_ratio"
+  input_stream: "VIDEO_FRAMES:video_raw"
+  input_stream: "KEY_FRAMES:video_frames_scaled_downsampled"
+  input_stream: "DETECTION_FEATURES:salient_regions"
+  input_stream: "STATIC_FEATURES:borders"
+  input_stream: "SHOT_BOUNDARIES:shot_change"
+  output_stream: "CROPPED_FRAMES:cropped_frames"
+  node_options: {
+    [type.googleapis.com/mediapipe.autoflip.SceneCroppingCalculatorOptions]: {
+      max_scene_size: 600
+      key_frame_crop_options: {
+        score_aggregation_type: CONSTANT
+      }
+      scene_camera_motion_analyzer_options: {
+        motion_stabilization_threshold_percent: 0.5
+        salient_point_bound: 0.499
+      }
+      padding_parameters: {
+        blur_cv_size: 200
+        overlay_opacity: 0.6
+      }
+      target_size_type: MAXIMIZE_TARGET_DIMENSION
+    }
+  }
+}
+
+# ENCODING(required): encode the video stream for the final cropped output.
+node {
+  calculator: "VideoPreStreamCalculator"
+  # Fetch frame format and dimension from input frames.
+  input_stream: "FRAME:cropped_frames"
+  # Copying frame rate and duration from original video.
+  input_stream: "VIDEO_PRESTREAM:video_header"
+  output_stream: "output_frames_video_header"
+}
+
+node {
+  calculator: "OpenCvVideoEncoderCalculator"
+  input_stream: "VIDEO:cropped_frames"
+  input_stream: "VIDEO_PRESTREAM:output_frames_video_header"
+  input_side_packet: "OUTPUT_FILE_PATH:output_video_path"
+  input_side_packet: "AUDIO_FILE_PATH:audio_path"
+  node_options: {
+    [type.googleapis.com/mediapipe.OpenCvVideoEncoderCalculatorOptions]: {
+      codec: "avc1"
+      video_format: "mp4"
+    }
+  }
+}
+```
+
+## Advanced Parameters
+
+### Required vs. Best-Effort Saliency Features
+
+AutoFlip allows users to implement and specify custom features to be used in the
+camera trajectory computation. If the user would like to detect and preserve
+scenes of lions in a wildlife protection video, for example, they could
+implement and add a feature detection calculator for lions into the pipeline.
+Refer to `AutoFlipFaceDetectionSubgraph` and `FaceToRegionCalculator`, or
+`AutoFlipObjectDetectionSubgraph` and `LocalizationToRegionCalculator` for
+examples of how to create new feature detection calculators.
+
+After adding different feature signals into the graph, use the
+`SignalFusingCalculator` node to specify types and weights for different feature
+signals. For example, in the graph above, we specified the `face_regions` and
+`object_regions` input streams to represent face signals and agnostic object
+signals, respectively.
+
+The larger the weight, the more important the features will be considered when
+AutoFlip computes the camera trajectory. Use the `is_required` flag to mark a
+feature as a hard constraint, in which case the computed camera trajectory will
+try its best to cover these feature types in the cropped videos. If for some
+reason the required features cannot all be covered (for example, when they are
+too spread out in the video), AutoFlip will apply a padding effect to cover as
+much salient content as possible. See the illustration below.
+
+![graph is_required](../images/autoflip_is_required.gif)
+
+### Stable vs Tracking Camera Motion
+
+AutoFlip makes a decision on each scene whether to have the cropped viewpoint
+follow an object or if the crop should remain stable (centered on detected
+objects). The value of the `motion_stabilization_threshold_percent` parameter
+is used to decide whether to track action or keep the camera stable. If, over
+the duration of the scene, all detected focus objects remain within this ratio
+of the frame (e.g. 0.5 = 50% or 1920 * .5 = 960 pixels on 1080p video), then
+the camera is held steady. Otherwise the camera tracks activity within the frame.
+
+### Snap To Center
+
+For some scenes the camera viewpoint will remain stable at the center of
+activity (see `motion_stabilization_threshold_percent` setting). In this case,
+if the determined best stable viewpoint is within
+`snap_center_max_distance_percent` of the frame's center, the camera will be
+shifted to be locked to the center of the frame. This setting is useful for
+videos where the camera operator did a good job already centering content or if
+titles and logos are expected to appear in the center of the frame. It may be
+less useful on raw content where objects are not already well positioned on
+screen.
+
+### Visualization to Facilitate Debugging
+
+`SceneCroppingCalculator` provides two extra output streams
+`KEY_FRAME_CROP_REGION_VIZ_FRAMES` and `SALIENT_POINT_FRAME_VIZ_FRAMES` to
+visualize the cropping window as well as salient points detected on each frame.
+You could modify the `SceneCroppingCalculator` node like below to enable these
+two output streams.
+
+```bash
+node {
+  calculator: "SceneCroppingCalculator"
+  input_side_packet: "EXTERNAL_ASPECT_RATIO:aspect_ratio"
+  input_stream: "VIDEO_FRAMES:video_raw"
+  input_stream: "KEY_FRAMES:video_frames_scaled_downsampled"
+  input_stream: "DETECTION_FEATURES:salient_regions"
+  input_stream: "STATIC_FEATURES:borders"
+  input_stream: "SHOT_BOUNDARIES:shot_change"
+  output_stream: "CROPPED_FRAMES:cropped_frames"
+  output_stream: "KEY_FRAME_CROP_REGION_VIZ_FRAMES:key_frame_crop_viz_frames"
+  output_stream: "SALIENT_POINT_FRAME_VIZ_FRAMES:salient_point_viz_frames"
+  node_options: {
+    [type.googleapis.com/mediapipe.autoflip.SceneCroppingCalculatorOptions]: {
+      max_scene_size: 600
+      key_frame_crop_options: {
+        score_aggregation_type: CONSTANT
+      }
+      scene_camera_motion_analyzer_options: {
+        motion_stabilization_threshold_percent: 0.5
+        salient_point_bound: 0.499
+      }
+      padding_parameters: {
+        blur_cv_size: 200
+        overlay_opacity: 0.6
+      }
+      target_size_type: MAXIMIZE_TARGET_DIMENSION
+    }
+  }
+}
+```
diff --git a/docs/solutions/box_tracking.md b/docs/solutions/box_tracking.md
new file mode 100644
index 000000000..84da8565d
--- /dev/null
+++ b/docs/solutions/box_tracking.md
@@ -0,0 +1,146 @@
+---
+layout: default
+title: Box Tracking
+parent: Solutions
+nav_order: 6
+---
+
+# MediaPipe Box Tracking
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+## Overview
+
+MediaPipe Box Tracking has been powering real-time tracking in
+[Motion Stills](https://ai.googleblog.com/2016/12/get-moving-with-new-motion-stills.html),
+[YouTube's privacy blur](https://youtube-creators.googleblog.com/2016/02/blur-moving-objects-in-your-video-with.html),
+and [Google Lens](https://lens.google.com/) for several years, leveraging
+classic computer vision approaches.
+
+The box tracking solution consumes image frames from a video or camera stream,
+and starting box positions with timestamps, indicating 2D regions of interest to
+track, and computes the tracked box positions for each frame. In this specific
+use case, the starting box positions come from object detection, but the
+starting position can also be provided manually by the user or another system.
+Our solution consists of three main components: a motion analysis component, a
+flow packager component, and a box tracking component. Each component is
+encapsulated as a MediaPipe calculator, and the box tracking solution as a whole
+is represented as a MediaPipe
+[subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/subgraphs/box_tracking_gpu.pbtxt).
+
+Note: To visualize a graph, copy the graph and paste it into
+[MediaPipe Visualizer](https://viz.mediapipe.dev/).
+
+In the
+[box tracking subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/subgraphs/box_tracking_gpu.pbtxt),
+the MotionAnalysis calculator extracts features (e.g. high-gradient corners)
+across the image, tracks those features over time, classifies them into
+foreground and background features, and estimates both local motion vectors and
+the global motion model. The FlowPackager calculator packs the estimated motion
+metadata into an efficient format. The BoxTracker calculator takes this motion
+metadata from the FlowPackager calculator and the position of starting boxes,
+and tracks the boxes over time. Using solely the motion data (without the need
+for the RGB frames) produced by the MotionAnalysis calculator, the BoxTracker
+calculator tracks individual objects or regions while discriminating from
+others. Please see
+[Object Detection and Tracking using MediaPipe](https://developers.googleblog.com/2019/12/object-detection-and-tracking-using-mediapipe.html)
+in Google Developers Blog for more details.
+
+An advantage of our architecture is that by separating motion analysis into a
+dedicated MediaPipe calculator and tracking features over the whole image, we
+enable great flexibility and constant computation independent of the number of
+regions tracked! By not having to rely on the RGB frames during tracking, our
+tracking solution provides the flexibility to cache the metadata across a batch
+of frames. Caching enables tracking of regions both backwards and forwards in
+time, or even syncing directly to a specified timestamp for tracking with random
+access.
+
+## Object Detection and Tracking
+
+MediaPipe Box Tracking can be paired with ML inference, resulting in valuable
+and efficient pipelines. For instance, box tracking can be paired with ML-based
+object detection to create an object detection and tracking pipeline. With
+tracking, this pipeline offers several advantages over running detection per
+frame (e.g., [MediaPipe Object Detection](./object_detection.md)):
+
+*   It provides instance based tracking, i.e. the object ID is maintained across
+    frames.
+*   Detection does not have to run every frame. This enables running heavier
+    detection models that are more accurate while keeping the pipeline
+    lightweight and real-time on mobile devices.
+*   Object localization is temporally consistent with the help of tracking,
+    meaning less jitter is observable across frames.
+
+![object_tracking_android_gpu.gif](../images/mobile/object_tracking_android_gpu.gif) |
+:----------------------------------------------------------------------------------: |
+*Fig 1. Box tracking paired with ML-based object detection.*                         |
+
+The object detection and tracking pipeline can be implemented as a MediaPipe
+[graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/object_detection_tracking_mobile_gpu.pbtxt),
+which internally utilizes an
+[object detection subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/subgraphs/object_detection_gpu.pbtxt),
+an
+[object tracking subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/subgraphs/object_tracking_gpu.pbtxt),
+and a
+[renderer subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/subgraphs/renderer_gpu.pbtxt).
+
+In general, the object detection subgraph (which performs ML model inference
+internally) runs only upon request, e.g. at an arbitrary frame rate or triggered
+by specific signals. More specifically, in this particular
+[graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/object_detection_tracking_mobile_gpu.pbtxt)
+a PacketResampler calculator temporally subsamples the incoming video frames to
+0.5 fps before they are passed into the object detection subgraph. This frame
+rate can be configured differently as an option in PacketResampler.
+
+The object tracking subgraph runs in real-time on every incoming frame to track
+the detected objects. It expands the
+[box tracking subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/subgraphs/box_tracking_gpu.pbtxt)
+with additional functionality: when new detections arrive it uses IoU
+(Intersection over Union) to associate the current tracked objects/boxes with
+new detections to remove obsolete or duplicated boxes.
+
+## Example Apps
+
+Please first see general instructions for
+[Android](../getting_started/building_examples.md#android), [iOS](../getting_started/building_examples.md#ios)
+and [desktop](../getting_started/building_examples.md#desktop) on how to build MediaPipe
+examples.
+
+Note: To visualize a graph, copy the graph and paste it into
+[MediaPipe Visualizer](https://viz.mediapipe.dev/). For more information on how
+to visualize its associated subgraphs, please see
+[visualizer documentation](../tools/visualizer.md).
+
+### Mobile
+
+Note: Object detection is using TensorFlow Lite on GPU while tracking is on CPU.
+
+*   Graph:
+    [`mediapipe/graphs/tracking/object_detection_tracking_mobile_gpu.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/object_detection_tracking_mobile_gpu.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1UXL9jX4Wpp34TsiVogugV3J3T9_C5UK-)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/objecttrackinggpu:objecttrackinggpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objecttrackinggpu/BUILD)
+*   iOS target: Not available
+
+### Desktop
+
+*   Running on CPU (both for object detection using TensorFlow Lite and
+    tracking):
+    *   Graph:
+        [`mediapipe/graphs/tracking/object_detection_tracking_desktop_live.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/object_detection_tracking_desktop_live.pbtxt)
+    *   Target:
+        [`mediapipe/examples/desktop/object_tracking:object_tracking_cpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/object_tracking/BUILD)
+*   Running on GPU: Not available
+
+## Resources
+
+*   Google Developers Blog:
+    [Object Detection and Tracking using MediaPipe](https://developers.googleblog.com/2019/12/object-detection-and-tracking-using-mediapipe.html)
+*   Google AI Blog:
+    [Get moving with the new Motion Stills](https://ai.googleblog.com/2016/12/get-moving-with-new-motion-stills.html)
+*   YouTube Creator Blog: [Blur moving objects in your video with the new Custom
+    blurring tool on
+    YouTube](https://youtube-creators.googleblog.com/2016/02/blur-moving-objects-in-your-video-with.html)
diff --git a/docs/solutions/face_detection.md b/docs/solutions/face_detection.md
new file mode 100644
index 000000000..a8e844df4
--- /dev/null
+++ b/docs/solutions/face_detection.md
@@ -0,0 +1,110 @@
+---
+layout: default
+title: Face Detection
+parent: Solutions
+nav_order: 1
+---
+
+# MediaPipe Face Detection
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+## Overview
+
+MediaPipe Face Detection is an ultrafast face detection solution that comes with
+6 landmarks and multi-face support. It is based on
+[BlazeFace](https://arxiv.org/abs/1907.05047), a lightweight and well-performing
+face detector tailored for mobile GPU inference. The detector's super-realtime
+performance enables it to be applied to any live viewfinder experience that
+requires an accurate facial region of interest as an input for other
+task-specific models, such as 3D facial keypoint or geometry estimation (e.g.,
+[MediaPipe Face Mesh](./face_mesh.md)), facial features or expression
+classification, and face region segmentation. BlazeFace uses a lightweight
+feature extraction network inspired by, but distinct from
+[MobileNetV1/V2](https://ai.googleblog.com/2018/04/mobilenetv2-next-generation-of-on.html),
+a GPU-friendly anchor scheme modified from
+[Single Shot MultiBox Detector (SSD)](https://arxiv.org/abs/1512.02325), and an
+improved tie resolution strategy alternative to non-maximum suppression. For
+more information about BlazeFace, please see the [Resources](#resources)
+section.
+
+![face_detection_android_gpu.gif](../images/mobile/face_detection_android_gpu.gif)
+
+## Example Apps
+
+Please first see general instructions for
+[Android](../getting_started/building_examples.md#android), [iOS](../getting_started/building_examples.md#ios)
+and [desktop](../getting_started/building_examples.md#desktop) on how to build MediaPipe
+examples.
+
+Note: To visualize a graph, copy the graph and paste it into
+[MediaPipe Visualizer](https://viz.mediapipe.dev/). For more information on how
+to visualize its associated subgraphs, please see
+[visualizer documentation](../visualizer.md).
+
+### Mobile
+
+#### GPU Pipeline
+
+*   Graph:
+    [`mediapipe/graphs/face_detection/face_detection_mobile_gpu.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_detection/face_detection_mobile_gpu.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1DZTCy1gp238kkMnu4fUkwI3IrF77Mhy5)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectiongpu:facedetectiongpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectiongpu/BUILD)
+*   iOS target:
+    [`mediapipe/examples/ios/facedetectiongpu:FaceDetectionGpuApp`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/facedetectiongpu/BUILD)
+
+#### CPU Pipeline
+
+This is very similar to the [GPU pipeline](#gpu-pipeline) except that at the
+beginning and the end of the pipeline it performs GPU-to-CPU and CPU-to-GPU
+image transfer respectively. As a result, the rest of the graph, which shares the
+same configuration as the GPU pipeline, runs entirely on CPU.
+
+*   Graph:
+    [`mediapipe/graphs/face_detection/face_detection_mobile_cpu.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_detection/face_detection_mobile_cpu.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1npiZY47jbO5m2YaL63o5QoCQs40JC6C7)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectioncpu:facedetectioncpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectioncpu/BUILD)
+*   iOS target:
+    [`mediapipe/examples/ios/facedetectioncpu:FaceDetectionCpuApp`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/facedetectioncpu/BUILD)
+
+### Desktop
+
+*   Running on CPU:
+    *   Graph:
+        [`mediapipe/graphs/face_detection/face_detection_desktop_live.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_detection/face_detection_desktop_live.pbtxt)
+    *   Target:
+        [`mediapipe/examples/desktop/face_detection:face_detection_cpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/face_detection/BUILD)
+*   Running on GPU
+    *   Graph:
+        [`mediapipe/graphs/face_detection/face_detection_mobile_gpu.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_detection/face_detection_mobile_gpu.pbtxt)
+    *   Target:
+        [`mediapipe/examples/desktop/face_detection:face_detection_gpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/face_detection/BUILD)
+
+### Web
+
+Please refer to [these instructions](../index.md#mediapipe-on-the-web).
+
+### Coral
+
+Please refer to
+[these instructions](https://github.com/google/mediapipe/tree/master/mediapipe/examples/coral/README.md)
+to cross-compile and run MediaPipe examples on the
+[Coral Dev Board](https://coral.ai/products/dev-board).
+
+## Resources
+
+*   Paper:
+    [BlazeFace: Sub-millisecond Neural Face Detection on Mobile GPUs](https://arxiv.org/abs/1907.05047)
+    ([presentation](https://docs.google.com/presentation/d/1YCtASfnYyZtH-41QvnW5iZxELFnf0MF-pPWSLGj8yjQ/present?slide=id.g5bc8aeffdd_1_0))
+    ([poster](https://drive.google.com/file/d/1u6aB6wxDY7X2TmeUUKgFydulNtXkb3pu/view))
+*   For front-facing/selfie camera:
+    [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/face_detection_front.tflite),
+    [TFLite model quantized for EdgeTPU/Coral](https://github.com/google/mediapipe/tree/master/mediapipe/examples/coral/models/face-detector-quantized_edgetpu.tflite)
+*   For back-facing camera:
+    [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/face_detection_back.tflite)
+*   [Model card](https://drive.google.com/file/d/1f39lSzU5Oq-j_OXgS67KfN5wNsoeAZ4V/view)
diff --git a/docs/solutions/face_mesh.md b/docs/solutions/face_mesh.md
new file mode 100644
index 000000000..17b7b9d16
--- /dev/null
+++ b/docs/solutions/face_mesh.md
@@ -0,0 +1,160 @@
+---
+layout: default
+title: Face Mesh
+parent: Solutions
+nav_order: 2
+---
+
+# MediaPipe Face Mesh
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+## Overview
+
+MediaPipe Face Mesh is a face geometry solution that estimates 468 3D face
+landmarks in real-time even on mobile devices. It employs machine learning (ML)
+to infer the 3D surface geometry, requiring only a single camera input without
+the need for a dedicated depth sensor. Utilizing lightweight model architectures
+together with GPU acceleration throughout the pipeline, the solution delivers
+real-time performance critical for live experiences. The core of the solution is
+the same as what powers
+[YouTube Stories](https://youtube-creators.googleblog.com/2018/11/introducing-more-ways-to-share-your.html)'
+creator effects, the
+[Augmented Faces API in ARCore](https://developers.google.com/ar/develop/java/augmented-faces/)
+and the
+[ML Kit Face Contour Detection API](https://firebase.google.com/docs/ml-kit/face-detection-concepts#contours).
+
+![face_mesh_ar_effects.gif](../images/face_mesh_ar_effects.gif) |
+:-------------------------------------------------------------: |
+*Fig 1. AR effects utilizing facial surface geometry.*          |
+
+## ML Pipeline
+
+Our ML pipeline consists of two real-time deep neural network models that work
+together: A detector that operates on the full image and computes face locations
+and a 3D face landmark model that operates on those locations and predicts the
+approximate surface geometry via regression. Having the face accurately cropped
+drastically reduces the need for common data augmentations like affine
+transformations consisting of rotations, translation and scale changes. Instead
+it allows the network to dedicate most of its capacity towards coordinate
+prediction accuracy. In addition, in our pipeline the crops can also be
+generated based on the face landmarks identified in the previous frame, and only
+when the landmark model could no longer identify face presence is the face
+detector invoked to relocalize the face. This strategy is similar to that
+employed in our [MediaPipe Hand](./hand.md) solution, which uses a palm detector
+together with a hand landmark model.
+
+The pipeline is implemented as a MediaPipe
+[graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_mesh/face_mesh_mobile.pbtxt)
+that uses a
+[face landmark subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/modules/face_landmark/face_landmark_front_gpu.pbtxt)
+from the
+[face landmark module](https://github.com/google/mediapipe/tree/master/mediapipe/modules/face_landmark),
+and renders using a dedicated
+[face renderer subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_mesh/subgraphs/face_renderer_gpu.pbtxt).
+The
+[face landmark subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/modules/face_landmark/face_landmark_front_gpu.pbtxt)
+internally uses a
+[face detection subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/modules/face_detection/face_detection_front_gpu.pbtxt)
+from the
+[face detection module](https://github.com/google/mediapipe/tree/master/mediapipe/modules/face_detection).
+
+Note: To visualize a graph, copy the graph and paste it into
+[MediaPipe Visualizer](https://viz.mediapipe.dev/). For more information on how
+to visualize its associated subgraphs, please see
+[visualizer documentation](../visualizer.md).
+
+## Models
+
+### Face Detection Model
+
+The face detector is the same [BlazeFace](https://arxiv.org/abs/1907.05047)
+model used in [MediaPipe Face Detection](./face_detection.md). Please refer to
+[MediaPipe Face Detection](./face_detection.md) for details.
+
+### Face Landmark Model
+
+For 3D face landmarks we employed transfer learning and trained a network with
+several objectives: the network simultaneously predicts 3D landmark coordinates
+on synthetic rendered data and 2D semantic contours on annotated real-world
+data. The resulting network provided us with reasonable 3D landmark predictions
+not just on synthetic but also on real-world data.
+
+The 3D landmark network receives as input a cropped video frame without
+additional depth input. The model outputs the positions of the 3D points, as
+well as the probability of a face being present and reasonably aligned in the
+input. A common alternative approach is to predict a 2D heatmap for each
+landmark, but it is not amenable to depth prediction and has high computational
+costs for so many points. We further improve the accuracy and robustness of our
+model by iteratively bootstrapping and refining predictions. That way we can
+grow our dataset to increasingly challenging cases, such as grimaces, oblique
+angle and occlusions.
+
+You can find more information about the face landmark model in this
+[paper](https://arxiv.org/abs/1907.06724).
+
+![face_mesh_android_gpu.gif](../images/mobile/face_mesh_android_gpu.gif)   |
+:------------------------------------------------------------------------: |
+*Fig 2. Output of MediaPipe Face Mesh: the red box indicates the cropped area as input to the landmark model, the red dots represent the 468 landmarks in 3D, and the green lines connecting landmarks illustrate the contours around the eyes, eyebrows, lips and the entire face.* |
+
+## Example Apps
+
+Please first see general instructions for
+[Android](../getting_started/building_examples.md#android), [iOS](../getting_started/building_examples.md#ios) and
+[desktop](../getting_started/building_examples.md#desktop) on how to build MediaPipe examples.
+
+Note: To visualize a graph, copy the graph and paste it into
+[MediaPipe Visualizer](https://viz.mediapipe.dev/). For more information on how
+to visualize its associated subgraphs, please see
+[visualizer documentation](../visualizer.md).
+
+### Mobile
+
+*   Graph:
+    [`mediapipe/graphs/face_mesh/face_mesh_mobile.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_mesh/face_mesh_mobile.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1pUmd7CXCL_onYMbsZo5p91cH0oNnR4gi)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/facemeshgpu:facemeshgpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facemeshgpu/BUILD)
+*   iOS target:
+    [`mediapipe/examples/ios/facemeshgpu:FaceMeshGpuApp`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/facemeshgpu/BUILD)
+
+Tip: Maximum number of faces to detect/process is set to 1 by default. To change
+it, for Android modify `NUM_FACES` in
+[MainActivity.java](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facemeshgpu/MainActivity.java),
+and for iOS modify `kNumFaces` in
+[ViewController.mm](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/facemeshgpu/ViewController.mm).
+
+### Desktop
+
+*   Running on CPU
+    *   Graph:
+        [`mediapipe/graphs/face_mesh/face_mesh_desktop_live.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_mesh/face_mesh_desktop_live.pbtxt)
+    *   Target:
+        [`mediapipe/examples/desktop/face_mesh:face_mesh_cpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/face_mesh/BUILD)
+*   Running on GPU
+    *   Graph:
+        [`mediapipe/graphs/face_mesh/face_mesh_desktop_live_gpu.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_mesh/face_mesh_desktop_live_gpu.pbtxt)
+    *   Target:
+        [`mediapipe/examples/desktop/face_mesh:face_mesh_gpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/face_mesh/BUILD)
+
+Tip: Maximum number of faces to detect/process is set to 1 by default. To change
+it, in the graph file modify the option of `ConstantSidePacketCalculator`.
+
+## Resources
+
+*   Google AI Blog:
+    [Real-Time AR Self-Expression with Machine Learning](https://ai.googleblog.com/2019/03/real-time-ar-self-expression-with.html)
+*   TensorFlow Blog:
+    [Face and hand tracking in the browser with MediaPipe and TensorFlow.js](https://blog.tensorflow.org/2020/03/face-and-hand-tracking-in-browser-with-mediapipe-and-tensorflowjs.html)
+*   Paper:
+    [Real-time Facial Surface Geometry from Monocular Video on Mobile GPUs](https://arxiv.org/abs/1907.06724)
+    ([poster](https://docs.google.com/presentation/d/1-LWwOMO9TzEVdrZ1CS1ndJzciRHfYDJfbSxH_ke_JRg/present?slide=id.g5986dd4b4c_4_212))
+*   Face detection model:
+    [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/face_detection_front.tflite)
+*   Face landmark model:
+    [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/face_landmark.tflite),
+    [TF.js model](https://tfhub.dev/mediapipe/facemesh/1)
+*   [Model card](https://drive.google.com/file/d/1VFC_wIpw4O7xBOiTgUldl79d9LA-LsnA/view)
diff --git a/docs/solutions/hair_segmentation.md b/docs/solutions/hair_segmentation.md
new file mode 100644
index 000000000..87361040a
--- /dev/null
+++ b/docs/solutions/hair_segmentation.md
@@ -0,0 +1,58 @@
+---
+layout: default
+title: Hair Segmentation
+parent: Solutions
+nav_order: 4
+---
+
+# MediaPipe Hair Segmentation
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+![hair_segmentation_android_gpu.gif](../images/mobile/hair_segmentation_android_gpu.gif)
+
+## Example Apps
+
+Please first see general instructions for
+[Android](../getting_started/building_examples.md#android), [iOS](../getting_started/building_examples.md#ios)
+and [desktop](../getting_started/building_examples.md#desktop) on how to build MediaPipe
+examples.
+
+Note: To visualize a graph, copy the graph and paste it into
+[MediaPipe Visualizer](https://viz.mediapipe.dev/). For more information on how
+to visualize its associated subgraphs, please see
+[visualizer documentation](../visualizer.md).
+
+### Mobile
+
+*   Graph:
+    [`mediapipe/graphs/hair_segmentation/hair_segmentation_mobile_gpu.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hair_segmentation/hair_segmentation_mobile_gpu.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1mmLtyL8IRfCUbqqu0-E-Hgjr_e6P3XAy)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/hairsegmentationgpu:hairsegmentationgpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/hairsegmentationgpu/BUILD)
+*   iOS target: Not available
+
+### Desktop
+
+*   Running on CPU: Not available
+*   Running on GPU
+    *   Graph:
+        [`mediapipe/graphs/hair_segmentation/hair_segmentation_mobile_gpu.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hair_segmentation/hair_segmentation_mobile_gpu.pbtxt)
+    *   Target:
+        [`mediapipe/examples/desktop/hair_segmentation:hair_segmentation_gpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/hair_segmentation/BUILD)
+
+### Web
+
+Please refer to [these instructions](../index.md#mediapipe-on-the-web).
+
+## Resources
+
+*   Paper:
+    [Real-time Hair segmentation and recoloring on Mobile GPUs](https://arxiv.org/abs/1907.06740)
+    ([presentation](https://drive.google.com/file/d/1C8WYlWdDRNtU1_pYBvkkG5Z5wqYqf0yj/view))
+    ([supplementary video](https://drive.google.com/file/d/1LPtM99Ch2ogyXYbDNpEqnUfhFq0TfLuf/view))
+*   [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/hair_segmentation.tflite)
+*   [Model card](https://drive.google.com/file/d/1lPwJ8BD_-3UUor4LayQ0xpa_RIC_hoRh/view)
diff --git a/docs/solutions/hand.md b/docs/solutions/hand.md
new file mode 100644
index 000000000..bef5e220e
--- /dev/null
+++ b/docs/solutions/hand.md
@@ -0,0 +1,231 @@
+---
+layout: default
+title: Hand
+parent: Solutions
+nav_order: 3
+---
+
+# MediaPipe Hand
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+## Overview
+
+The ability to perceive the shape and motion of hands can be a vital component
+in improving the user experience across a variety of technological domains and
+platforms. For example, it can form the basis for sign language understanding
+and hand gesture control, and can also enable the overlay of digital content and
+information on top of the physical world in augmented reality. While coming
+naturally to people, robust real-time hand perception is a decidedly challenging
+computer vision task, as hands often occlude themselves or each other (e.g.
+finger/palm occlusions and handshakes) and lack high contrast patterns.
+
+MediaPipe Hand is a high-fidelity hand and finger tracking solution. It employs
+machine learning (ML) to infer 21 3D landmarks of a hand from just a single
+frame. Whereas current state-of-the-art approaches rely primarily on powerful
+desktop environments for inference, our method achieves real-time performance on
+a mobile phone, and even scales to multiple hands. We hope that providing this
+hand perception functionality to the wider research and development community
+will result in an emergence of creative use cases, stimulating new applications
+and new research avenues.
+
+![hand_tracking_3d_android_gpu.gif](../images/mobile/hand_tracking_3d_android_gpu.gif) |
+:------------------------------------------------------------------------------------: |
+*Fig 1. Tracked 3D hand landmarks are represented by dots in different shades, with the brighter ones denoting landmarks closer to the camera.* |
+
+## ML Pipeline
+
+MediaPipe Hand utilizes an ML pipeline consisting of multiple models working
+together: A palm detection model that operates on the full image and returns an
+oriented hand bounding box. A hand landmark model that operates on the cropped
+image region defined by the palm detector and returns high-fidelity 3D hand
+keypoints. This strategy is similar to that employed in our
+[MediaPipe Face Mesh](./face_mesh.md) solution, which uses a face detector
+together with a face landmark model.
+
+Providing the accurately cropped hand image to the hand landmark model
+drastically reduces the need for data augmentation (e.g. rotations, translation
+and scale) and instead allows the network to dedicate most of its capacity
+towards coordinate prediction accuracy. In addition, in our pipeline the crops
+can also be generated based on the hand landmarks identified in the previous
+frame, and only when the landmark model could no longer identify hand presence
+is palm detection invoked to relocalize the hand.
+
+The pipeline is implemented as a MediaPipe
+[graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/hand_tracking_mobile.pbtxt),
+which internally utilizes a
+[palm/hand detection subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/subgraphs/hand_detection_gpu.pbtxt),
+a
+[hand landmark subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/subgraphs/hand_landmark_gpu.pbtxt)
+and a
+[renderer subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/subgraphs/renderer_gpu.pbtxt).
+
+Note: To visualize a graph, copy the graph and paste it into
+[MediaPipe Visualizer](https://viz.mediapipe.dev/). For more information on how
+to visualize its associated subgraphs, please see
+[visualizer documentation](../visualizer.md).
+
+## Models
+
+### Palm Detection Model
+
+To detect initial hand locations, we designed a
+[single-shot detector](https://arxiv.org/abs/1512.02325) model optimized for
+mobile real-time uses in a manner similar to the face detection model in
+[MediaPipe Face Mesh](./face_mesh.md). Detecting hands is a decidedly complex
+task: our
+[model](https://github.com/google/mediapipe/tree/master/mediapipe/models/palm_detection.tflite) has
+to work across a variety of hand sizes with a large scale span (~20x) relative
+to the image frame and be able to detect occluded and self-occluded hands.
+Whereas faces have high contrast patterns, e.g., in the eye and mouth region,
+the lack of such features in hands makes it comparatively difficult to detect
+them reliably from their visual features alone. Instead, providing additional
+context, like arm, body, or person features, aids accurate hand localization.
+
+Our method addresses the above challenges using different strategies. First, we
+train a palm detector instead of a hand detector, since estimating bounding
+boxes of rigid objects like palms and fists is significantly simpler than
+detecting hands with articulated fingers. In addition, as palms are smaller
+objects, the non-maximum suppression algorithm works well even for two-hand
+self-occlusion cases, like handshakes. Moreover, palms can be modelled using
+square bounding boxes (anchors in ML terminology) ignoring other aspect ratios,
+and therefore reducing the number of anchors by a factor of 3-5. Second, an
+encoder-decoder feature extractor is used for bigger scene context awareness
+even for small objects (similar to the RetinaNet approach). Lastly, we minimize
+the focal loss during training to support a large number of anchors resulting
+from the high scale variance.
+
+With the above techniques, we achieve an average precision of 95.7% in palm
+detection. Using a regular cross entropy loss and no decoder gives a baseline of
+just 86.22%.
+
+### Hand Landmark Model
+
+After the palm detection over the whole image our subsequent hand landmark
+[model](https://github.com/google/mediapipe/tree/master/mediapipe/models/hand_landmark.tflite)
+performs precise keypoint localization of 21 3D hand-knuckle coordinates inside
+the detected hand regions via regression, that is direct coordinate prediction.
+The model learns a consistent internal hand pose representation and is robust
+even to partially visible hands and self-occlusions.
+
+To obtain ground truth data, we have manually annotated ~30K real-world images
+with 21 3D coordinates, as shown below (we take Z-value from image depth map, if
+it exists per corresponding coordinate). To better cover the possible hand poses
+and provide additional supervision on the nature of hand geometry, we also
+render a high-quality synthetic hand model over various backgrounds and map it
+to the corresponding 3D coordinates.
+
+| ![hand_crops.png](../images/mobile/hand_crops.png)                          |
+| :-------------------------------------------------------------------------: |
+| *Fig 2. Top: Aligned hand crops passed to the tracking network with ground truth annotation. Bottom: Rendered synthetic hand images with ground truth annotation.* |
+
+## Example Apps
+
+Please first see general instructions for
+[Android](../getting_started/building_examples.md#android), [iOS](../getting_started/building_examples.md#ios)
+and [desktop](../getting_started/building_examples.md#desktop) on how to build MediaPipe
+examples.
+
+Note: To visualize a graph, copy the graph and paste it into
+[MediaPipe Visualizer](https://viz.mediapipe.dev/). For more information on how
+to visualize its associated subgraphs, please see
+[visualizer documentation](../visualizer.md).
+
+### Mobile
+
+#### Main Example
+
+*   Graph:
+    [`mediapipe/graphs/hand_tracking/hand_tracking_mobile.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/hand_tracking_mobile.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1uCjS0y0O0dTDItsMh8x2cf4-l3uHW1vE)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/handtrackinggpu:handtrackinggpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handtrackinggpu/BUILD)
+*   iOS target:
+    [`mediapipe/examples/ios/handtrackinggpu:HandTrackingGpuApp`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/handtrackinggpu/BUILD)
+
+#### With Multi-hand Support
+
+*   Graph:
+    [`mediapipe/graphs/hand_tracking/multi_hand_tracking_mobile.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/multi_hand_tracking_mobile.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1Wk6V9EVaz1ks_MInPqqVGvvJD01SGXDc)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/multihandtrackinggpu:multihandtrackinggpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/multihandtrackinggpu/BUILD)
+*   iOS target:
+    [`mediapipe/examples/ios/multihandtrackinggpu:MultiHandTrackingGpuApp`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/multihandtrackinggpu/BUILD)
+
+There are two key differences between this graph and that in the
+[main example](#main-example) (which handles only one hand):
+
+1.  There is a `NormalizedRectVectorHasMinSize` calculator that checks if the
+    input vector of `NormalizedRect` objects has a minimum size equal to `N`. In
+    this graph, if the vector contains fewer than `N` objects,
+    `MultiHandDetection` subgraph runs. Otherwise, the `GateCalculator` doesn't
+    send any image packets to the `MultiHandDetection` subgraph. This way, the
+    main graph is efficient in that it avoids running the costly hand detection
+    step when there are already `N` hands in the frame.
+2.  The `MergeCalculator` has been replaced by the `AssociationNormRect`
+    calculator. This `AssociationNormRect` takes as input a vector of
+    `NormalizedRect` objects from the `MultiHandDetection` subgraph on the
+    current frame, and a vector of `NormalizedRect` objects from the
+    `MultiHandLandmark` subgraph from the previous frame, and performs an
+    association operation between these objects. This calculator ensures that
+    the output vector doesn't contain overlapping regions based on the specified
+    `min_similarity_threshold`.
+
+#### Palm/Hand Detection Only (no landmarks)
+
+*   Graph:
+    [`mediapipe/graphs/hand_tracking/hand_detection_mobile.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/hand_detection_mobile.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1qUlTtH7Ydg-wl_H6VVL8vueu2UCTu37E)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/handdetectiongpu:handdetectiongpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handdetectiongpu/BUILD)
+*   iOS target:
+    [`mediapipe/examples/ios/handdetectiongpu:HandDetectionGpuApp`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/handdetectiongpu/BUILD)
+
+### Desktop
+
+#### Main Example
+
+*   Running on CPU
+    *   Graph:
+        [`mediapipe/graphs/hand_tracking/hand_tracking_desktop_live.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/hand_tracking_desktop_live.pbtxt)
+    *   Target:
+        [`mediapipe/examples/desktop/hand_tracking:hand_tracking_cpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/hand_tracking/BUILD)
+*   Running on GPU
+    *   Graph:
+        [`mediapipe/graphs/hand_tracking/hand_tracking_mobile.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/hand_tracking_mobile.pbtxt)
+    *   Target:
+        [`mediapipe/examples/desktop/hand_tracking:hand_tracking_gpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/hand_tracking/BUILD)
+
+#### With Multi-hand Support
+
+*   Running on CPU
+    *   Graph:
+        [`mediapipe/graphs/hand_tracking/multi_hand_tracking_desktop_live.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/multi_hand_tracking_desktop_live.pbtxt)
+    *   Target:
+        [`mediapipe/examples/desktop/multi_hand_tracking:multi_hand_tracking_cpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/multi_hand_tracking/BUILD)
+*   Running on GPU
+    *   Graph:
+        [`mediapipe/graphs/hand_tracking/multi_hand_tracking_mobile.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/multi_hand_tracking_mobile.pbtxt)
+    *   Target:
+        [`mediapipe/examples/desktop/multi_hand_tracking:multi_hand_tracking_gpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/multi_hand_tracking/BUILD)
+
+### Web
+
+Please refer to [these instructions](../index.md#mediapipe-on-the-web).
+
+## Resources
+
+*   Google AI Blog: [On-Device, Real-Time Hand Tracking with MediaPipe](https://ai.googleblog.com/2019/08/on-device-real-time-hand-tracking-with.html)
+*   TensorFlow Blog: [Face and hand tracking in the browser with MediaPipe and
+    TensorFlow.js](https://blog.tensorflow.org/2020/03/face-and-hand-tracking-in-browser-with-mediapipe-and-tensorflowjs.html)
+*   Palm detection model:
+    [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/palm_detection.tflite),
+    [TF.js model](https://tfhub.dev/mediapipe/handdetector/1)
+*   Hand landmark model:
+    [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/hand_landmark.tflite),
+    [TF.js model](https://tfhub.dev/mediapipe/handskeleton/1)
+*   [Model card](https://mediapipe.page.link/handmc)
diff --git a/docs/solutions/knift.md b/docs/solutions/knift.md
new file mode 100644
index 000000000..ec2eec154
--- /dev/null
+++ b/docs/solutions/knift.md
@@ -0,0 +1,145 @@
+---
+layout: default
+title: KNIFT (Template-based Feature Matching)
+parent: Solutions
+nav_order: 8
+---
+
+# MediaPipe KNIFT
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+## Overview
+
+MediaPipe KNIFT is a template-based feature matching solution using KNIFT
+(Keypoint Neural Invariant Feature Transform).
+
+![knift_stop_sign.gif](../images/knift_stop_sign.gif)                     |
+:-----------------------------------------------------------------------: |
+*Fig 1. Matching a real Stop Sign with a Stop Sign template using KNIFT.* |
+
+In many computer vision applications, a crucial building block is to establish
+reliable correspondences between different views of an object or scene, forming
+the foundation for approaches like template matching, image retrieval and
+structure from motion. Correspondences are usually computed by extracting
+distinctive view-invariant features such as
+[SIFT](https://en.wikipedia.org/wiki/Scale-invariant_feature_transform) or
+[ORB](https://opencv-python-tutroals.readthedocs.io/en/latest/py_tutorials/py_feature2d/py_orb/py_orb.html#orb-in-opencv)
+from images. The ability to reliably establish such correspondences enables
+applications like image stitching to create panoramas or template matching for
+object recognition in videos.
+
+KNIFT is a general purpose local feature descriptor similar to SIFT or ORB.
+Likewise, KNIFT is also a compact vector representation of local image patches
+that is invariant to uniform scaling, orientation, and illumination changes.
+However, unlike SIFT or ORB, which were engineered with heuristics, KNIFT is an
+[embedding](https://developers.google.com/machine-learning/crash-course/embeddings/video-lecture)
+learned directly from a large number of corresponding local patches extracted
+from nearby video frames. This data driven approach implicitly encodes complex,
+real-world spatial transformations and lighting changes in the embedding. As a
+result, the KNIFT feature descriptor appears to be more robust, not only to
+[affine distortions](https://en.wikipedia.org/wiki/Affine_transformation), but
+to some degree of
+[perspective distortions](https://en.wikipedia.org/wiki/Perspective_distortion_\(photography\))
+as well.
+
+For more information, please see
+[MediaPipe KNIFT: Template-based feature matching](https://developers.googleblog.com/2020/04/mediapipe-knift-template-based-feature-matching.html)
+in Google Developers Blog.
+
+![template_matching_mobile_cpu.gif](../images/mobile/template_matching_android_cpu.gif) |
+:-------------------------------------------------------------------------------------: |
+*Fig 2. Matching US dollar bills using KNIFT.*                                          |
+
+## Example Apps
+
+### Matching US Dollar Bills
+
+In MediaPipe, we've already provided an
+[index file](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_index.pb)
+pre-computed from the 3 template images (of US dollar bills) shown below. If
+you'd like to use your own template images, see
+[Matching Your Own Template Images](#matching-your-own-template-images).
+
+![template_matching_mobile_template.jpg](../images/mobile/template_matching_mobile_template.jpg)
+
+Please first see general instructions for
+[Android](../getting_started/building_examples.md#android) on how to build MediaPipe examples.
+
+Note: To visualize a graph, copy the graph and paste it into
+[MediaPipe Visualizer](https://viz.mediapipe.dev/). For more information on how
+to visualize its associated subgraphs, please see
+[visualizer documentation](../visualizer.md).
+
+*   Graph:
+    [`mediapipe/graphs/template_matching/template_matching_mobile_cpu.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/template_matching/template_matching_mobile_cpu.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1tSWRfes9rAM4NrzmJBplguNQQvaeBZSa)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/templatematchingcpu:templatematchingcpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/templatematchingcpu/BUILD)
+
+Note: MediaPipe uses OpenCV 3 by default. However, because of
+[issues](https://github.com/opencv/opencv/issues/11488) between NDK 17+ and
+OpenCV 3 when using
+[knnMatch](https://docs.opencv.org/3.4/db/d39/classcv_1_1DescriptorMatcher.html#a378f35c9b1a5dfa4022839a45cdf0e89),
+for this example app please use the following commands to temporarily switch to
+OpenCV 4, and switch back to OpenCV 3 afterwards.
+
+```bash
+# Switch to OpenCV 4
+sed -i -e 's:3.4.3/opencv-3.4.3:4.0.1/opencv-4.0.1:g' WORKSPACE
+sed -i -e 's:libopencv_java3:libopencv_java4:g' third_party/opencv_android.BUILD
+
+# Build and install app
+bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/templatematchingcpu
+adb install -r bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/templatematchingcpu/templatematchingcpu.apk
+
+# Switch back to OpenCV 3
+sed -i -e 's:4.0.1/opencv-4.0.1:3.4.3/opencv-3.4.3:g' WORKSPACE
+sed -i -e 's:libopencv_java4:libopencv_java3:g' third_party/opencv_android.BUILD
+```
+
+Tip: The example uses the TFLite
+[XNNPACK delegate](https://github.com/tensorflow/tensorflow/tree/master/tensorflow/lite/delegates/xnnpack)
+by default for faster inference. Users can change the
+[option in TfLiteInferenceCalculator](https://github.com/google/mediapipe/tree/master/mediapipe/calculators/tflite/tflite_inference_calculator.proto)
+to run regular TFLite inference.
+
+### Matching Your Own Template Images
+
+*   Step 1: Put all template images in a single directory.
+
+*   Step 2: To build the index file for all templates in the directory, run
+
+    ```bash
+    bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 \
+    mediapipe/examples/desktop/template_matching:template_matching_tflite
+    ```
+
+    ```bash
+    bazel-bin/mediapipe/examples/desktop/template_matching/template_matching_tflite \
+    --calculator_graph_config_file=mediapipe/graphs/template_matching/index_building.pbtxt \
+    --input_side_packets="file_directory=<template image directory>,file_suffix=png,output_index_filename=<output index filename>"
+    ```
+
+    The output index file includes the extracted KNIFT features.
+
+*   Step 3: Replace
+    [mediapipe/models/knift_index.pb](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_index.pb)
+    with the index file you generated, and update
+    [mediapipe/models/knift_labelmap.txt](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_labelmap.txt)
+    with your own template names.
+
+*   Step 4: Build and run the app using the same instructions in
+    [Matching US Dollar Bills](#matching-us-dollar-bills).
+
+## Resources
+
+*   Google Developers Blog:
+    [MediaPipe KNIFT: Template-based feature matching](https://developers.googleblog.com/2020/04/mediapipe-knift-template-based-feature-matching.html)
+*   [TFLite model for up to 200 keypoints](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_float.tflite)
+*   [TFLite model for up to 400 keypoints](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_float_400.tflite)
+*   [TFLite model for up to 1000 keypoints](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_float_1k.tflite)
+*   [Model card](https://mediapipe.page.link/knift-mc)
diff --git a/mediapipe/docs/media_sequence.md b/docs/solutions/media_sequence.md
similarity index 90%
rename from mediapipe/docs/media_sequence.md
rename to docs/solutions/media_sequence.md
index 10693ea7f..bee6d8951 100644
--- a/mediapipe/docs/media_sequence.md
+++ b/docs/solutions/media_sequence.md
@@ -1,4 +1,18 @@
-## Preparing Data Sets with MediaSequence
+---
+layout: default
+title: Dataset Preparation with MediaSequence
+parent: Solutions
+nav_order: 10
+---
+
+# Dataset Preparation with MediaSequence
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+## Overview
 
 MediaPipe is a useful and general framework for media processing that can
 assist with research, development, and deployment of ML models. This example
@@ -16,7 +30,7 @@ is available about the MediaSequence pipeline, including how to use it to
 process new data sets, in the documentation of
 [MediaSequence](https://github.com/google/mediapipe/tree/master/mediapipe/util/sequence).
 
-### Preparing an example data set
+## Preparing an example data set
 
 1.  Checkout the mediapipe repository
 
@@ -79,15 +93,17 @@ process new data sets, in the documentation of
     ```
 
     and then you can import the data set in Python using
-    [read_demo_dataset.py](mediapipe/examples/desktop/media_sequence/read_demo_dataset.py)
+    [read_demo_dataset.py](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/media_sequence/read_demo_dataset.py)
+
+## Preparing a practical data set
 
-### Preparing a practical data set
 As an example of processing a practical data set, a similar set of commands will
 prepare the [Charades data set](https://allenai.org/plato/charades/). The
 Charades data set is a data set of human action recognition collected with and
 maintained by the Allen Institute for Artificial Intelligence. To follow this
-code lab, you must abide by the [license](https://allenai.org/plato/charades/license.txt)
-for the Charades data set provided by the Allen Institute.
+code lab, you must abide by the
+[license](https://allenai.org/plato/charades/license.txt) for the Charades data
+set provided by the Allen Institute.
 
 The Charades data set is large (~150 GB), and will take considerable time to
 download and process (4-8 hours).
@@ -102,9 +118,10 @@ python -m mediapipe.examples.desktop.media_sequence.charades_dataset \
   --path_to_graph_directory=mediapipe/graphs/media_sequence/
 ```
 
-### Preparing your own data set
-The process for preparing your own data set is described in the [MediaSequence
-documentation](https://github.com/google/mediapipe/tree/master/mediapipe/util/sequence).
+## Preparing your own data set
+
+The process for preparing your own data set is described in the
+[MediaSequence documentation](https://github.com/google/mediapipe/tree/master/mediapipe/util/sequence).
 The Python code for Charades can easily be modified to process most annotations,
 but the MediaPipe processing warrants further discussion. MediaSequence uses
 MediaPipe graphs to extract features related to the metadata or previously
diff --git a/docs/solutions/object_detection.md b/docs/solutions/object_detection.md
new file mode 100644
index 000000000..a92e57e7d
--- /dev/null
+++ b/docs/solutions/object_detection.md
@@ -0,0 +1,150 @@
+---
+layout: default
+title: Object Detection
+parent: Solutions
+nav_order: 5
+---
+
+# MediaPipe Object Detection
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+![object_detection_android_gpu.gif](../images/mobile/object_detection_android_gpu.gif)
+
+## Example Apps
+
+Note: To visualize a graph, copy the graph and paste it into
+[MediaPipe Visualizer](https://viz.mediapipe.dev/). For more information on how
+to visualize its associated subgraphs, please see
+[visualizer documentation](../visualizer.md).
+
+### Mobile
+
+Please first see general instructions for
+[Android](../getting_started/building_examples.md#android) and
+[iOS](../getting_started/building_examples.md#ios) on how to build MediaPipe examples.
+
+#### GPU Pipeline
+
+*   Graph:
+    [`mediapipe/graphs/object_detection/object_detection_mobile_gpu.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_mobile_gpu.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1di2ywCA_acf3y5rIcJHngWHAUNsUHAGz)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectiongpu:objectdetectiongpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectiongpu/BUILD)
+*   iOS target:
+    [`mediapipe/examples/ios/objectdetectiongpu:ObjectDetectionGpuApp`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/objectdetectiongpu/BUILD)
+
+#### CPU Pipeline
+
+This is very similar to the [GPU pipeline](#gpu-pipeline) except that at the
+beginning and the end of the pipeline it performs GPU-to-CPU and CPU-to-GPU
+image transfer respectively. As a result, the rest of the graph, which shares the
+same configuration as the GPU pipeline, runs entirely on CPU.
+
+*   Graph:
+    [`mediapipe/graphs/object_detection/object_detection_mobile_cpu.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_mobile_cpu.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1eRBK6V5Qd1LCRwexitR2OXgrBBXbOfZ5)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectioncpu:objectdetectioncpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectioncpu/BUILD)
+*   iOS target:
+    [`mediapipe/examples/ios/objectdetectioncpu:ObjectDetectionCpuApp`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/objectdetectioncpu/BUILD)
+
+### Desktop
+
+#### Live Camera Input
+
+Please first see general instructions for
+[desktop](../getting_started/building_examples.md#desktop) on how to build MediaPipe examples.
+
+*   Graph:
+    [`mediapipe/graphs/object_detection/object_detection_desktop_live.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_desktop_live.pbtxt)
+*   Target:
+    [`mediapipe/examples/desktop/object_detection:object_detection_cpu`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/object_detection/BUILD)
+
+#### Video File Input
+
+*   With a TFLite Model
+
+    This uses the same
+    [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/ssdlite_object_detection.tflite)
+    (see also
+    [model info](https://github.com/google/mediapipe/tree/master/mediapipe/models/object_detection_saved_model/README.md))
+    as in [Live Camera Input](#live-camera-input) above. The pipeline is
+    implemented in this
+    [graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_desktop_tflite_graph.pbtxt),
+    which differs from the live-camera-input CPU-based pipeline
+    [graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_mobile_cpu.pbtxt)
+    simply by the additional `OpenCvVideoDecoderCalculator` and
+    `OpenCvVideoEncoderCalculator` at the beginning and the end of the graph
+    respectively.
+
+    To build the application, run:
+
+    ```bash
+    bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 mediapipe/examples/desktop/object_detection:object_detection_tflite
+    ```
+
+    To run the application, replace `<input video path>` and `<output video
+    path>` in the command below with your own paths:
+
+    Tip: You can find a test video available in
+    `mediapipe/examples/desktop/object_detection`.
+
+    ```bash
+    GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/object_detection/object_detection_tflite \
+    --calculator_graph_config_file=mediapipe/graphs/object_detection/object_detection_desktop_tflite_graph.pbtxt \
+    --input_side_packets=input_video_path=<input video path>,output_video_path=<output video path>
+    ```
+
+*   With a TensorFlow Model
+
+    This uses the
+    [TensorFlow model](https://github.com/google/mediapipe/tree/master/mediapipe/models/object_detection_saved_model)
+    (see also
+    [model info](https://github.com/google/mediapipe/tree/master/mediapipe/models/object_detection_saved_model/README.md)),
+    and the pipeline is implemented in this
+    [graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_desktop_tensorflow_graph.pbtxt).
+
+    Note: The following runs TensorFlow inference on CPU. If you would like to
+    run inference on GPU (Linux only), please follow
+    [TensorFlow CUDA Support and Setup on Linux Desktop](../getting_started/gpu_support.md#tensorflow-cuda-support-and-setup-on-linux-desktop)
+    instead.
+
+    To build the TensorFlow CPU inference example on desktop, run:
+
+    Note: This command also builds TensorFlow targets from scratch, and it may
+    take a long time (e.g., up to 30 mins) for the first time.
+
+    ```bash
+    bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 --define no_aws_support=true --linkopt=-s \
+    mediapipe/examples/desktop/object_detection:object_detection_tensorflow
+    ```
+
+    To run the application, replace `<input video path>` and `<output video
+    path>` in the command below with your own paths:
+
+    Tip: You can find a test video available in
+    `mediapipe/examples/desktop/object_detection`.
+
+    ```bash
+    GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/object_detection/object_detection_tensorflow \
+    --calculator_graph_config_file=mediapipe/graphs/object_detection/object_detection_desktop_tensorflow_graph.pbtxt \
+    --input_side_packets=input_video_path=<input video path>,output_video_path=<output video path>
+    ```
+
+### Coral
+
+Please refer to
+[these instructions](https://github.com/google/mediapipe/tree/master/mediapipe/examples/coral/README.md)
+to cross-compile and run MediaPipe examples on the
+[Coral Dev Board](https://coral.ai/products/dev-board).
+
+## Resources
+
+*   [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/ssdlite_object_detection.tflite)
+*   [TFLite model quantized for EdgeTPU/Coral](https://github.com/google/mediapipe/tree/master/mediapipe/examples/coral/models/object-detector-quantized_edgetpu.tflite)
+*   [TensorFlow model](https://github.com/google/mediapipe/tree/master/mediapipe/models/object_detection_saved_model)
+*   [Model information](https://github.com/google/mediapipe/tree/master/mediapipe/models/object_detection_saved_model/README.md)
diff --git a/docs/solutions/objectron.md b/docs/solutions/objectron.md
new file mode 100644
index 000000000..083c443c3
--- /dev/null
+++ b/docs/solutions/objectron.md
@@ -0,0 +1,192 @@
+---
+layout: default
+title: Objectron (3D Object Detection)
+parent: Solutions
+nav_order: 7
+---
+
+# MediaPipe Objectron
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+## Overview
+
+MediaPipe Objectron is a mobile real-time 3D object detection solution for
+everyday objects. It detects objects in 2D images, and estimates their poses and
+sizes through a machine learning (ML) model, trained on a newly created 3D
+dataset.
+
+![objectron_shoe_android_gpu.gif](../images/mobile/objectron_shoe_android_gpu.gif) | ![objectron_chair_android_gpu.gif](../images/mobile/objectron_chair_android_gpu.gif)
+:--------------------------------------------------------------------------------: | :----------------------------------------------------------------------------------:
+*Fig 1(a). Objectron for Shoes.*                                                   | *Fig 1(b). Objectron for Chairs.*
+
+Object detection is an extensively studied computer vision problem, but most of
+the research has focused on
+[2D object prediction](https://ai.googleblog.com/2017/06/supercharge-your-computer-vision-models.html).
+While 2D prediction only provides 2D bounding boxes, by extending prediction to
+3D, one can capture an object’s size, position and orientation in the world,
+leading to a variety of applications in robotics, self-driving vehicles, image
+retrieval, and augmented reality. Although 2D object detection is relatively
+mature and has been widely used in the industry, 3D object detection from 2D
+imagery is a challenging problem, due to the lack of data and diversity of
+appearances and shapes of objects within a category.
+
+![objectron_example_results.png](../images/objectron_example_results.png) |
+:-----------------------------------------------------------------------: |
+*Fig 2. Objectron example results.*                                       |
+
+## Obtaining Real-World 3D Training Data
+
+While there are ample amounts of 3D data for street scenes, due to the
+popularity of research into self-driving cars that rely on 3D capture sensors
+like LIDAR, datasets with ground truth 3D annotations for more granular everyday
+objects are extremely limited. To overcome this problem, we developed a novel
+data pipeline using mobile augmented reality (AR) session data. With the arrival
+of [ARCore](https://developers.google.com/ar) and
+[ARKit](https://developer.apple.com/augmented-reality/),
+[hundreds of millions](https://arinsider.co/2019/05/13/arcore-reaches-400-million-devices/)
+of smartphones now have AR capabilities and the ability to capture additional
+information during an AR session, including the camera pose, sparse 3D point
+clouds, estimated lighting, and planar surfaces.
+
+In order to label ground truth data, we built a novel annotation tool for use
+with AR session data, which allows annotators to quickly label 3D bounding boxes
+for objects. This tool uses a split-screen view to display 2D video frames on
+which are overlaid 3D bounding boxes on the left, alongside a view showing 3D
+point clouds, camera positions and detected planes on the right. Annotators draw
+3D bounding boxes in the 3D view, and verify their locations by reviewing the
+projections in 2D video frames. For static objects, we only need to annotate an
+object in a single frame and propagate its location to all frames using the
+ground truth camera pose information from the AR session data, which makes the
+procedure highly efficient.
+
+| ![objectron_data_annotation.gif](../images/objectron_data_annotation.gif)    |
+| :--------------------------------------------------------------------------: |
+| *Fig 3. Real-world data annotation for 3D object detection. (Right) 3D bounding boxes are annotated in the 3D world with detected surfaces and point clouds. (Left) Projections of annotated 3D bounding boxes are overlaid on top of video frames making it easy to validate the annotation.* |
+
+## AR Synthetic Data Generation
+
+A popular approach is to complement real-world data with synthetic data in order
+to increase the accuracy of prediction. However, attempts to do so often yield
+poor, unrealistic data or, in the case of photorealistic rendering, require
+significant effort and compute. Our novel approach, called AR Synthetic Data
+Generation, places virtual objects into scenes that have AR session data, which
+allows us to leverage camera poses, detected planar surfaces, and estimated
+lighting to generate placements that are physically probable and with lighting
+that matches the scene. This approach results in high-quality synthetic data
+with rendered objects that respect the scene geometry and fit seamlessly into
+real backgrounds. By combining real-world data and AR synthetic data, we are
+able to increase the accuracy by about 10%.
+
+![objectron_synthetic_data_generation.gif](../images/objectron_synthetic_data_generation.gif) |
+:-------------------------------------------------------------------------------------------: |
+*Fig 4. An example of AR synthetic data generation. The virtual white-brown cereal box is rendered into the real scene, next to the real blue book.* |
+
+## ML Model for 3D Object Detection
+
+![objectron_network_architecture.png](../images/objectron_network_architecture.png) |
+:---------------------------------------------------------------------------------: |
+*Fig 5. Network architecture and post-processing for 3D object detection.*          |
+
+We [built a single-stage model](https://arxiv.org/abs/2003.03522) to predict the
+pose and physical size of an object from a single RGB image. The model backbone
+has an encoder-decoder architecture, built upon
+[MobileNetv2](https://ai.googleblog.com/2018/04/mobilenetv2-next-generation-of-on.html).
+We employ a multi-task learning approach, jointly predicting an object's shape
+with detection and regression. The shape task predicts the object's shape
+signals depending on what ground truth annotation is available, e.g.
+segmentation. This is optional if there is no shape annotation in training data.
+For the detection task, we use the annotated bounding boxes and fit a Gaussian
+to the box, with center at the box centroid, and standard deviations
+proportional to the box size. The goal for detection is then to predict this
+distribution with its peak representing the object’s center location. The
+regression task estimates the 2D projections of the eight bounding box vertices.
+To obtain the final 3D coordinates for the bounding box, we leverage a
+well-established pose estimation algorithm
+([EPnP](https://www.epfl.ch/labs/cvlab/software/multi-view-stereo/epnp/)). It
+can recover the 3D bounding box of an object, without a priori knowledge of the
+object dimensions. Given the 3D bounding box, we can easily compute pose and
+size of the object. The model is light enough to run real-time on mobile devices
+(at 26 FPS on an Adreno 650 mobile GPU).
+
+![objectron_sample_network_results.png](../images/objectron_sample_network_results.png) |
+:-------------------------------------------------------------------------------------: |
+*Fig 6. Sample results of our network — (Left) original 2D image with estimated bounding boxes, (Middle) object detection by Gaussian distribution, (Right) predicted segmentation mask.* |
+
+## Detection and Tracking Pipeline
+
+When the model is applied to every frame captured by the mobile device, it can
+suffer from jitter due to the ambiguity of the 3D bounding box estimated in each
+frame. To mitigate this, we adopt the same detection+tracking strategy in our
+[2D object detection and tracking pipeline](./box_tracking.md#object-detection-and-tracking)
+in [MediaPipe Box Tracking](./box_tracking.md). This mitigates the need to run
+the network on every frame, allowing the use of heavier and therefore more
+accurate models, while keeping the pipeline real-time on mobile devices. It also
+retains object identity across frames and ensures that the prediction is
+temporally consistent, reducing the jitter.
+
+The Objectron 3D object detection and tracking pipeline is implemented as a
+MediaPipe
+[graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection_3d/shoe_classic_occlusion_tracking.pbtxt),
+which internally uses a
+[detection subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection_3d/subgraphs/objectron_detection_gpu.pbtxt)
+and a
+[tracking subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection_3d/subgraphs/objectron_tracking_gpu.pbtxt).
+The detection subgraph performs ML inference only once every few frames to
+reduce computation load, and decodes the output tensor to a FrameAnnotation that
+contains nine keypoints: the 3D bounding box's center and its eight vertices.
+The tracking subgraph runs every frame, using the box tracker in
+[MediaPipe Box Tracking](./box_tracking.md) to track the 2D box tightly
+enclosing the projection of the 3D bounding box, and lifts the tracked 2D
+keypoints to 3D with
+[EPnP](https://www.epfl.ch/labs/cvlab/software/multi-view-stereo/epnp/). When
+new detection becomes available from the detection subgraph, the tracking
+subgraph is also responsible for consolidation between the detection and
+tracking results, based on the area of overlap.
+
+## Example Apps
+
+Please first see general instructions for
+[Android](../getting_started/building_examples.md#android) and
+[iOS](../getting_started/building_examples.md#ios) on how to build MediaPipe examples.
+
+Note: To visualize a graph, copy the graph and paste it into
+[MediaPipe Visualizer](https://viz.mediapipe.dev/). For more information on how
+to visualize its associated subgraphs, please see
+[visualizer documentation](../visualizer.md).
+
+### Objectron for Shoes
+
+*   Graph:
+    [`mediapipe/graphs/object_detection_3d/shoe_classic_occlusion_tracking.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection_3d/shoe_classic_occlusion_tracking.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1S0K4hbWt3o31FfQ4QU3Rz7IHrvOUMx1d)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetection3d:objectdetection3d`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetection3d/BUILD)
+*   iOS target: Not available
+
+### Objectron for Chairs
+
+*   Graph:
+    [`mediapipe/graphs/object_detection_3d/chair_classic_occlusion_tracking.pbtxt`](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection_3d/chair_classic_occlusion_tracking.pbtxt)
+*   Android target:
+    [(or download prebuilt ARM64 APK)](https://drive.google.com/open?id=1MM8K-13bXLCVS1EHQ-KgkVyEahEPrKej)
+    [`mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetection3d:objectdetection3d`](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetection3d/BUILD)
+    and add `--define chair=true` to the build command, i.e.,
+
+    ```bash
+    bazel build -c opt --config android_arm64 --define chair=true mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetection3d:objectdetection3d
+    ```
+
+*   iOS target: Not available
+
+## Resources
+
+*   Google AI Blog:
+    [Real-Time 3D Object Detection on Mobile Devices with MediaPipe](https://ai.googleblog.com/2020/03/real-time-3d-object-detection-on-mobile.html)
+*   Paper: [MobilePose: Real-Time Pose Estimation for Unseen Objects with Weak
+    Shape Supervision](https://arxiv.org/abs/2003.03522)
+*   [TFLite model for shoes](https://github.com/google/mediapipe/tree/master/mediapipe/models/object_detection_3d_sneakers.tflite)
+*   [TFLite model for chairs](https://github.com/google/mediapipe/tree/master/mediapipe/models/object_detection_3d_chair.tflite)
diff --git a/docs/solutions/solutions.md b/docs/solutions/solutions.md
new file mode 100644
index 000000000..dc25c8a72
--- /dev/null
+++ b/docs/solutions/solutions.md
@@ -0,0 +1,31 @@
+---
+layout: default
+title: Solutions
+nav_order: 3
+has_children: true
+has_toc: false
+---
+
+# Solutions
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+<!-- []() in the first cell is needed to preserve table formatting in GitHub Pages. -->
+<!-- Whenever this table is updated, paste a copy to ../index.md. -->
+
+[]()                                                                          | Android | iOS | Desktop | Web | Coral
+:---------------------------------------------------------------------------- | :-----: | :-: | :-----: | :-: | :---:
+[Face Detection](https://google.github.io/mediapipe/solutions/face_detection)       | ✅       | ✅   | ✅       | ✅   | ✅
+[Face Mesh](https://google.github.io/mediapipe/solutions/face_mesh)                 | ✅       | ✅   | ✅       |     |
+[Hand](https://google.github.io/mediapipe/solutions/hand)                           | ✅       | ✅   | ✅       | ✅   |
+[Hair Segmentation](https://google.github.io/mediapipe/solutions/hair_segmentation) | ✅       |     | ✅       | ✅   |
+[Object Detection](https://google.github.io/mediapipe/solutions/object_detection)   | ✅       | ✅   | ✅       |     | ✅
+[Box Tracking](https://google.github.io/mediapipe/solutions/box_tracking)           | ✅       | ✅   | ✅       |     |
+[Objectron](https://google.github.io/mediapipe/solutions/objectron)                 | ✅       |     |         |     |
+[KNIFT](https://google.github.io/mediapipe/solutions/knift)                         | ✅       |     |         |     |
+[AutoFlip](https://google.github.io/mediapipe/solutions/autoflip)                   |         |     | ✅       |     |
+[MediaSequence](https://google.github.io/mediapipe/solutions/media_sequence)        |         |     | ✅       |     |
+[YouTube 8M](https://google.github.io/mediapipe/solutions/youtube_8m)               |         |     | ✅       |     |
diff --git a/mediapipe/docs/youtube_8m.md b/docs/solutions/youtube_8m.md
similarity index 97%
rename from mediapipe/docs/youtube_8m.md
rename to docs/solutions/youtube_8m.md
index a1f657fe5..5179e3aa5 100644
--- a/mediapipe/docs/youtube_8m.md
+++ b/docs/solutions/youtube_8m.md
@@ -1,4 +1,16 @@
-# Feature Extraction and Model Inference for YouTube-8M Challenge
+---
+layout: default
+title: YouTube-8M Feature Extraction and Model Inference
+parent: Solutions
+nav_order: 11
+---
+
+# YouTube-8M Feature Extraction and Model Inference
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 MediaPipe is a useful and general framework for media processing that can assist
 with research, development, and deployment of ML models. This example focuses on
diff --git a/docs/tools/performance_benchmarking.md b/docs/tools/performance_benchmarking.md
new file mode 100644
index 000000000..f0d334f58
--- /dev/null
+++ b/docs/tools/performance_benchmarking.md
@@ -0,0 +1,18 @@
+---
+layout: default
+title: Performance Benchmarking
+parent: Tools
+nav_order: 3
+---
+
+# Performance Benchmarking
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
+
+*Coming soon.*
+
+Future mediapipe releases will include tools for visualizing and analysing the
+latency histograms and timed events captured for performance benchmarking.
diff --git a/docs/tools/tools.md b/docs/tools/tools.md
new file mode 100644
index 000000000..568ba76a7
--- /dev/null
+++ b/docs/tools/tools.md
@@ -0,0 +1,13 @@
+---
+layout: default
+title: Tools
+nav_order: 4
+has_children: true
+---
+
+# Tools
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
diff --git a/mediapipe/docs/tracer.md b/docs/tools/tracing_and_profiling.md
similarity index 61%
rename from mediapipe/docs/tracer.md
rename to docs/tools/tracing_and_profiling.md
index d3a4174c6..5018dfa5c 100644
--- a/mediapipe/docs/tracer.md
+++ b/docs/tools/tracing_and_profiling.md
@@ -1,18 +1,30 @@
-# Tracing / Profiling MediaPipe Graphs
+---
+layout: default
+title: Tracing and Profiling
+parent: Tools
+nav_order: 2
+---
 
-The MediaPipe framework includes a built-in tracer and profiler. Tracing can
-be activated using a setting in the CalculatorGraphConfig. The tracer records
-various timing events related to packet processing, including the start and
-end time of each Calculator::Process call. The tracer writes trace log files
-in binary protobuf format.  The tracer is available on Linux, Android, or iOS.
+# Tracing and Profiling
+{: .no_toc }
 
-## Enabling tracing
+1. TOC
+{:toc}
+---
 
-To enable profiling of a mediapipe graph, the proto buffer representing the graph
-must have a profiler_config message at its root. This tag is defined inside
-calculator.proto and our public definition can be found in our github repository
-with a complete list of settings. Here is a simple setup that turns on a few
-extra options:
+The MediaPipe framework includes a built-in tracer and profiler. The tracer
+records various timing events related to packet processing, including the start
+and end time of each Calculator::Process call. The tracer writes trace log files
+in binary protobuf format. The profiler further accumulates for each running
+calculator a histogram of latencies for Process calls. Tracing and profiling
+are available on Linux, Android, or iOS.
+
+## Enabling tracing and profiling
+
+To enable tracing/profiling of a mediapipe graph, the `CalculatorGraphConfig` (in
+[calculator.proto](https://github.com/google/mediapipe/tree/master/mediapipe/framework/calculator.proto))
+representing the graph must have a `profiler_config` message at its root. Here
+is a simple setup that turns on a few extra options:
 
 ```
 profiler_config {
@@ -32,7 +44,7 @@ profiler_config {
     fashion (after the fifth file is recorded, the first file is used again).
     The trace log files are named `trace_0.log` through `trace_k.log`.
 
-    See [Profiler Configuration](profiler_config.md) for other settings
+    See [Profiler configuration](#profiler-configuration) for other settings
     available in the profiler config. Note that most of the other settings are
     considered advanced, and in general should not be needed.
 
@@ -47,12 +59,12 @@ MediaPipe will emit data into a pre-specified directory:
 *   On iOS, this can be reached through XCode. Select "Window/Devices and
     Simulators" and select the "Devices" tab.
 
-    ![Windows Select Devices](images/visualizer/ios_window_devices.png)
+    ![Windows Select Devices](../images/visualizer/ios_window_devices.png)
 
     You can open the Download Container. Logs will be located in `application
     container/.xcappdata/AppData/Documents/`
 
-    ![Windows Download Container](images/visualizer/ios_download_container.png)
+    ![Windows Download Container](../images/visualizer/ios_download_container.png)
 
 Log files are written to `\<trace_log_path index\>.binarypb` where, by default,
 `\<trace_log_path\>` is equal to `mediapipe_trace_` (the entire path and file
@@ -146,14 +158,14 @@ Trace logs can be analyzed from within the visualizer.
 
 2.  Click on the "Upload" button in the upper right.
 
-    ![Click on Upload](images/visualizer/viz_click_upload.png)
+    ![Click on Upload](../images/visualizer/viz_click_upload.png)
 
 3.  Click on "Upload trace file".
 
-    ![Click on Upload](images/visualizer/viz_click_upload_trace_file.png)
+    ![Click on Upload](../images/visualizer/viz_click_upload_trace_file.png)
 
     A sample trace file has been generated for you:
-    [sample_trace_binary.pb](data/visualizer/sample_trace.binarypb)
+    [sample_trace_binary.pb](../data/visualizer/sample_trace.binarypb)
 
 4.  A file selection popup will appear. Select the `.binarypb` that holds your
     trace information.
@@ -161,7 +173,7 @@ Trace logs can be analyzed from within the visualizer.
 5.  A chart view will appear. All of your calculators will appear along the left
     with profiling information listed along the top.
 
-    ![Click on Upload](images/visualizer/viz_chart_view.png)
+    ![Click on Upload](../images/visualizer/viz_chart_view.png)
 
     Click on a header to alternately sort that column in ascending or descending
     order. You can also scroll horizontally and vertically within the control to
@@ -221,3 +233,71 @@ input_latency_stddev
 
 input_latency_total
 :   Total accumulated input_latency (in microseconds).
+
+## Profiler configuration
+
+Many of the following settings are advanced and not recommended for general
+usage. Consult [Enabling tracing and profiling](#enabling-tracing-and-profiling)
+for a friendlier introduction.
+
+histogram_interval_size_usec
+:   Specifies the size of the runtimes histogram intervals (in microseconds)
+    to generate the histogram of the Process() time. The last interval
+    extends to +inf. If not specified, the interval is 1000000 usec = 1 sec.
+
+num_histogram_intervals
+:   Specifies the number of intervals to generate the histogram of the `Process()` runtime. If not specified, one interval is used.
+
+enable_profiler
+:   If true, the profiler starts profiling when graph is initialized.
+
+enable_stream_latency
+:   If true, the profiler also profiles the stream latency and input-output
+    latency. No-op if enable_profiler is false.
+
+use_packet_timestamp_for_added_packet
+:   If true, the profiler uses packet timestamp (as production time and source
+    production time) for packets added by calling
+    `CalculatorGraph::AddPacketToInputStream()`. If false, uses the profiler's
+    clock.
+
+trace_log_capacity
+:   The maximum number of trace events buffered in memory. The default value
+    buffers up to 20000 events.
+
+trace_event_types_disabled
+:   Trace event types that are not logged.
+
+trace_log_path
+:   The output directory and base-name prefix for trace log files. Log files are
+    written to: StrCat(trace_log_path, index, "`.binarypb`")
+
+trace_log_count
+:   The number of trace log files retained. The trace log files are named
+    "`trace_0.log`" through "`trace_k.log`". The default value specifies 2
+    output files retained.
+
+trace_log_interval_usec
+:   The interval in microseconds between trace log output. The default value
+    specifies trace log output once every 0.5 sec.
+
+trace_log_margin_usec
+:   The interval in microseconds between TimeNow and the highest times included
+    in trace log output. This margin allows time for events to be appended to
+    the TraceBuffer.
+
+trace_log_duration_events
+:   False specifies an event for each calculator invocation. True specifies a
+    separate event for each start and finish time.
+
+trace_log_interval_count
+:   The number of trace log intervals per file. The total log duration is:
+    `trace_log_interval_usec * trace_log_count * trace_log_interval_count`.
+    The default value specifies 10 intervals per file.
+
+trace_log_disabled
+:   An option to turn ON/OFF writing trace files to disk. Saving trace files to
+    disk is enabled by default.
+
+trace_enabled
+:   If true, tracer timing events are recorded and reported.
diff --git a/mediapipe/docs/visualizer.md b/docs/tools/visualizer.md
similarity index 62%
rename from mediapipe/docs/visualizer.md
rename to docs/tools/visualizer.md
index 416e4199b..4e3de07a1 100644
--- a/mediapipe/docs/visualizer.md
+++ b/docs/tools/visualizer.md
@@ -1,9 +1,16 @@
-## Visualizing & Tracing MediaPipe Graphs
+---
+layout: default
+title: Visualizer
+parent: Tools
+nav_order: 1
+---
 
--   [Working within the Editor](#working-within-the-editor)
--   [Understanding the Graph](#understanding-the-graph)
--   [Tracing the Graph](#tracing-the-graph)
--   [Visualizing Subgraphs](#visualizing-subgraphs)
+# Visualizer
+{: .no_toc }
+
+1. TOC
+{:toc}
+---
 
 To help users understand the structure of their calculator graphs and to
 understand the overall behavior of their machine learning inference pipelines,
@@ -14,20 +21,20 @@ that is available online.
     through a graph configuration that is pasted into the graph editor or
     uploaded. The user can visualize and troubleshoot a graph they have created.
 
-    ![Startup screen](./images/startup_screen.png)
+    ![Startup screen](../images/startup_screen.png)
 
-### Working within the Editor
+## Working within the Editor
 
 Getting Started:
 
 The graph can be modified by adding and editing code in the Editor view.
 
-![Editor UI](./images/editor_view.png)
+![Editor UI](../images/editor_view.png)
 
 *   Pressing the "New" button in the upper right corner will clear any existing
     code in the Editor window.
 
-    ![New Button](./images/upload_button.png)
+    ![New Button](../images/upload_button.png)
 
 *   Pressing the "Upload" button will prompt the user to select a local PBTXT
     file, which will everwrite the current code within the editor.
@@ -36,9 +43,9 @@ The graph can be modified by adding and editing code in the Editor view.
 
 *   Errors and informational messages will appear in the Feedback window.
 
-    ![Error Msg](./images/console_error.png)
+    ![Error Msg](../images/console_error.png)
 
-### Understanding the Graph
+## Understanding the Graph
 
 The visualizer graph shows the connections between calculator nodes.
 
@@ -46,39 +53,26 @@ The visualizer graph shows the connections between calculator nodes.
     enter the top of any calculator receiving the stream. (Notice the use of the
     key, "input_stream" and "output_stream").
 
-    ![Stream UI](./images/stream_ui.png)
+    ![Stream UI](../images/stream_ui.png)
 
-    ![Stream_code](./images/stream_code.png)
+    ![Stream_code](../images/stream_code.png)
 
 *   Sidepackets work the same, except that they exit a node on the right and
     enter on the left. (Notice the use of the key, "input_side_packet" and
     "output_side_packet").
 
-    ![Sidepacket UI](./images/side_packet.png)
+    ![Sidepacket UI](../images/side_packet.png)
 
-    ![Sidepacket_code](./images/side_packet_code.png)
+    ![Sidepacket_code](../images/side_packet_code.png)
 
 *   There are special nodes that represent inputs and outputs to the graph and
     can supply either side packets or streams.
 
-    ![Special nodes](./images/special_nodes.png)
+    ![Special nodes](../images/special_nodes.png)
 
-    ![Special nodes](./images/special_nodes_code.png)
+    ![Special nodes](../images/special_nodes_code.png)
 
-
-### Tracing the Graph
-
-The MediaPipe visualizer can display either a calculator graph definition or a
-calculator graph execution trace. In a MediaPipe graph, execution tracing can be
-activated using a setting in the CalculatorGraphConfig,
-`profiler_config.tracing_enabled`. When activated the tracer writes trace log
-files on either Linux, Android, or iOS.
-
-For more details on activating execution tracing, see
-[Tracing MediaPipe Graphs](./tracer.md)
-
-
-### Visualizing Subgraphs
+## Visualizing Subgraphs
 
 The MediaPipe visualizer can display multiple graphs in separate tabs. If a
 graph has a `type` field in the top level of the graph's text proto definition,
@@ -87,8 +81,8 @@ is considered a subgraph by the visualizer and colored appropriately where it is
 used. Clicking on a subgraph will navigate to the corresponding tab which holds
 the subgraph's definition.
 
-For instance, there are two graphs involved in the
-[hand detection example](./hand_detection_mobile_gpu.md): the main graph
+For instance, there are two graphs involved in
+[MediaPipe Hand](../solutions/hand.md): the main graph
 ([source pbtxt file](https://github.com/google/mediapipe/blob/master/mediapipe/graphs/hand_tracking/hand_detection_mobile.pbtxt))
 and its associated subgraph
 ([source pbtxt file](https://github.com/google/mediapipe/blob/master/mediapipe/graphs/hand_tracking/subgraphs/hand_detection_gpu.pbtxt)).
@@ -97,16 +91,16 @@ To visualize them:
 *   In the MediaPipe visualizer, click on the upload graph button and select the
     2 pbtxt files to visualize (main graph and its associated subgraph).
 
-    ![Upload graph button](./images/upload_button.png)
+    ![Upload graph button](../images/upload_button.png)
 
-    ![Choose the 2 files](./images/upload_2pbtxt.png)
+    ![Choose the 2 files](../images/upload_2pbtxt.png)
 
 *   There will be 2 additional tabs. The main graph tab is
     `hand_detection_mobile.pbtxt`.
 
-    ![hand_detection_mobile_gpu.pbtxt](./images/maingraph_visualizer.png)
+    ![hand_detection_mobile_gpu.pbtxt](../images/maingraph_visualizer.png)
 
 *   Clicking on the `HandDetection` node in purple redirects the view to the
     `hand_detection_gpu.pbtxt` tab.
 
-    ![Hand detection subgraph](./images/click_subgraph_handdetection.png)
+    ![Hand detection subgraph](../images/click_subgraph_handdetection.png)
diff --git a/mediapipe/calculators/core/split_normalized_landmark_list_calculator.cc b/mediapipe/calculators/core/split_normalized_landmark_list_calculator.cc
index e95173e0c..85bac0e9b 100644
--- a/mediapipe/calculators/core/split_normalized_landmark_list_calculator.cc
+++ b/mediapipe/calculators/core/split_normalized_landmark_list_calculator.cc
@@ -112,7 +112,9 @@ class SplitNormalizedLandmarkListCalculator : public CalculatorBase {
   ::mediapipe::Status Process(CalculatorContext* cc) override {
     const NormalizedLandmarkList& input =
         cc->Inputs().Index(0).Get<NormalizedLandmarkList>();
-    RET_CHECK_GE(input.landmark_size(), max_range_end_);
+    RET_CHECK_GE(input.landmark_size(), max_range_end_)
+        << "Max range end " << max_range_end_ << " exceeds landmarks size "
+        << input.landmark_size();
 
     if (combine_outputs_) {
       NormalizedLandmarkList output;
diff --git a/mediapipe/calculators/image/BUILD b/mediapipe/calculators/image/BUILD
index 8df493d22..7efb4a011 100644
--- a/mediapipe/calculators/image/BUILD
+++ b/mediapipe/calculators/image/BUILD
@@ -258,6 +258,7 @@ cc_library(
         ":bilateral_filter_calculator_cc_proto",
         "//mediapipe/framework:calculator_options_cc_proto",
         "//mediapipe/framework/formats:image_format_cc_proto",
+        "@com_google_absl//absl/strings",
         "//mediapipe/framework:calculator_framework",
         "//mediapipe/framework/formats:image_frame",
         "//mediapipe/framework/formats:image_frame_opencv",
diff --git a/mediapipe/calculators/image/bilateral_filter_calculator.cc b/mediapipe/calculators/image/bilateral_filter_calculator.cc
index e1d26c1e0..8d3d26f2d 100644
--- a/mediapipe/calculators/image/bilateral_filter_calculator.cc
+++ b/mediapipe/calculators/image/bilateral_filter_calculator.cc
@@ -15,6 +15,7 @@
 #include <memory>
 #include <string>
 
+#include "absl/strings/str_replace.h"
 #include "mediapipe/calculators/image/bilateral_filter_calculator.pb.h"
 #include "mediapipe/framework/calculator_framework.h"
 #include "mediapipe/framework/calculator_options.pb.h"
@@ -104,8 +105,9 @@ class BilateralFilterCalculator : public CalculatorBase {
 #if !defined(MEDIAPIPE_DISABLE_GPU)
   mediapipe::GlCalculatorHelper gpu_helper_;
   GLuint program_ = 0;
-  GLuint program_joint_ = 0;
-#endif  //  !MEDIAPIPE_DISABLE_GPU
+  GLuint vao_;
+  GLuint vbo_[2];  // vertex storage
+#endif             // !MEDIAPIPE_DISABLE_GPU
 };
 REGISTER_CALCULATOR(BilateralFilterCalculator);
 
@@ -219,9 +221,12 @@ REGISTER_CALCULATOR(BilateralFilterCalculator);
 #if !defined(MEDIAPIPE_DISABLE_GPU)
   gpu_helper_.RunInGlContext([this] {
     if (program_) glDeleteProgram(program_);
+    if (vao_) glDeleteVertexArrays(1, &vao_);
+    if (vbo_[0]) glDeleteBuffers(2, vbo_);
     program_ = 0;
-    if (program_joint_) glDeleteProgram(program_joint_);
-    program_joint_ = 0;
+    vao_ = 0;
+    vbo_[0] = 0;
+    vbo_[1] = 0;
   });
 #endif  //  !MEDIAPIPE_DISABLE_GPU
 
@@ -276,17 +281,18 @@ REGISTER_CALCULATOR(BilateralFilterCalculator);
   auto input_texture = gpu_helper_.CreateSourceTexture(input_frame);
 
   mediapipe::GlTexture output_texture;
-  const bool has_guide_image = cc->Inputs().HasTag(kInputGuideTagGpu) &&
-                               !cc->Inputs().Tag(kInputGuideTagGpu).IsEmpty();
+  const bool has_guide_image = cc->Inputs().HasTag(kInputGuideTagGpu);
 
   // Setup textures and Update image in GPU shader.
   if (has_guide_image) {
+    if (cc->Inputs().Tag(kInputGuideTagGpu).IsEmpty())
+      return mediapipe::OkStatus();
     // joint bilateral filter
-    glUseProgram(program_joint_);
+    glUseProgram(program_);
     const auto& guide_image =
         cc->Inputs().Tag(kInputGuideTagGpu).Get<mediapipe::GpuBuffer>();
     auto guide_texture = gpu_helper_.CreateSourceTexture(guide_image);
-    glUniform2f(glGetUniformLocation(program_joint_, "texel_size_guide"),
+    glUniform2f(glGetUniformLocation(program_, "texel_size_guide"),
                 1.0 / guide_image.width(), 1.0 / guide_image.height());
     output_texture = gpu_helper_.CreateDestinationTexture(
         guide_image.width(), guide_image.height(),
@@ -297,7 +303,6 @@ REGISTER_CALCULATOR(BilateralFilterCalculator);
     glActiveTexture(GL_TEXTURE2);
     glBindTexture(GL_TEXTURE_2D, guide_texture.name());
     GlRender(cc);
-    glActiveTexture(GL_TEXTURE2);
     glBindTexture(GL_TEXTURE_2D, 0);
     glActiveTexture(GL_TEXTURE1);
     glBindTexture(GL_TEXTURE_2D, 0);
@@ -314,7 +319,6 @@ REGISTER_CALCULATOR(BilateralFilterCalculator);
     glActiveTexture(GL_TEXTURE1);
     glBindTexture(GL_TEXTURE_2D, input_texture.name());
     GlRender(cc);
-    glActiveTexture(GL_TEXTURE1);
     glBindTexture(GL_TEXTURE_2D, 0);
   }
   glFlush();
@@ -335,51 +339,14 @@ REGISTER_CALCULATOR(BilateralFilterCalculator);
 
 void BilateralFilterCalculator::GlRender(CalculatorContext* cc) {
 #if !defined(MEDIAPIPE_DISABLE_GPU)
-  static const GLfloat square_vertices[] = {
-      -1.0f, -1.0f,  // bottom left
-      1.0f,  -1.0f,  // bottom right
-      -1.0f, 1.0f,   // top left
-      1.0f,  1.0f,   // top right
-  };
-  static const GLfloat texture_vertices[] = {
-      0.0f, 0.0f,  // bottom left
-      1.0f, 0.0f,  // bottom right
-      0.0f, 1.0f,  // top left
-      1.0f, 1.0f,  // top right
-  };
-
-  // vertex storage
-  GLuint vbo[2];
-  glGenBuffers(2, vbo);
-  GLuint vao;
-  glGenVertexArrays(1, &vao);
-  glBindVertexArray(vao);
-
-  // vbo 0
-  glBindBuffer(GL_ARRAY_BUFFER, vbo[0]);
-  glBufferData(GL_ARRAY_BUFFER, 4 * 2 * sizeof(GLfloat), square_vertices,
-               GL_STATIC_DRAW);
-  glEnableVertexAttribArray(ATTRIB_VERTEX);
-  glVertexAttribPointer(ATTRIB_VERTEX, 2, GL_FLOAT, 0, 0, nullptr);
-
-  // vbo 1
-  glBindBuffer(GL_ARRAY_BUFFER, vbo[1]);
-  glBufferData(GL_ARRAY_BUFFER, 4 * 2 * sizeof(GLfloat), texture_vertices,
-               GL_STATIC_DRAW);
-  glEnableVertexAttribArray(ATTRIB_TEXTURE_POSITION);
-  glVertexAttribPointer(ATTRIB_TEXTURE_POSITION, 2, GL_FLOAT, 0, 0, nullptr);
+  // bring back vao and vbo
+  glBindVertexArray(vao_);
 
   // draw
   glDrawArrays(GL_TRIANGLE_STRIP, 0, 4);
 
   // cleanup
-  glDisableVertexAttribArray(ATTRIB_VERTEX);
-  glDisableVertexAttribArray(ATTRIB_TEXTURE_POSITION);
-  glBindBuffer(GL_ARRAY_BUFFER, 0);
   glBindVertexArray(0);
-  glDeleteVertexArrays(1, &vao);
-  glDeleteBuffers(2, vbo);
-
 #endif  //  !MEDIAPIPE_DISABLE_GPU
 }
 
@@ -394,36 +361,11 @@ void BilateralFilterCalculator::GlRender(CalculatorContext* cc) {
       "texture_coordinate",
   };
 
-  // We bake our sigma values directly into the shader, so the GLSL compiler can
-  // optimize appropriately.
-  std::string sigma_options_string =
-      "const float sigma_space = " + std::to_string(sigma_space_) +
-      "; const float sigma_color = " + std::to_string(sigma_color_) + ";\n";
-
-  // Shader to do bilateral filtering on input image based on sigma space/color.
-  // Large kernel sizes are subsampled based on sqrt(sigma_space) window size,
-  // denoted as 'sparsity' below.
-  const std::string frag_src = GLES_VERSION_COMPAT
-                               R"(
-  #if __VERSION__ < 130
-    #define in varying
-  #endif  // __VERSION__ < 130
-
-  #ifdef GL_ES
-    #define fragColor gl_FragColor
-    precision highp float;
-  #else
-    #define lowp
-    #define mediump
-    #define highp
-    #define texture2D texture
-    out vec4 fragColor;
-  #endif  // defined(GL_ES)
-
-    in vec2 sample_coordinate;
-    uniform sampler2D input_frame;
-)" + sigma_options_string + R"(
-    uniform vec2 texel_size;
+  // Common functions and settings for both shaders.
+  const std::string common_string =
+      absl::StrReplaceAll(R"(
+    const float sigma_space = $space;
+    const float sigma_color = $color;
 
     const float kSparsityFactor = 0.66;  // Higher is more sparse.
     const float sparsity = max(1.0, sqrt(sigma_space) * kSparsityFactor);
@@ -435,6 +377,23 @@ void BilateralFilterCalculator::GlRender(CalculatorContext* cc) {
       float coeff = -0.5 / (sigma * sigma * 4.0 + 1.0e-6);
       return exp((x * x) * coeff);
     }
+  )",
+                          {{"$space", std::to_string(sigma_space_)},
+                           {"$color", std::to_string(sigma_color_)}});
+
+  // Shader to do bilateral filtering on input image based on sigma space/color.
+  // Large kernel sizes are subsampled based on sqrt(sigma_space) window size,
+  // denoted as 'sparsity' below.
+  const std::string frag_src =
+      std::string(mediapipe::kMediaPipeFragmentShaderPreamble) + R"(
+    DEFAULT_PRECISION(highp, float)
+
+    in vec2 sample_coordinate;
+    uniform sampler2D input_frame;
+    uniform vec2 texel_size;
+
+    )" +
+      common_string + R"(
 
     void main() {
       vec2 center_uv = sample_coordinate;
@@ -462,55 +421,25 @@ void BilateralFilterCalculator::GlRender(CalculatorContext* cc) {
       }
       new_val /= vec3(total_weight);
 
-      fragColor = vec4(new_val, 1.0);
+      gl_FragColor = vec4(new_val, 1.0);
     }
   )";
 
-  // Create shader program and set parameters.
-  mediapipe::GlhCreateProgram(mediapipe::kBasicVertexShader, frag_src.c_str(),
-                              NUM_ATTRIBUTES, (const GLchar**)&attr_name[0],
-                              attr_location, &program_);
-  RET_CHECK(program_) << "Problem initializing the program.";
-  glUseProgram(program_);
-  glUniform1i(glGetUniformLocation(program_, "input_frame"), 1);
-
   // Shader to do joint bilateral filtering on input image based on
   // sigma space/color, and a Guide image.
   // Large kernel sizes are subsampled based on sqrt(sigma_space) window size,
   // denoted as 'sparsity' below.
-  const std::string joint_frag_src = GLES_VERSION_COMPAT
-                                     R"(
-  #if __VERSION__ < 130
-    #define in varying
-  #endif  // __VERSION__ < 130
-
-  #ifdef GL_ES
-    #define fragColor gl_FragColor
-    precision highp float;
-  #else
-    #define lowp
-    #define mediump
-    #define highp
-    #define texture2D texture
-    out vec4 fragColor;
-  #endif  // defined(GL_ES)
+  const std::string joint_frag_src =
+      std::string(mediapipe::kMediaPipeFragmentShaderPreamble) + R"(
+    DEFAULT_PRECISION(highp, float)
 
     in vec2 sample_coordinate;
     uniform sampler2D input_frame;
     uniform sampler2D guide_frame;
-)" + sigma_options_string + R"(
     uniform vec2 texel_size_guide; // size of guide and resulting filtered image
 
-    const float kSparsityFactor = 0.66;  // Higher is more sparse.
-    const float sparsity = max(1.0, sqrt(sigma_space) * kSparsityFactor);
-    const float step = sparsity;
-    const float radius = sigma_space;
-    const float offset = (step > 1.0) ? (step * 0.5) : (0.0);
-
-    float gaussian(float x, float sigma) {
-      float coeff = -0.5 / (sigma * sigma * 4.0 + 1.0e-6);
-      return exp((x * x) * coeff);
-    }
+    )" +
+      common_string + R"(
 
     void main() {
       vec2 center_uv = sample_coordinate;
@@ -539,18 +468,52 @@ void BilateralFilterCalculator::GlRender(CalculatorContext* cc) {
       }
       new_val /= vec3(total_weight);
 
-      fragColor = vec4(new_val, 1.0);
+      gl_FragColor = vec4(new_val, 1.0);
     }
   )";
 
-  // Create shader program and set parameters.
-  mediapipe::GlhCreateProgram(
-      mediapipe::kBasicVertexShader, joint_frag_src.c_str(), NUM_ATTRIBUTES,
-      (const GLchar**)&attr_name[0], attr_location, &program_joint_);
-  RET_CHECK(program_joint_) << "Problem initializing the program.";
-  glUseProgram(program_joint_);
-  glUniform1i(glGetUniformLocation(program_joint_, "input_frame"), 1);
-  glUniform1i(glGetUniformLocation(program_joint_, "guide_frame"), 2);
+  // Only initialize the one shader to be used.
+  const bool has_guide_image = cc->Inputs().HasTag(kInputGuideTagGpu);
+
+  if (has_guide_image) {
+    // Create joint shader program and set parameters.
+    mediapipe::GlhCreateProgram(
+        mediapipe::kBasicVertexShader, joint_frag_src.c_str(), NUM_ATTRIBUTES,
+        (const GLchar**)&attr_name[0], attr_location, &program_);
+    RET_CHECK(program_) << "Problem initializing the program.";
+    glUseProgram(program_);
+    glUniform1i(glGetUniformLocation(program_, "input_frame"), 1);
+    glUniform1i(glGetUniformLocation(program_, "guide_frame"), 2);
+  } else {
+    // Create default shader program and set parameters.
+    mediapipe::GlhCreateProgram(mediapipe::kBasicVertexShader, frag_src.c_str(),
+                                NUM_ATTRIBUTES, (const GLchar**)&attr_name[0],
+                                attr_location, &program_);
+    RET_CHECK(program_) << "Problem initializing the program.";
+    glUseProgram(program_);
+    glUniform1i(glGetUniformLocation(program_, "input_frame"), 1);
+  }
+
+  // Generate vbos and vao.
+  glGenVertexArrays(1, &vao_);
+  glGenBuffers(2, vbo_);
+
+  // Fill in static vbo (vbo 0), to be reused in GlRender().
+  glBindVertexArray(vao_);
+  glBindBuffer(GL_ARRAY_BUFFER, vbo_[0]);
+  glBufferData(GL_ARRAY_BUFFER, 4 * 2 * sizeof(GLfloat),
+               mediapipe::kBasicSquareVertices, GL_STATIC_DRAW);
+  glEnableVertexAttribArray(ATTRIB_VERTEX);
+  glVertexAttribPointer(ATTRIB_VERTEX, 2, GL_FLOAT, 0, 0, nullptr);
+  glBindBuffer(GL_ARRAY_BUFFER, 0);
+  // Fill in static vbo (vbo 1), to be reused in GlRender().
+  glBindBuffer(GL_ARRAY_BUFFER, vbo_[1]);
+  glBufferData(GL_ARRAY_BUFFER, 4 * 2 * sizeof(GLfloat),
+               mediapipe::kBasicTextureVertices, GL_STATIC_DRAW);
+  glEnableVertexAttribArray(ATTRIB_TEXTURE_POSITION);
+  glVertexAttribPointer(ATTRIB_TEXTURE_POSITION, 2, GL_FLOAT, 0, 0, nullptr);
+  glBindBuffer(GL_ARRAY_BUFFER, 0);
+  glBindVertexArray(0);
 
 #endif  //  !MEDIAPIPE_DISABLE_GPU
 
diff --git a/mediapipe/calculators/image/image_transformation_calculator.cc b/mediapipe/calculators/image/image_transformation_calculator.cc
index d771707d7..75ed96e15 100644
--- a/mediapipe/calculators/image/image_transformation_calculator.cc
+++ b/mediapipe/calculators/image/image_transformation_calculator.cc
@@ -570,6 +570,7 @@ void ImageTransformationCalculator::ComputeOutputDimensions(
 void ImageTransformationCalculator::ComputeOutputLetterboxPadding(
     int input_width, int input_height, int output_width, int output_height,
     std::array<float, 4>* padding) {
+  padding->fill(0.f);
   if (scale_mode_ == mediapipe::ScaleMode_Mode_FIT) {
     if (rotation_ == mediapipe::RotationMode_Mode_ROTATION_90 ||
         rotation_ == mediapipe::RotationMode_Mode_ROTATION_270) {
diff --git a/mediapipe/calculators/tensorflow/vector_int_to_tensor_calculator_test.cc b/mediapipe/calculators/tensorflow/vector_int_to_tensor_calculator_test.cc
index 052a78516..369c09660 100644
--- a/mediapipe/calculators/tensorflow/vector_int_to_tensor_calculator_test.cc
+++ b/mediapipe/calculators/tensorflow/vector_int_to_tensor_calculator_test.cc
@@ -153,7 +153,7 @@ TEST_F(VectorIntToTensorCalculatorTest, TestInt64) {
   const int64 time = 1234;
   runner_->MutableInputs()
       ->Tag("SINGLE_INT")
-      .packets.push_back(MakePacket<int>(2 ^ 31).At(Timestamp(time)));
+      .packets.push_back(MakePacket<int>(1LL << 31).At(Timestamp(time)));
 
   EXPECT_TRUE(runner_->Run().ok());
 
@@ -166,7 +166,8 @@ TEST_F(VectorIntToTensorCalculatorTest, TestInt64) {
   EXPECT_EQ(1, output_tensor.dims());
   EXPECT_EQ(tf::DT_INT64, output_tensor.dtype());
   const auto vec = output_tensor.vec<tf::int64>();
-  EXPECT_EQ(2 ^ 31, vec(0));
+  // 1LL << 31 overflows the positive int and becomes negative.
+  EXPECT_EQ(static_cast<int>(1LL << 31), vec(0));
 }
 
 TEST_F(VectorIntToTensorCalculatorTest, TestUint8) {
diff --git a/mediapipe/calculators/tflite/tflite_inference_calculator.cc b/mediapipe/calculators/tflite/tflite_inference_calculator.cc
index d9aba77c6..f8e82bca6 100644
--- a/mediapipe/calculators/tflite/tflite_inference_calculator.cc
+++ b/mediapipe/calculators/tflite/tflite_inference_calculator.cc
@@ -358,6 +358,13 @@ REGISTER_CALCULATOR(TfLiteInferenceCalculator);
       cc->Options<mediapipe::TfLiteInferenceCalculatorOptions>();
   use_advanced_gpu_api_ = false;
 
+  if (use_advanced_gpu_api_ && !(gpu_input_ && gpu_output_)) {
+    LOG(WARNING)
+        << "Cannot use advanced GPU APIs, both inputs and outputs must "
+           "be GPU buffers. Falling back to the default TFLite API.";
+    use_advanced_gpu_api_ = false;
+  }
+
   MP_RETURN_IF_ERROR(LoadModel(cc));
 
   if (gpu_inference_) {
diff --git a/mediapipe/calculators/tflite/tflite_tensors_to_landmarks_calculator.cc b/mediapipe/calculators/tflite/tflite_tensors_to_landmarks_calculator.cc
index 52f9b85b7..3c41531e1 100644
--- a/mediapipe/calculators/tflite/tflite_tensors_to_landmarks_calculator.cc
+++ b/mediapipe/calculators/tflite/tflite_tensors_to_landmarks_calculator.cc
@@ -21,8 +21,9 @@
 namespace mediapipe {
 
 // A calculator for converting TFLite tensors from regression models into
-// landmarks. Note that if the landmarks in the tensor has more than 3
-// dimensions, only the first 3 dimensions will be converted to x,y,z.
+// landmarks. Note that if the landmarks in the tensor have more than 4
+// dimensions, only the first 4 dimensions will be converted to
+// [x, y, z, visibility].
 //
 // Input:
 //  TENSORS - Vector of TfLiteTensor of type kTfLiteFloat32. Only the first
@@ -205,12 +206,14 @@ REGISTER_CALCULATOR(TfLiteTensorsToLandmarksCalculator);
     if (num_dimensions > 2) {
       landmark->set_z(raw_landmarks[offset + 2]);
     }
+    if (num_dimensions > 3) {
+      landmark->set_visibility(raw_landmarks[offset + 3]);
+    }
   }
 
   // Output normalized landmarks if required.
   if (cc->Outputs().HasTag("NORM_LANDMARKS")) {
     NormalizedLandmarkList output_norm_landmarks;
-    // for (const auto& landmark : output_landmarks) {
     for (int i = 0; i < output_landmarks.landmark_size(); ++i) {
       const Landmark& landmark = output_landmarks.landmark(i);
       NormalizedLandmark* norm_landmark = output_norm_landmarks.add_landmark();
@@ -219,6 +222,7 @@ REGISTER_CALCULATOR(TfLiteTensorsToLandmarksCalculator);
       norm_landmark->set_y(static_cast<float>(landmark.y()) /
                            options_.input_image_height());
       norm_landmark->set_z(landmark.z() / options_.normalize_z());
+      norm_landmark->set_visibility(landmark.visibility());
     }
     cc->Outputs()
         .Tag("NORM_LANDMARKS")
diff --git a/mediapipe/calculators/util/BUILD b/mediapipe/calculators/util/BUILD
index 9edd8deba..b570e4ca2 100644
--- a/mediapipe/calculators/util/BUILD
+++ b/mediapipe/calculators/util/BUILD
@@ -320,6 +320,7 @@ cc_library(
         "//mediapipe/framework:calculator_options_cc_proto",
         "//mediapipe/framework/formats:image_format_cc_proto",
         "//mediapipe/util:color_cc_proto",
+        "@com_google_absl//absl/strings",
         "//mediapipe/framework:calculator_framework",
         "//mediapipe/framework/formats:image_frame",
         "//mediapipe/framework/formats:video_stream_header",
@@ -541,6 +542,19 @@ cc_library(
     alwayslink = 1,
 )
 
+cc_library(
+    name = "rect_projection_calculator",
+    srcs = ["rect_projection_calculator.cc"],
+    visibility = ["//visibility:public"],
+    deps = [
+        "//mediapipe/framework:calculator_framework",
+        "//mediapipe/framework/formats:rect_cc_proto",
+        "//mediapipe/framework/port:ret_check",
+        "//mediapipe/framework/port:status",
+    ],
+    alwayslink = 1,
+)
+
 cc_test(
     name = "detections_to_rects_calculator_test",
     size = "small",
@@ -951,6 +965,7 @@ cc_library(
     visibility = ["//visibility:public"],
     deps = [
         ":top_k_scores_calculator_cc_proto",
+        "@com_google_absl//absl/container:node_hash_map",
         "//mediapipe/framework/formats:classification_cc_proto",
         "//mediapipe/framework/port:ret_check",
         "//mediapipe/framework/port:status",
diff --git a/mediapipe/calculators/util/annotation_overlay_calculator.cc b/mediapipe/calculators/util/annotation_overlay_calculator.cc
index 29cf74962..812522f7a 100644
--- a/mediapipe/calculators/util/annotation_overlay_calculator.cc
+++ b/mediapipe/calculators/util/annotation_overlay_calculator.cc
@@ -14,6 +14,7 @@
 
 #include <memory>
 
+#include "absl/strings/str_cat.h"
 #include "mediapipe/calculators/util/annotation_overlay_calculator.pb.h"
 #include "mediapipe/framework/calculator_framework.h"
 #include "mediapipe/framework/calculator_options.pb.h"
@@ -573,31 +574,33 @@ REGISTER_CALCULATOR(AnnotationOverlayCalculator);
   };
 
   // Shader to overlay a texture onto another when overlay is non-zero.
-  const GLchar* frag_src = GLES_VERSION_COMPAT
-      R"(
-  #if __VERSION__ < 130
-    #define in varying
-  #endif  // __VERSION__ < 130
-
+  constexpr char kFragSrcBody[] = R"(
+  DEFAULT_PRECISION(mediump, float)
   #ifdef GL_ES
     #define fragColor gl_FragColor
-    precision highp float;
   #else
-    #define lowp
-    #define mediump
-    #define highp
-    #define texture2D texture
     out vec4 fragColor;
-  #endif  // defined(GL_ES)
+  #endif  // GL_ES
 
     in vec2 sample_coordinate;
     uniform sampler2D input_frame;
+    // "overlay" texture has top-left origin (OpenCV mat with annotations has
+    // been uploaded to GPU without vertical flip)
     uniform sampler2D overlay;
     uniform vec3 transparent_color;
 
     void main() {
       vec3 image_pix = texture2D(input_frame, sample_coordinate).rgb;
+  #ifdef INPUT_FRAME_HAS_TOP_LEFT_ORIGIN
+      // "input_frame" has top-left origin same as "overlay", hence overlaying
+      // as is.
       vec3 overlay_pix = texture2D(overlay, sample_coordinate).rgb;
+  #else
+      // "input_frame" has bottom-left origin, hence flipping "overlay" texture
+      // coordinates.
+      vec3 overlay_pix = texture2D(overlay, vec2(sample_coordinate.x, 1.0 - sample_coordinate.y)).rgb;
+  #endif  // INPUT_FRAME_HAS_TOP_LEFT_ORIGIN
+
       vec3 out_pix = image_pix;
       float dist = distance(overlay_pix.rgb, transparent_color);
       if (dist > 0.001) out_pix = overlay_pix;
@@ -606,8 +609,18 @@ REGISTER_CALCULATOR(AnnotationOverlayCalculator);
     }
   )";
 
+  std::string defines;
+  if (options_.gpu_uses_top_left_origin()) {
+    defines = R"(
+      #define INPUT_FRAME_HAS_TOP_LEFT_ORIGIN
+    )";
+  }
+
+  const std::string frag_src = absl::StrCat(
+      mediapipe::kMediaPipeFragmentShaderPreamble, defines, kFragSrcBody);
+
   // Create shader program and set parameters
-  mediapipe::GlhCreateProgram(mediapipe::kBasicVertexShader, frag_src,
+  mediapipe::GlhCreateProgram(mediapipe::kBasicVertexShader, frag_src.c_str(),
                               NUM_ATTRIBUTES, (const GLchar**)&attr_name[0],
                               attr_location, &program_);
   RET_CHECK(program_) << "Problem initializing the program.";
diff --git a/mediapipe/calculators/util/annotation_overlay_calculator.proto b/mediapipe/calculators/util/annotation_overlay_calculator.proto
index 93e436110..4391a1f2a 100644
--- a/mediapipe/calculators/util/annotation_overlay_calculator.proto
+++ b/mediapipe/calculators/util/annotation_overlay_calculator.proto
@@ -40,4 +40,9 @@ message AnnotationOverlayCalculatorOptions {
   // top-left corner. Therefore, for images with the origin at the bottom-left
   // corner this should be set to true.
   optional bool flip_text_vertically = 5 [default = false];
+
+  // Whether input stream IMAGE_GPU (OpenGL texture) has bottom-left or top-left
+  // origin. (Historically, OpenGL uses bottom left origin, but most MediaPipe
+  // examples expect textures to have top-left origin.)
+  optional bool gpu_uses_top_left_origin = 6 [default = true];
 }
diff --git a/mediapipe/calculators/util/landmark_letterbox_removal_calculator.cc b/mediapipe/calculators/util/landmark_letterbox_removal_calculator.cc
index b0f7cc0fd..b79d8e4f0 100644
--- a/mediapipe/calculators/util/landmark_letterbox_removal_calculator.cc
+++ b/mediapipe/calculators/util/landmark_letterbox_removal_calculator.cc
@@ -127,6 +127,8 @@ class LandmarkLetterboxRemovalCalculator : public CalculatorBase {
         new_landmark->set_y(new_y);
         // Keep z-coord as is.
         new_landmark->set_z(landmark.z());
+        // Keep visibility as is.
+        new_landmark->set_visibility(landmark.visibility());
       }
 
       cc->Outputs().Get(output_id).AddPacket(
diff --git a/mediapipe/calculators/util/landmark_projection_calculator.cc b/mediapipe/calculators/util/landmark_projection_calculator.cc
index 0ab22ad97..61986672c 100644
--- a/mediapipe/calculators/util/landmark_projection_calculator.cc
+++ b/mediapipe/calculators/util/landmark_projection_calculator.cc
@@ -128,6 +128,8 @@ class LandmarkProjectionCalculator : public CalculatorBase {
         new_landmark->set_y(new_y);
         // Keep z-coord as is.
         new_landmark->set_z(landmark.z());
+        // Keep visibility as is.
+        new_landmark->set_visibility(landmark.visibility());
       }
 
       cc->Outputs().Get(output_id).AddPacket(
diff --git a/mediapipe/calculators/util/landmarks_to_render_data_calculator.cc b/mediapipe/calculators/util/landmarks_to_render_data_calculator.cc
index a099e81f3..3d43a64bb 100644
--- a/mediapipe/calculators/util/landmarks_to_render_data_calculator.cc
+++ b/mediapipe/calculators/util/landmarks_to_render_data_calculator.cc
@@ -97,11 +97,17 @@ void AddConnectionToRenderData(const LandmarkType& start,
 template <class LandmarkListType, class LandmarkType>
 void AddConnectionsWithDepth(const LandmarkListType& landmarks,
                              const std::vector<int>& landmark_connections,
-                             float thickness, bool normalized, float min_z,
-                             float max_z, RenderData* render_data) {
+                             bool utilize_visibility,
+                             float visibility_threshold, float thickness,
+                             bool normalized, float min_z, float max_z,
+                             RenderData* render_data) {
   for (int i = 0; i < landmark_connections.size(); i += 2) {
     const auto& ld0 = landmarks.landmark(landmark_connections[i]);
     const auto& ld1 = landmarks.landmark(landmark_connections[i + 1]);
+    // Visibility filtering is opt-in; skip connections with a hidden endpoint.
+    const bool endpoint_hidden = ld0.visibility() < visibility_threshold ||
+                                 ld1.visibility() < visibility_threshold;
+    if (utilize_visibility && endpoint_hidden) continue;
     const int gray_val1 =
         255 - static_cast<int>(Remap(ld0.z(), min_z, max_z, 255));
     const int gray_val2 =
@@ -130,11 +136,16 @@ void AddConnectionToRenderData(const LandmarkType& start,
 template <class LandmarkListType, class LandmarkType>
 void AddConnections(const LandmarkListType& landmarks,
                     const std::vector<int>& landmark_connections,
+                    bool utilize_visibility, float visibility_threshold,
                     const Color& connection_color, float thickness,
                     bool normalized, RenderData* render_data) {
   for (int i = 0; i < landmark_connections.size(); i += 2) {
     const auto& ld0 = landmarks.landmark(landmark_connections[i]);
     const auto& ld1 = landmarks.landmark(landmark_connections[i + 1]);
+    // Visibility filtering is opt-in; skip connections with a hidden endpoint.
+    const bool endpoint_hidden = ld0.visibility() < visibility_threshold ||
+                                 ld1.visibility() < visibility_threshold;
+    if (utilize_visibility && endpoint_hidden) continue;
     AddConnectionToRenderData<LandmarkType>(ld0, ld1, connection_color,
                                             thickness, normalized, render_data);
   }
@@ -231,6 +242,17 @@ REGISTER_CALCULATOR(LandmarksToRenderDataCalculator);
 
 ::mediapipe::Status LandmarksToRenderDataCalculator::Process(
     CalculatorContext* cc) {
+  // Skip rendering when the input landmarks packet is empty; no output packet
+  // is emitted for this timestamp.
+  if (cc->Inputs().HasTag(kLandmarksTag) &&
+      cc->Inputs().Tag(kLandmarksTag).IsEmpty()) {
+    return ::mediapipe::OkStatus();
+  }
+  if (cc->Inputs().HasTag(kNormLandmarksTag) &&
+      cc->Inputs().Tag(kNormLandmarksTag).IsEmpty()) {
+    return ::mediapipe::OkStatus();
+  }
+
   auto render_data = absl::make_unique<RenderData>();
   bool visualize_depth = options_.visualize_landmark_depth();
   float z_min = 0.f;
@@ -255,15 +277,23 @@ REGISTER_CALCULATOR(LandmarksToRenderDataCalculator);
     visualize_depth &= ((z_max - z_min) > 1e-3);
     if (visualize_depth) {
       AddConnectionsWithDepth<LandmarkList, Landmark>(
-          landmarks, landmark_connections_, thickness, /*normalized=*/false,
+          landmarks, landmark_connections_, options_.utilize_visibility(),
+          options_.visibility_threshold(), thickness, /*normalized=*/false,
           z_min, z_max, render_data.get());
     } else {
       AddConnections<LandmarkList, Landmark>(
-          landmarks, landmark_connections_, options_.connection_color(),
+          landmarks, landmark_connections_, options_.utilize_visibility(),
+          options_.visibility_threshold(), options_.connection_color(),
           thickness, /*normalized=*/false, render_data.get());
     }
     for (int i = 0; i < landmarks.landmark_size(); ++i) {
       const Landmark& landmark = landmarks.landmark(i);
+
+      if (options_.utilize_visibility() &&
+          landmark.visibility() < options_.visibility_threshold()) {
+        continue;
+      }
+
       auto* landmark_data_render = AddPointRenderData(
           options_.landmark_color(), thickness, render_data.get());
       if (visualize_depth) {
@@ -288,15 +318,23 @@ REGISTER_CALCULATOR(LandmarksToRenderDataCalculator);
     visualize_depth &= ((z_max - z_min) > 1e-3);
     if (visualize_depth) {
       AddConnectionsWithDepth<NormalizedLandmarkList, NormalizedLandmark>(
-          landmarks, landmark_connections_, thickness, /*normalized=*/true,
+          landmarks, landmark_connections_, options_.utilize_visibility(),
+          options_.visibility_threshold(), thickness, /*normalized=*/true,
           z_min, z_max, render_data.get());
     } else {
       AddConnections<NormalizedLandmarkList, NormalizedLandmark>(
-          landmarks, landmark_connections_, options_.connection_color(),
+          landmarks, landmark_connections_, options_.utilize_visibility(),
+          options_.visibility_threshold(), options_.connection_color(),
           thickness, /*normalized=*/true, render_data.get());
     }
     for (int i = 0; i < landmarks.landmark_size(); ++i) {
       const NormalizedLandmark& landmark = landmarks.landmark(i);
+
+      if (options_.utilize_visibility() &&
+          landmark.visibility() < options_.visibility_threshold()) {
+        continue;
+      }
+
       auto* landmark_data_render = AddPointRenderData(
           options_.landmark_color(), thickness, render_data.get());
       if (visualize_depth) {
diff --git a/mediapipe/calculators/util/landmarks_to_render_data_calculator.proto b/mediapipe/calculators/util/landmarks_to_render_data_calculator.proto
index 1334fc1f1..ff1e8fdc5 100644
--- a/mediapipe/calculators/util/landmarks_to_render_data_calculator.proto
+++ b/mediapipe/calculators/util/landmarks_to_render_data_calculator.proto
@@ -40,4 +40,13 @@ message LandmarksToRenderDataCalculatorOptions {
 
   // Change color and size of rendered landmarks based on its z value.
   optional bool visualize_landmark_depth = 5 [default = true];
+
+  // Use landmark visibility while rendering landmarks and connections. If a
+  // landmark is not visible, neither it nor its adjacent connections will be
+  // rendered.
+  optional bool utilize_visibility = 6 [default = false];
+
+  // Threshold to determine visibility of the landmark. A landmark with
+  // visibility greater than or equal to the threshold is considered visible.
+  optional double visibility_threshold = 7 [default = 0.0];
 }
diff --git a/mediapipe/calculators/util/rect_projection_calculator.cc b/mediapipe/calculators/util/rect_projection_calculator.cc
new file mode 100644
index 000000000..a9f7018cf
--- /dev/null
+++ b/mediapipe/calculators/util/rect_projection_calculator.cc
@@ -0,0 +1,100 @@
+// Copyright 2019 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+#include <cmath>
+
+#include "mediapipe/framework/calculator_framework.h"
+#include "mediapipe/framework/formats/rect.pb.h"
+
+namespace mediapipe {
+
+namespace {
+
+constexpr char kNormRectTag[] = "NORM_RECT";
+constexpr char kNormReferenceRectTag[] = "NORM_REFERENCE_RECT";
+
+}  // namespace
+
+// Projects rectangle from reference coordinate system (defined by reference
+// rectangle) to original coordinate system (in which this reference rectangle
+// is defined).
+//
+// Inputs:
+//   NORM_RECT - A NormalizedRect to be projected.
+//   NORM_REFERENCE_RECT - A NormalizedRect that represents reference coordinate
+//     system for NORM_RECT and is defined in original coordinates.
+//
+// Outputs:
+//   NORM_RECT: A NormalizedRect projected to the original coordinates.
+//
+// Example config:
+//   node {
+//     calculator: "RectProjectionCalculator"
+//     input_stream: "NORM_RECT:face_rect"
+//     input_stream: "NORM_REFERENCE_RECT:face_reference_rect"
+//     output_stream: "NORM_RECT:projected_face_rect"
+//   }
+//
+class RectProjectionCalculator : public CalculatorBase {
+ public:
+  static ::mediapipe::Status GetContract(CalculatorContract* cc);
+  ::mediapipe::Status Process(CalculatorContext* cc) override;
+};
+REGISTER_CALCULATOR(RectProjectionCalculator);
+
+::mediapipe::Status RectProjectionCalculator::GetContract(
+    CalculatorContract* cc) {
+  cc->Inputs().Tag(kNormRectTag).Set<NormalizedRect>();
+  cc->Inputs().Tag(kNormReferenceRectTag).Set<NormalizedRect>();
+  cc->Outputs().Tag(kNormRectTag).Set<NormalizedRect>();
+  return ::mediapipe::OkStatus();
+}
+
+::mediapipe::Status RectProjectionCalculator::Process(CalculatorContext* cc) {
+  // Skip this timestamp unless both the rect and its reference rect arrived.
+  if (cc->Inputs().Tag(kNormRectTag).IsEmpty() ||
+      cc->Inputs().Tag(kNormReferenceRectTag).IsEmpty()) {
+    return ::mediapipe::OkStatus();
+  }
+
+  const auto& rect = cc->Inputs().Tag(kNormRectTag).Get<NormalizedRect>();
+  const auto& reference_rect =
+      cc->Inputs().Tag(kNormReferenceRectTag).Get<NormalizedRect>();
+
+  // Project center: re-origin at the rect center (0.5, 0.5), rotate by the
+  // reference rotation, then scale and offset by the reference rect.
+  const float x = rect.x_center() - 0.5f;
+  const float y = rect.y_center() - 0.5f;
+  const float angle = reference_rect.rotation();
+  const float cos_angle = std::cos(angle);
+  const float sin_angle = std::sin(angle);
+  const float rotated_x = cos_angle * x - sin_angle * y;
+  const float rotated_y = sin_angle * x + cos_angle * y;
+
+  // Project size and rotation: dimensions scale with the reference rect and
+  // rotations add.
+  auto new_rect = absl::make_unique<NormalizedRect>();
+  new_rect->set_x_center(rotated_x * reference_rect.width() +
+                         reference_rect.x_center());
+  new_rect->set_y_center(rotated_y * reference_rect.height() +
+                         reference_rect.y_center());
+  new_rect->set_width(rect.width() * reference_rect.width());
+  new_rect->set_height(rect.height() * reference_rect.height());
+  new_rect->set_rotation(rect.rotation() + reference_rect.rotation());
+
+  cc->Outputs().Tag(kNormRectTag).Add(new_rect.release(), cc->InputTimestamp());
+
+  return ::mediapipe::OkStatus();
+}
+
+}  // namespace mediapipe
diff --git a/mediapipe/calculators/util/top_k_scores_calculator.cc b/mediapipe/calculators/util/top_k_scores_calculator.cc
index 8465c2391..1d5a8fede 100644
--- a/mediapipe/calculators/util/top_k_scores_calculator.cc
+++ b/mediapipe/calculators/util/top_k_scores_calculator.cc
@@ -21,6 +21,7 @@
 #include <utility>
 #include <vector>
 
+#include "absl/container/node_hash_map.h"
 #include "mediapipe/calculators/util/top_k_scores_calculator.pb.h"
 #include "mediapipe/framework/calculator_framework.h"
 #include "mediapipe/framework/formats/classification.pb.h"
@@ -72,7 +73,7 @@ class TopKScoresCalculator : public CalculatorBase {
 
   int top_k_ = -1;
   float threshold_ = 0.0;
-  std::unordered_map<int, std::string> label_map_;
+  absl::node_hash_map<int, std::string> label_map_;
   bool label_map_loaded_ = false;
 };
 REGISTER_CALCULATOR(TopKScoresCalculator);
diff --git a/mediapipe/docs/README.md b/mediapipe/docs/README.md
index 199643cbe..70c3d2723 100644
--- a/mediapipe/docs/README.md
+++ b/mediapipe/docs/README.md
@@ -1,2 +1,3 @@
-This directory contains the source markdown files presented on
-the [MediaPipe Read-the-Docs](https://mediapipe.readthedocs.io) documentation site.
+This directory contains legacy markdown docs referenced in external sites and blog posts, and the docs have messages to redirect users to the corresponding up-to-date docs in other locations.
+
+Source files of the up-to-date docs are in `docs` directly under root.
diff --git a/mediapipe/docs/autoflip.md b/mediapipe/docs/autoflip.md
index b250db3bf..4d7367810 100644
--- a/mediapipe/docs/autoflip.md
+++ b/mediapipe/docs/autoflip.md
@@ -1,344 +1,2 @@
-# Saliency-Aware Video Cropping using AutoFlip
-
-## Introduction
-
-AutoFlip is an automatic video cropping pipeline built on top of MediaPipe. This
-example focuses on demonstrating how to use AutoFlip to convert an input video
-to arbitrary aspect ratios.
-
-For overall context on AutoFlip, please read this
-[Google AI Blog](https://mediapipe.page.link/autoflip).
-
-![graph is_required](images/autoflip_edited_example.gif)
-
-## Building
-
-Run the following command to build the AutoFlip pipeline:
-
-Note: AutoFlip currently only works with OpenCV 3 . Please verify your OpenCV
-version beforehand.
-
-```bash
-bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 mediapipe/examples/desktop/autoflip:run_autoflip
-```
-
-## Running
-
-```bash
-GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/autoflip/run_autoflip \
-  --calculator_graph_config_file=mediapipe/examples/desktop/autoflip/autoflip_graph.pbtxt \
-  --input_side_packets=input_video_path=/absolute/path/to/the/local/video/file,output_video_path=/absolute/path/to/save/the/output/video/file,aspect_ratio=1:1
-```
-
-Use the `aspect_ratio` flag to provide the output aspect ratio. The format
-should be `width:height`, where the `width` and `height` are two positive
-integers. AutoFlip supports both landscape-to-portrait and portrait-to-landscape
-conversions. The pipeline internally compares the target aspect ratio against
-the original one, and determines the correct conversion automatically.
-
-We have put a couple test videos under this
-[Google Drive folder](https://drive.google.com/corp/drive/u/0/folders/1KK9LV--Ey0UEVpxssVLhVl7dypgJSQgk).
-You could download the videos into your local file system, then modify the
-command above accordingly to run AutoFlip against the videos.
-
-## MediaPipe Graph
-
-![graph visualization](images/autoflip_graph.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into [MediaPipe Visualizer](https://viz.mediapipe.dev).
-
-```bash
-# Autoflip graph that only renders the final cropped video. For use with
-# end user applications.
-max_queue_size: -1
-
-# VIDEO_PREP: Decodes an input video file into images and a video header.
-node {
-  calculator: "OpenCvVideoDecoderCalculator"
-  input_side_packet: "INPUT_FILE_PATH:input_video_path"
-  output_stream: "VIDEO:video_raw"
-  output_stream: "VIDEO_PRESTREAM:video_header"
-  output_side_packet: "SAVED_AUDIO_PATH:audio_path"
-}
-
-# VIDEO_PREP: Scale the input video before feature extraction.
-node {
-  calculator: "ScaleImageCalculator"
-  input_stream: "FRAMES:video_raw"
-  input_stream: "VIDEO_HEADER:video_header"
-  output_stream: "FRAMES:video_frames_scaled"
-  node_options: {
-    [type.googleapis.com/mediapipe.ScaleImageCalculatorOptions]: {
-      preserve_aspect_ratio: true
-      output_format: SRGB
-      target_width: 480
-      algorithm: DEFAULT_WITHOUT_UPSCALE
-    }
-  }
-}
-
-# VIDEO_PREP: Create a low frame rate stream for feature extraction.
-node {
-  calculator: "PacketThinnerCalculator"
-  input_stream: "video_frames_scaled"
-  output_stream: "video_frames_scaled_downsampled"
-  node_options: {
-    [type.googleapis.com/mediapipe.PacketThinnerCalculatorOptions]: {
-      thinner_type: ASYNC
-      period: 200000
-    }
-  }
-}
-
-# DETECTION: find borders around the video and major background color.
-node {
-  calculator: "BorderDetectionCalculator"
-  input_stream: "VIDEO:video_raw"
-  output_stream: "DETECTED_BORDERS:borders"
-}
-
-# DETECTION: find shot/scene boundaries on the full frame rate stream.
-node {
-  calculator: "ShotBoundaryCalculator"
-  input_stream: "VIDEO:video_frames_scaled"
-  output_stream: "IS_SHOT_CHANGE:shot_change"
-  options {
-    [type.googleapis.com/mediapipe.autoflip.ShotBoundaryCalculatorOptions] {
-      min_shot_span: 0.2
-      min_motion: 0.3
-      window_size: 15
-      min_shot_measure: 10
-      min_motion_with_shot_measure: 0.05
-    }
-  }
-}
-
-# DETECTION: find faces on the down sampled stream
-node {
-  calculator: "AutoFlipFaceDetectionSubgraph"
-  input_stream: "VIDEO:video_frames_scaled_downsampled"
-  output_stream: "DETECTIONS:face_detections"
-}
-node {
-  calculator: "FaceToRegionCalculator"
-  input_stream: "VIDEO:video_frames_scaled_downsampled"
-  input_stream: "FACES:face_detections"
-  output_stream: "REGIONS:face_regions"
-}
-
-# DETECTION: find objects on the down sampled stream
-node {
-  calculator: "AutoFlipObjectDetectionSubgraph"
-  input_stream: "VIDEO:video_frames_scaled_downsampled"
-  output_stream: "DETECTIONS:object_detections"
-}
-node {
-  calculator: "LocalizationToRegionCalculator"
-  input_stream: "DETECTIONS:object_detections"
-  output_stream: "REGIONS:object_regions"
-  options {
-    [type.googleapis.com/mediapipe.autoflip.LocalizationToRegionCalculatorOptions] {
-      output_all_signals: true
-    }
-  }
-}
-
-# SIGNAL FUSION: Combine detections (with weights) on each frame
-node {
-  calculator: "SignalFusingCalculator"
-  input_stream: "shot_change"
-  input_stream: "face_regions"
-  input_stream: "object_regions"
-  output_stream: "salient_regions"
-  options {
-    [type.googleapis.com/mediapipe.autoflip.SignalFusingCalculatorOptions] {
-      signal_settings {
-        type { standard: FACE_CORE_LANDMARKS }
-        min_score: 0.85
-        max_score: 0.9
-        is_required: false
-      }
-      signal_settings {
-        type { standard: FACE_ALL_LANDMARKS }
-        min_score: 0.8
-        max_score: 0.85
-        is_required: false
-      }
-      signal_settings {
-        type { standard: FACE_FULL }
-        min_score: 0.8
-        max_score: 0.85
-        is_required: false
-      }
-      signal_settings {
-        type: { standard: HUMAN }
-        min_score: 0.75
-        max_score: 0.8
-        is_required: false
-      }
-      signal_settings {
-        type: { standard: PET }
-        min_score: 0.7
-        max_score: 0.75
-        is_required: false
-      }
-      signal_settings {
-        type: { standard: CAR }
-        min_score: 0.7
-        max_score: 0.75
-        is_required: false
-      }
-      signal_settings {
-        type: { standard: OBJECT }
-        min_score: 0.1
-        max_score: 0.2
-        is_required: false
-      }
-    }
-  }
-}
-
-# CROPPING: make decisions about how to crop each frame.
-node {
-  calculator: "SceneCroppingCalculator"
-  input_side_packet: "EXTERNAL_ASPECT_RATIO:aspect_ratio"
-  input_stream: "VIDEO_FRAMES:video_raw"
-  input_stream: "KEY_FRAMES:video_frames_scaled_downsampled"
-  input_stream: "DETECTION_FEATURES:salient_regions"
-  input_stream: "STATIC_FEATURES:borders"
-  input_stream: "SHOT_BOUNDARIES:shot_change"
-  output_stream: "CROPPED_FRAMES:cropped_frames"
-  node_options: {
-    [type.googleapis.com/mediapipe.autoflip.SceneCroppingCalculatorOptions]: {
-      max_scene_size: 600
-      key_frame_crop_options: {
-        score_aggregation_type: CONSTANT
-      }
-      scene_camera_motion_analyzer_options: {
-        motion_stabilization_threshold_percent: 0.5
-        salient_point_bound: 0.499
-      }
-      padding_parameters: {
-        blur_cv_size: 200
-        overlay_opacity: 0.6
-      }
-      target_size_type: MAXIMIZE_TARGET_DIMENSION
-    }
-  }
-}
-
-# ENCODING(required): encode the video stream for the final cropped output.
-node {
-  calculator: "VideoPreStreamCalculator"
-  # Fetch frame format and dimension from input frames.
-  input_stream: "FRAME:cropped_frames"
-  # Copying frame rate and duration from original video.
-  input_stream: "VIDEO_PRESTREAM:video_header"
-  output_stream: "output_frames_video_header"
-}
-
-node {
-  calculator: "OpenCvVideoEncoderCalculator"
-  input_stream: "VIDEO:cropped_frames"
-  input_stream: "VIDEO_PRESTREAM:output_frames_video_header"
-  input_side_packet: "OUTPUT_FILE_PATH:output_video_path"
-  input_side_packet: "AUDIO_FILE_PATH:audio_path"
-  node_options: {
-    [type.googleapis.com/mediapipe.OpenCvVideoEncoderCalculatorOptions]: {
-      codec: "avc1"
-      video_format: "mp4"
-    }
-  }
-}
-```
-
-## Advanced Parameters
-
-### Required vs. Best-Effort Saliency Features
-
-AutoFlip allows users to implement and specify custom features to be used in the
-camera trajectory computation. If the user would like to detect and preserve
-scenes of lions in a wildlife protection video, for example, they could
-implement and add a feature detection calculator for lions into the pipeline.
-Refer to `AutoFlipFaceDetectionSubgraph` and `FaceToRegionCalculator`, or
-`AutoFlipObjectDetectionSubgraph` and `LocalizationToRegionCalculator` for
-examples of how to create new feature detection calculators.
-
-After adding different feature signals into the graph, use the
-`SignalFusingCalculator` node to specify types and weights for different feature
-signals. For example, in the graph above, we specified a `face_region` and an
-`object_region` input streams, to represent face signals and agnostic object
-signals, respectively.
-
-The larger the weight, the more important the features will be considered when
-AutoFlip computes the camera trajectory. Use the `is_required` flag to mark a
-feature as a hard constraint, in which case the computed camera trajectory will
-try best to cover these feature types in the cropped videos. If for some reason
-the required features cannot be all covered (for example, when they are too
-spread out in the video), AutoFlip will apply a padding effect to cover as much
-salient content as possible. See an illustration below.
-
-![graph is_required](images/autoflip_is_required.gif)
-
-### Stable vs Tracking Camera Motion
-
-AutoFlip makes a decision on each scene whether to have the cropped viewpoint
-follow an object or if the crop should remain stable (centered on detected
-objects). The parameter `motion_stabilization_threshold_percent` value is used
-to make the decision to track action or keep the camera stable. If, over the
-duration of the scene, all detected focus objects remain within this ratio of
-the frame (e.g. 0.5 = 50% or 1920 * .5 = 960 pixels on 1080p video) then the
-camera is held steady. Otherwise the camera tracks activity within the frame.
-
-### Snap To Center
-
-For some scenes the camera viewpoint will remain stable at the center of
-activity (see `motion_stabilization_threshold_percent` setting). In this case,
-if the determined best stable viewpoint is within
-`snap_center_max_distance_percent` of the frame's center the camera will be
-shifted to be locked to the center of the frame. This setting is useful for
-videos where the camera operator did a good job already centering content or if
-titles and logos are expected to appear in the center of the frame. It may be
-less useful on raw content where objects are not already well positioned on
-screen.
-
-### Visualization to Facilitate Debugging
-
-`SceneCroppingCalculator` provides two extra output streams
-`KEY_FRAME_CROP_REGION_VIZ_FRAMES` and `SALIENT_POINT_FRAME_VIZ_FRAMES` to
-visualize the cropping window as well as salient points detected on each frame.
-You could modify the `SceneCroppingCalculator` node like below to enable these
-two output streams.
-
-```bash
-node {
-  calculator: "SceneCroppingCalculator"
-  input_side_packet: "EXTERNAL_ASPECT_RATIO:aspect_ratio"
-  input_stream: "VIDEO_FRAMES:video_raw"
-  input_stream: "KEY_FRAMES:video_frames_scaled_downsampled"
-  input_stream: "DETECTION_FEATURES:salient_regions"
-  input_stream: "STATIC_FEATURES:borders"
-  input_stream: "SHOT_BOUNDARIES:shot_change"
-  output_stream: "CROPPED_FRAMES:cropped_frames"
-  output_stream: "KEY_FRAME_CROP_REGION_VIZ_FRAMES:key_frame_crop_viz_frames"
-  output_stream: "SALIENT_POINT_FRAME_VIZ_FRAMES:salient_point_viz_frames"
-  node_options: {
-    [type.googleapis.com/mediapipe.autoflip.SceneCroppingCalculatorOptions]: {
-      max_scene_size: 600
-      key_frame_crop_options: {
-        score_aggregation_type: CONSTANT
-      }
-      scene_camera_motion_analyzer_options: {
-        motion_stabilization_threshold_percent: 0.5
-        salient_point_bound: 0.499
-      }
-      padding_parameters: {
-        blur_cv_size: 200
-        overlay_opacity: 0.6
-      }
-      target_size_type: MAXIMIZE_TARGET_DIMENSION
-    }
-  }
-}
-```
+Content moved to
+[AutoFlip: Saliency-aware Video Cropping](https://google.github.io/mediapipe/solutions/autoflip)
diff --git a/mediapipe/docs/calculator.md b/mediapipe/docs/calculator.md
deleted file mode 100644
index 747c53037..000000000
--- a/mediapipe/docs/calculator.md
+++ /dev/null
@@ -1,164 +0,0 @@
-## Building MediaPipe Calculators
-
--   [Example calculator](#example-calculator)
-
-
-### Example calculator
-
-This section discusses the implementation of `PacketClonerCalculator`, which
-does a relatively simple job, and is used in many calculator graphs.
-`PacketClonerCalculator` simply produces a copy of its most recent input
-packets on demand.
-
-`PacketClonerCalculator` is useful when the timestamps of arriving data packets
-are not aligned perfectly. Suppose we have a room with a microphone, light
-sensor and a video camera that is collecting sensory data. Each of the sensors
-operates independently and collects data intermittently. Suppose that the output
-of each sensor is:
-
-*   microphone = loudness in decibels of sound in the room (Integer)
-*   light sensor = brightness of room (Integer)
-*   video camera = RGB image frame of room (ImageFrame)
-
-Our simple perception pipeline is designed to process sensory data from these 3
-sensors such that at any time when we have image frame data from the camera that
-is synchronized with the last collected microphone loudness data and light
-sensor brightness data. To do this with MediaPipe, our perception pipeline has 3
-input streams:
-
-*   room_mic_signal - Each packet of data in this input stream is integer data
-    representing how loud audio is in a room with timestamp.
-*   room_lightening_sensor - Each packet of data in this input stream is integer
-    data representing how bright is the room illuminated with timestamp.
-*   room_video_tick_signal - Each packet of data in this input stream is
-    imageframe of video data representing video collected from camera in the
-    room with timestamp.
-
-Below is the implementation of the `PacketClonerCalculator`.  You can see
-the `GetContract()`, `Open()`, and `Process()` methods as well as the instance
-variable `current_` which holds the most recent input packets.
-
-```c++
-// This takes packets from N+1 streams, A_1, A_2, ..., A_N, B.
-// For every packet that appears in B, outputs the most recent packet from each
-// of the A_i on a separate stream.
-
-#include <vector>
-
-#include "absl/strings/str_cat.h"
-#include "mediapipe/framework/calculator_framework.h"
-
-namespace mediapipe {
-
-// For every packet received on the last stream, output the latest packet
-// obtained on all other streams. Therefore, if the last stream outputs at a
-// higher rate than the others, this effectively clones the packets from the
-// other streams to match the last.
-//
-// Example config:
-// node {
-//   calculator: "PacketClonerCalculator"
-//   input_stream: "first_base_signal"
-//   input_stream: "second_base_signal"
-//   input_stream: "tick_signal"
-//   output_stream: "cloned_first_base_signal"
-//   output_stream: "cloned_second_base_signal"
-// }
-//
-class PacketClonerCalculator : public CalculatorBase {
- public:
-  static ::mediapipe::Status GetContract(CalculatorContract* cc) {
-    const int tick_signal_index = cc->Inputs().NumEntries() - 1;
-    // cc->Inputs().NumEntries() returns the number of input streams
-    // for the PacketClonerCalculator
-    for (int i = 0; i < tick_signal_index; ++i) {
-      cc->Inputs().Index(i).SetAny();
-      // cc->Inputs().Index(i) returns the input stream pointer by index
-      cc->Outputs().Index(i).SetSameAs(&cc->Inputs().Index(i));
-    }
-    cc->Inputs().Index(tick_signal_index).SetAny();
-    return ::mediapipe::OkStatus();
-  }
-
-  ::mediapipe::Status Open(CalculatorContext* cc) final {
-    tick_signal_index_ = cc->Inputs().NumEntries() - 1;
-    current_.resize(tick_signal_index_);
-    // Pass along the header for each stream if present.
-    for (int i = 0; i < tick_signal_index_; ++i) {
-      if (!cc->Inputs().Index(i).Header().IsEmpty()) {
-        cc->Outputs().Index(i).SetHeader(cc->Inputs().Index(i).Header());
-        // Sets the output stream of index i header to be the same as
-        // the header for the input stream of index i
-      }
-    }
-    return ::mediapipe::OkStatus();
-  }
-
-  ::mediapipe::Status Process(CalculatorContext* cc) final {
-    // Store input signals.
-    for (int i = 0; i < tick_signal_index_; ++i) {
-      if (!cc->Inputs().Index(i).Value().IsEmpty()) {
-        current_[i] = cc->Inputs().Index(i).Value();
-      }
-    }
-
-    // Output if the tick signal is non-empty.
-    if (!cc->Inputs().Index(tick_signal_index_).Value().IsEmpty()) {
-      for (int i = 0; i < tick_signal_index_; ++i) {
-        if (!current_[i].IsEmpty()) {
-          cc->Outputs().Index(i).AddPacket(
-              current_[i].At(cc->InputTimestamp()));
-          // Add a packet to output stream of index i a packet from inputstream i
-          // with timestamp common to all present inputs
-          //
-        } else {
-          cc->Outputs().Index(i).SetNextTimestampBound(
-              cc->InputTimestamp().NextAllowedInStream());
-          // if current_[i], 1 packet buffer for input stream i is empty, we will set
-          // next allowed timestamp for input stream i to be current timestamp + 1
-        }
-      }
-    }
-    return ::mediapipe::OkStatus();
-  }
-
- private:
-  std::vector<Packet> current_;
-  int tick_signal_index_;
-};
-
-REGISTER_CALCULATOR(PacketClonerCalculator);
-}  // namespace mediapipe
-```
-
-Typically, a calculator has only a .cc file. No .h is required, because
-mediapipe uses registration to make calculators known to it. After you have
-defined your calculator class, register it with a macro invocation
-REGISTER_CALCULATOR(calculator_class_name).
-
-Below is a trivial MediaPipe graph that has 3 input streams, 1 node
-(PacketClonerCalculator) and 3 output streams.
-
-```proto
-input_stream: "room_mic_signal"
-input_stream: "room_lighting_sensor"
-input_stream: "room_video_tick_signal"
-
-node {
-   calculator: "PacketClonerCalculator"
-   input_stream: "room_mic_signal"
-   input_stream: "room_lighting_sensor"
-   input_stream: "room_video_tick_signal"
-   output_stream: "cloned_room_mic_signal"
-   output_stream: "cloned_lighting_sensor"
- }
-```
-
-The diagram below shows how the `PacketClonerCalculator` defines its output
-packets based on its series of input packets.
-
-| ![Graph using PacketClonerCalculator](images/packet_cloner_calculator.png) |
-|:--:|
-| *Each time it receives a packet on its TICK input stream, the PacketClonerCalculator outputs the most recent packet from each of its input streams.  The sequence of output packets is determined by the sequene of input packets and their timestamps. The timestamps are shows along the right side of the diagram.* |
-
-
diff --git a/mediapipe/docs/cycles.md b/mediapipe/docs/cycles.md
deleted file mode 100644
index 5b43e0e8d..000000000
--- a/mediapipe/docs/cycles.md
+++ /dev/null
@@ -1,128 +0,0 @@
-# Cycles in MediaPipe Graphs
-
-<!-- TODO: add discussion of PreviousLoopbackCalculator -->
-
-[TOC]
-
-By default, MediaPipe requires calculator graphs to be acyclic and treats cycles
-in a graph as errors. If a graph is intended to have cycles, the cycles need to
-be annotated in the graph config. This page describes how to do that.
-
-NOTE: The current approach is experimental and subject to change. We welcome
-your feedback.
-
-Please use the `CalculatorGraphTest.Cycle` unit test in
-`mediapipe/framework/calculator_graph_test.cc` as sample code. Shown
-below is the cyclic graph in the test. The `sum` output of the adder is the sum
-of the integers generated by the integer source calculator.
-
-![a cyclic graph that adds a stream of integers](images/cyclic_integer_sum_graph.svg "A cyclic graph")
-
-This simple graph illustrates all the issues in supporting cyclic graphs.
-
-## Back Edge Annotation
-
-We require that an edge in each cycle be annotated as a back edge. This allows
-MediaPipe’s topological sort to work, after removing all the back edges.
-
-There are usually multiple ways to select the back edges. Which edges are marked
-as back edges affects which nodes are considered as upstream and which nodes are
-considered as downstream, which in turn affects the priorities MediaPipe assigns
-to the nodes.
-
-For example, the `CalculatorGraphTest.Cycle` test marks the `old_sum` edge as a
-back edge, so the Delay node is considered as a downstream node of the adder
-node and is given a higher priority. Alternatively, we could mark the `sum`
-input to the delay node as the back edge, in which case the delay node would be
-considered as an upstream node of the adder node and is given a lower priority.
-
-## Initial Packet
-
-For the adder calculator to be runnable when the first integer from the integer
-source arrives, we need an initial packet, with value 0 and with the same
-timestamp, on the `old_sum` input stream to the adder. This initial packet
-should be output by the delay calculator in the `Open()` method.
-
-## Delay in a Loop
-
-Each loop should incur a delay to align the previous `sum` output with the next
-integer input. This is also done by the delay node. So the delay node needs to
-know the following about the timestamps of the integer source calculator:
-
-*   The timestamp of the first output.
-
-*   The timestamp delta between successive outputs.
-
-We plan to add an alternative scheduling policy that only cares about packet
-ordering and ignores packet timestamps, which will eliminate this inconvenience.
-
-## Early Termination of a Calculator When One Input Stream is Done
-
-By default, MediaPipe calls the `Close()` method of a non-source calculator when
-all of its input streams are done. In the example graph, we want to stop the
-adder node as soon as the integer source is done. This is accomplished by
-configuring the adder node with an alternative input stream handler,
-`EarlyCloseInputStreamHandler`.
-
-## Relevant Source Code
-
-### Delay Calculator
-
-Note the code in `Open()` that outputs the initial packet and the code in
-`Process()` that adds a (unit) delay to input packets. As noted above, this
-delay node assumes that its output stream is used alongside an input stream with
-packet timestamps 0, 1, 2, 3, ...
-
-```c++
-class UnitDelayCalculator : public Calculator {
- public:
-  static ::util::Status FillExpectations(
-      const CalculatorOptions& extendable_options, PacketTypeSet* inputs,
-      PacketTypeSet* outputs, PacketTypeSet* input_side_packets) {
-    inputs->Index(0)->Set<int>("An integer.");
-    outputs->Index(0)->Set<int>("The input delayed by one time unit.");
-    return ::mediapipe::OkStatus();
-  }
-
-  ::util::Status Open() final {
-    Output()->Add(new int(0), Timestamp(0));
-    return ::mediapipe::OkStatus();
-  }
-
-  ::util::Status Process() final {
-    const Packet& packet = Input()->Value();
-    Output()->AddPacket(packet.At(packet.Timestamp().NextAllowedInStream()));
-    return ::mediapipe::OkStatus();
-  }
-};
-```
-
-### Graph Config
-
-Note the `back_edge` annotation and the alternative `input_stream_handler`.
-
-```proto
-node {
-  calculator: 'GlobalCountSourceCalculator'
-  input_side_packet: 'global_counter'
-  output_stream: 'integers'
-}
-node {
-  calculator: 'IntAdderCalculator'
-  input_stream: 'integers'
-  input_stream: 'old_sum'
-  input_stream_info: {
-    tag_index: ':1'  # 'old_sum'
-    back_edge: true
-  }
-  output_stream: 'sum'
-  input_stream_handler {
-    input_stream_handler: 'EarlyCloseInputStreamHandler'
-  }
-}
-node {
-  calculator: 'UnitDelayCalculator'
-  input_stream: 'sum'
-  output_stream: 'old_sum'
-}
-```
diff --git a/mediapipe/docs/examples.md b/mediapipe/docs/examples.md
deleted file mode 100644
index d3a004d62..000000000
--- a/mediapipe/docs/examples.md
+++ /dev/null
@@ -1,238 +0,0 @@
-# Examples
-
-Below are code samples on how to run MediaPipe on both mobile and desktop. We
-currently support MediaPipe APIs on mobile for Android only but will add support
-for Objective-C shortly.
-
-## Mobile
-
-### Hello World! on Android
-
-[Hello World! on Android](./hello_world_android.md) should be the first mobile
-Android example users go through in detail. It teaches the following:
-
-*   Introduction of a simple MediaPipe graph running on mobile GPUs for
-    [Sobel edge detection](https://en.wikipedia.org/wiki/Sobel_operator).
-*   Building a simple baseline Android application that displays "Hello World!".
-*   Adding camera preview support into the baseline application using the
-    Android [CameraX] API.
-*   Incorporating the Sobel edge detection graph to process the live camera
-    preview and display the processed video in real-time.
-
-### Hello World! on iOS
-
-[Hello World! on iOS](./hello_world_ios.md) is the iOS version of Sobel edge
-detection example.
-
-### Object Detection with GPU
-
-[Object Detection with GPU](./object_detection_mobile_gpu.md) illustrates how to
-use MediaPipe with a TFLite model for object detection in a GPU-accelerated
-pipeline.
-
-*   [Android](./object_detection_mobile_gpu.md)
-*   [iOS](./object_detection_mobile_gpu.md)
-
-### Object Detection with CPU
-
-[Object Detection with CPU](./object_detection_mobile_cpu.md) illustrates using
-the same TFLite model in a CPU-based pipeline. This example highlights how
-graphs can be easily adapted to run on CPU v.s. GPU.
-
-### Object Detection and Tracking with GPU
-
-[Object Detection and Tracking with GPU](./object_tracking_mobile_gpu.md) illustrates how to
-use MediaPipe for object detection and tracking.
-
-### Objectron: 3D Object Detection and Tracking with GPU
-
-[MediaPipe Objectron is 3D Object Detection with GPU](./objectron_mobile_gpu.md)
-illustrates mobile real-time 3D object detection and tracking pipeline for every
-day objects like shoes and chairs
-
-*   [Android](./objectron_mobile_gpu.md)
-
-### Face Detection with GPU
-
-[Face Detection with GPU](./face_detection_mobile_gpu.md) illustrates how to use
-MediaPipe with a TFLite model for face detection in a GPU-accelerated pipeline.
-The selfie face detection TFLite model is based on
-["BlazeFace: Sub-millisecond Neural Face Detection on Mobile GPUs"](https://sites.google.com/view/perception-cv4arvr/blazeface),
-and model details are described in the
-[model card](https://sites.google.com/corp/view/perception-cv4arvr/blazeface#h.p_21ojPZDx3cqq).
-
-*   [Android](./face_detection_mobile_gpu.md)
-*   [iOS](./face_detection_mobile_gpu.md)
-
-### Face Detection with CPU
-
-[Face Detection with CPU](./face_detection_mobile_cpu.md) illustrates using the
-same TFLite model in a CPU-based pipeline. This example highlights how graphs
-can be easily adapted to run on CPU v.s. GPU.
-
-*   [Android](./face_detection_mobile_cpu.md)
-*   [iOS](./face_detection_mobile_cpu.md)
-
-### Face Mesh with GPU
-
-[Face Mesh with GPU](./face_mesh_mobile_gpu.md) illustrates how to run the
-MediaPipe Face Mesh pipeline to perform 3D face landmark estimation in real-time
-on mobile devices, utilizing GPU acceleration. The pipeline is based on
-["Real-time Facial Surface Geometry from Monocular Video on Mobile GPUs"](https://arxiv.org/abs/1907.06724),
-and details of the underlying ML models are described in the
-[model card](https://drive.google.com/file/d/1VFC_wIpw4O7xBOiTgUldl79d9LA-LsnA/view).
-
-*   [Android](./face_mesh_mobile_gpu.md)
-*   [iOS](./face_mesh_mobile_gpu.md)
-
-### Hand Detection with GPU
-
-[Hand Detection with GPU](./hand_detection_mobile_gpu.md) illustrates how to use
-MediaPipe with a TFLite model for hand detection in a GPU-accelerated pipeline.
-
-*   [Android](./hand_detection_mobile_gpu.md)
-*   [iOS](./hand_detection_mobile_gpu.md)
-
-### Hand Tracking with GPU
-
-[Hand Tracking with GPU](./hand_tracking_mobile_gpu.md) illustrates how to use
-MediaPipe with TFLite models for hand tracking in a GPU-accelerated pipeline.
-
-*   [Android](./hand_tracking_mobile_gpu.md)
-*   [iOS](./hand_tracking_mobile_gpu.md)
-
-### Multi-Hand Tracking with GPU
-
-[Multi-Hand Tracking with GPU](./multi_hand_tracking_mobile_gpu.md) illustrates
-how to use MediaPipe with TFLite models for multi-hand tracking in a
-GPU-accelerated pipeline.
-
-*   [Android](./multi_hand_tracking_mobile_gpu.md)
-*   [iOS](./multi_hand_tracking_mobile_gpu.md)
-
-### Hair Segmentation with GPU
-
-[Hair Segmentation on GPU](./hair_segmentation_mobile_gpu.md) illustrates how to
-use MediaPipe with a TFLite model for hair segmentation in a GPU-accelerated
-pipeline. The selfie hair segmentation TFLite model is based on
-["Real-time Hair segmentation and recoloring on Mobile GPUs"](https://sites.google.com/view/perception-cv4arvr/hair-segmentation),
-and model details are described in the
-[model card](https://sites.google.com/corp/view/perception-cv4arvr/hair-segmentation#h.p_NimuO7PgHxlY).
-
-*   [Android](./hair_segmentation_mobile_gpu.md)
-
-### Template Matching using KNIFT with CPU
-
-[Template Matching using KNIFT on Mobile](./template_matching_mobile_cpu.md)
-shows how to use MediaPipe with TFLite model for template matching using Knift
-on mobile using CPU.
-
-*   [Android](./template_matching_mobile_cpu.md)
-
-## Desktop
-
-### Hello World for C++
-
-[Hello World for C++](./hello_world_desktop.md) shows how to run a simple graph
-using the MediaPipe C++ APIs.
-
-### Feature Extraction and Model Inference for YouTube-8M Challenge
-
-[Feature Extraction and Model Inference for YouTube-8M Challenge](./youtube_8m.md)
-shows how to use MediaPipe to prepare training data for the YouTube-8M Challenge
-and do the model inference with the baseline model.
-
-### Preparing Data Sets with MediaSequence
-
-[Preparing Data Sets with MediaSequence](./media_sequence.md) shows how to use
-MediaPipe for media processing to prepare video data sets for training a
-TensorFlow model.
-
-### AutoFlip - Automatic video cropping
-
-[AutoFlip](./autoflip.md) shows how to use MediaPipe to build an automatic video
-cropping pipeline that can convert an input video to arbitrary aspect ratios.
-
-### Object Detection on Desktop
-
-[Object Detection on Desktop](./object_detection_desktop.md) shows how to run
-object detection models (TensorFlow and TFLite) using the MediaPipe C++ APIs.
-
-[Sobel edge detection]:https://en.wikipedia.org/wiki/Sobel_operator
-[CameraX]:https://developer.android.com/training/camerax
-
-### Face Detection on Desktop with Webcam
-
-[Face Detection on Desktop with Webcam](./face_detection_desktop.md) shows how
-to use MediaPipe with a TFLite model for face detection on desktop using CPU or
-GPU with live video from a webcam.
-
-*   [Desktop GPU](./face_detection_desktop.md)
-*   [Desktop CPU](./face_detection_desktop.md)
-
-### Face Mesh on Desktop with Webcam
-
-[Face Mesh on Desktop with Webcam](./face_mesh_desktop.md) shows how to run the
-MediaPipe Face Mesh pipeline to perform 3D face landmark estimation in real-time
-on desktop with webcam input.
-
-*   [Desktop GPU](./face_mesh_desktop.md)
-*   [Desktop CPU](./face_mesh_desktop.md)
-
-### Hand Tracking on Desktop with Webcam
-
-[Hand Tracking on Desktop with Webcam](./hand_tracking_desktop.md) shows how to
-use MediaPipe with TFLite models for hand tracking on desktop using CPU or GPU
-with live video from a webcam.
-
-*   [Desktop GPU](./hand_tracking_desktop.md)
-*   [Desktop CPU](./hand_tracking_desktop.md)
-
-### Multi-Hand Tracking on Desktop with Webcam
-
-[Multi-Hand Tracking on Desktop with Webcam](./multi_hand_tracking_desktop.md)
-shows how to use MediaPipe with TFLite models for multi-hand tracking on desktop
-using CPU or GPU with live video from a webcam.
-
-*   [Desktop GPU](./multi_hand_tracking_desktop.md)
-*   [Desktop CPU](./multi_hand_tracking_desktop.md)
-
-### Hair Segmentation on Desktop with Webcam
-
-[Hair Segmentation on Desktop with Webcam](./hair_segmentation_desktop.md) shows
-how to use MediaPipe with a TFLite model for hair segmentation on desktop using
-GPU with live video from a webcam.
-
-*   [Desktop GPU](./hair_segmentation_desktop.md)
-
-## Google Coral (ML acceleration with Google EdgeTPU)
-
-Below are code samples on how to run MediaPipe on Google Coral Dev Board.
-
-### Object Detection on Coral
-
-[Object Detection on Coral with Webcam](./object_detection_coral_devboard.md)
-shows how to run quantized object detection TFlite model accelerated with
-EdgeTPU on
-[Google Coral Dev Board](https://coral.withgoogle.com/products/dev-board).
-
-### Face Detection on Coral
-
-[Face Detection on Coral with Webcam](./face_detection_coral_devboard.md) shows
-how to use quantized face detection TFlite model accelerated with EdgeTPU on
-[Google Coral Dev Board](https://coral.withgoogle.com/products/dev-board).
-
-
-## Web Browser
-
-Below are samples that can directly be run in your web browser.
-See more details in [MediaPipe on the Web](./web.md) and
-[Google Developer blog post](https://mediapipe.page.link/webdevblog)
-
-### [Face Detection In Browser](https://viz.mediapipe.dev/demo/face_detection)
-
-### [Hand Detection In Browser](https://viz.mediapipe.dev/demo/hand_detection)
-
-### [Hand Tracking In Browser](https://viz.mediapipe.dev/demo/hand_tracking)
-
-### [Hair Segmentation In Browser](https://viz.mediapipe.dev/demo/hair_segmentation)
diff --git a/mediapipe/docs/face_detection_coral_devboard.md b/mediapipe/docs/face_detection_coral_devboard.md
deleted file mode 100644
index c4ac47972..000000000
--- a/mediapipe/docs/face_detection_coral_devboard.md
+++ /dev/null
@@ -1,23 +0,0 @@
-## Face Detection on Coral with Webcam
-
-MediaPipe is able to run cross platform across device types like desktop, mobile
-and edge devices. Here is an example of running MediaPipe
-[face detection pipeline](./face_detection_desktop.md) on edge device like the
-[Coral Dev Board](https://coral.ai/products/dev-board).
-
-This MediaPipe Coral face
-detection pipeline is running [coral specific quantized version](https://github.com/google/mediapipe/blob/master/mediapipe/examples/coral/models/face-detector-quantized_edgetpu.tflite)
-of the [MediaPipe face detection TFLite model](https://github.com/google/mediapipe/blob/master/mediapipe/models/face_detection_front.tflite)
-accelerated on Edge TPU.
-
-### Cross compilation of MediaPipe Coral binaries in Docker
-
-We recommend building the MediaPipe binaries not on the edge device due to
-limited compute resulting in long build times. Instead, we will build MediaPipe
-binaries using Docker containers on a more powerful host machine.
-
-For step by
-step details of cross compiling and running MediaPipe binaries on the Coral Dev
-Board, please refer to [README.md in MediaPipe Coral example folder](https://github.com/google/mediapipe/tree/master/mediapipe/examples/coral).
-
-![Face Detection running on Coral](images/face_detection_demo_coral.gif)
diff --git a/mediapipe/docs/face_detection_desktop.md b/mediapipe/docs/face_detection_desktop.md
index 30fe2a2aa..8723faeb1 100644
--- a/mediapipe/docs/face_detection_desktop.md
+++ b/mediapipe/docs/face_detection_desktop.md
@@ -1,264 +1,2 @@
-## Face Detection on Desktop
-
-This is an example of using MediaPipe to run face detection models (TensorFlow
-Lite) and render bounding boxes on the detected faces. To know more about the
-face detection models, please refer to the model [`README file`]. Moreover, if
-you are interested in running the same TensorfFlow Lite model on Android/iOS,
-please see the
-[Face Detection on GPU on Android/iOS](face_detection_mobile_gpu.md) and
-[Face Detection on CPU on Android/iOS](face_detection_mobile_cpu.md) examples.
-
-We show the face detection demos with TensorFlow Lite model using the Webcam:
-
--   [TensorFlow Lite Face Detection Demo with Webcam (CPU)](#tensorflow-lite-face-detection-demo-with-webcam-cpu)
-
--   [TensorFlow Lite Face Detection Demo with Webcam (GPU)](#tensorflow-lite-face-detection-demo-with-webcam-gpu)
-
-Note: If MediaPipe depends on OpenCV 2, please see the
-[known issues with OpenCV 2](./object_detection_desktop.md#known-issues-with-opencv-2)
-section.
-
-### TensorFlow Lite Face Detection Demo with Webcam (CPU)
-
-To build and run the TensorFlow Lite example on desktop (CPU) with Webcam, run:
-
-```bash
-# Video from webcam running on desktop CPU
-$ bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 \
-    mediapipe/examples/desktop/face_detection:face_detection_cpu
-
-# It should print:
-# Target //mediapipe/examples/desktop/face_detection:face_detection_cpu up-to-date:
-#   bazel-bin/mediapipe/examples/desktop/face_detection/face_detection_cpu
-# INFO: Elapsed time: 36.417s, Critical Path: 23.22s
-# INFO: 711 processes: 710 linux-sandbox, 1 local.
-# INFO: Build completed successfully, 734 total actions
-
-# This will open up your webcam as long as it is connected and on
-# Any errors is likely due to your webcam being not accessible
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/face_detection/face_detection_cpu \
-    --calculator_graph_config_file=mediapipe/graphs/face_detection/face_detection_desktop_live.pbtxt
-```
-
-### TensorFlow Lite Face Detection Demo with Webcam (GPU)
-
-Note: This currently works only on Linux, and please first follow
-[OpenGL ES Setup on Linux Desktop](./gpu.md#opengl-es-setup-on-linux-desktop).
-
-To build and run the TensorFlow Lite example on desktop (GPU) with Webcam, run:
-
-```bash
-# Video from webcam running on desktop GPU
-# This works only for Linux currently
-$ bazel build -c opt --copt -DMESA_EGL_NO_X11_HEADERS --copt -DEGL_NO_X11 \
-    mediapipe/examples/desktop/face_detection:face_detection_gpu
-
-# It should print:
-# Target //mediapipe/examples/desktop/face_detection:face_detection_gpu up-to-date:
-#   bazel-bin/mediapipe/examples/desktop/face_detection/face_detection_gpu
-# INFO: Elapsed time: 36.417s, Critical Path: 23.22s
-# INFO: 711 processes: 710 linux-sandbox, 1 local.
-# INFO: Build completed successfully, 734 total actions
-
-# This will open up your webcam as long as it is connected and on
-# Any errors is likely due to your webcam being not accessible,
-# or GPU drivers not setup properly.
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/face_detection/face_detection_gpu \
-    --calculator_graph_config_file=mediapipe/graphs/face_detection/face_detection_mobile_gpu.pbtxt
-```
-
-#### Graph
-
-![graph visualization](images/face_detection_desktop.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into
-[MediaPipe Visualizer](https://viz.mediapipe.dev).
-
-```bash
-# MediaPipe graph that performs face detection with TensorFlow Lite on CPU & GPU.
-# Used in the examples in
-# mediapipe/examples/desktop/face_detection:face_detection_cpu.
-
-# Images on CPU coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Throttles the images flowing downstream for flow control. It passes through
-# the very first incoming image unaltered, and waits for
-# TfLiteTensorsToDetectionsCalculator downstream in the graph to finish
-# generating the corresponding detections before it passes through another
-# image. All images that come in while waiting are dropped, limiting the number
-# of in-flight images between this calculator and
-# TfLiteTensorsToDetectionsCalculator to 1. This prevents the nodes in between
-# from queuing up incoming images and data excessively, which leads to increased
-# latency and memory usage, unwanted in real-time mobile applications. It also
-# eliminates unnecessarily computation, e.g., a transformed image produced by
-# ImageTransformationCalculator may get dropped downstream if the subsequent
-# TfLiteConverterCalculator or TfLiteInferenceCalculator is still busy
-# processing previous inputs.
-node {
-  calculator: "FlowLimiterCalculator"
-  input_stream: "input_video"
-  input_stream: "FINISHED:detections"
-  input_stream_info: {
-    tag_index: "FINISHED"
-    back_edge: true
-  }
-  output_stream: "throttled_input_video"
-}
-
-# Transforms the input image on CPU to a 128x128 image. To scale the input
-# image, the scale_mode option is set to FIT to preserve the aspect ratio,
-# resulting in potential letterboxing in the transformed image.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE:throttled_input_video"
-  output_stream: "IMAGE:transformed_input_video_cpu"
-  output_stream: "LETTERBOX_PADDING:letterbox_padding"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 128
-      output_height: 128
-      scale_mode: FIT
-    }
-  }
-}
-
-# Converts the transformed input image on CPU into an image tensor stored as a
-# TfLiteTensor.
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE:transformed_input_video_cpu"
-  output_stream: "TENSORS:image_tensor"
-}
-
-# Runs a TensorFlow Lite model on CPU that takes an image tensor and outputs a
-# vector of tensors representing, for instance, detection boxes/keypoints and
-# scores.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS:image_tensor"
-  output_stream: "TENSORS:detection_tensors"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "mediapipe/models/face_detection_front.tflite"
-    }
-  }
-}
-
-# Generates a single side packet containing a vector of SSD anchors based on
-# the specification in the options.
-node {
-  calculator: "SsdAnchorsCalculator"
-  output_side_packet: "anchors"
-  node_options: {
-    [type.googleapis.com/mediapipe.SsdAnchorsCalculatorOptions] {
-      num_layers: 4
-      min_scale: 0.1484375
-      max_scale: 0.75
-      input_size_height: 128
-      input_size_width: 128
-      anchor_offset_x: 0.5
-      anchor_offset_y: 0.5
-      strides: 8
-      strides: 16
-      strides: 16
-      strides: 16
-      aspect_ratios: 1.0
-      fixed_anchor_size: true
-    }
-  }
-}
-
-# Decodes the detection tensors generated by the TensorFlow Lite model, based on
-# the SSD anchors and the specification in the options, into a vector of
-# detections. Each detection describes a detected object.
-node {
-  calculator: "TfLiteTensorsToDetectionsCalculator"
-  input_stream: "TENSORS:detection_tensors"
-  input_side_packet: "ANCHORS:anchors"
-  output_stream: "DETECTIONS:detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToDetectionsCalculatorOptions] {
-      num_classes: 1
-      num_boxes: 896
-      num_coords: 16
-      box_coord_offset: 0
-      keypoint_coord_offset: 4
-      num_keypoints: 6
-      num_values_per_keypoint: 2
-      sigmoid_score: true
-      score_clipping_thresh: 100.0
-      reverse_output_order: true
-      x_scale: 128.0
-      y_scale: 128.0
-      h_scale: 128.0
-      w_scale: 128.0
-      min_score_thresh: 0.75
-    }
-  }
-}
-
-# Performs non-max suppression to remove excessive detections.
-node {
-  calculator: "NonMaxSuppressionCalculator"
-  input_stream: "detections"
-  output_stream: "filtered_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.NonMaxSuppressionCalculatorOptions] {
-      min_suppression_threshold: 0.3
-      overlap_type: INTERSECTION_OVER_UNION
-      algorithm: WEIGHTED
-      return_empty_detections: true
-    }
-  }
-}
-
-# Maps detection label IDs to the corresponding label text ("Face"). The label
-# map is provided in the label_map_path option.
-node {
-  calculator: "DetectionLabelIdToTextCalculator"
-  input_stream: "filtered_detections"
-  output_stream: "labeled_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionLabelIdToTextCalculatorOptions] {
-      label_map_path: "mediapipe/models/face_detection_front_labelmap.txt"
-    }
-  }
-}
-
-# Adjusts detection locations (already normalized to [0.f, 1.f]) on the
-# letterboxed image (after image transformation with the FIT scale mode) to the
-# corresponding locations on the same image with the letterbox removed (the
-# input image to the graph before image transformation).
-node {
-  calculator: "DetectionLetterboxRemovalCalculator"
-  input_stream: "DETECTIONS:labeled_detections"
-  input_stream: "LETTERBOX_PADDING:letterbox_padding"
-  output_stream: "DETECTIONS:output_detections"
-}
-
-# Converts the detections to drawing primitives for annotation overlay.
-node {
-  calculator: "DetectionsToRenderDataCalculator"
-  input_stream: "DETECTIONS:output_detections"
-  output_stream: "RENDER_DATA:render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRenderDataCalculatorOptions] {
-      thickness: 4.0
-      color { r: 255 g: 0 b: 0 }
-    }
-  }
-}
-
-# Draws annotations and overlays them on top of the input images.
-node {
-  calculator: "AnnotationOverlayCalculator"
-  input_stream: "IMAGE:throttled_input_video"
-  input_stream: "render_data"
-  output_stream: "IMAGE:output_video"
-}
-```
-
-[`README file`]:https://github.com/google/mediapipe/tree/master/mediapipe/models/object_detection_saved_model/README.md
+Content moved to
+[MediaPipe Face Detection](https://google.github.io/mediapipe/solutions/face_detection)
diff --git a/mediapipe/docs/face_detection_mobile_cpu.md b/mediapipe/docs/face_detection_mobile_cpu.md
deleted file mode 100644
index 4102a22b9..000000000
--- a/mediapipe/docs/face_detection_mobile_cpu.md
+++ /dev/null
@@ -1,246 +0,0 @@
-# Face Detection (CPU)
-
-This doc focuses on the
-[example graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_detection/face_detection_mobile_cpu.pbtxt)
-that performs face detection with TensorFlow Lite on CPU.
-
-![face_detection_android_gpu_gif](images/mobile/face_detection_android_gpu.gif)
-
-## Android
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectioncpu)
-
-To build and install the app:
-
-```bash
-bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectioncpu
-adb install bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectioncpu/facedetectioncpu.apk
-```
-
-## iOS
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/facedetectioncpu).
-
-See the general [instructions](./building_examples.md#ios) for building iOS
-examples and generating an Xcode project. This will be the FaceDetectionCpuApp
-target.
-
-To build on the command line:
-
-```bash
-bazel build -c opt --config=ios_arm64 mediapipe/examples/ios/facedetectioncpu:FaceDetectionCpuApp
-```
-
-## Graph
-
-![face_detection_mobile_cpu_graph](images/mobile/face_detection_mobile_cpu.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into [MediaPipe Visualizer](https://viz.mediapipe.dev/).
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_detection/face_detection_mobile_cpu.pbtxt)
-
-```bash
-# MediaPipe graph that performs face detection with TensorFlow Lite on CPU.
-# Used in the examples in
-# mediapipie/examples/android/src/java/com/mediapipe/apps/facedetectioncpu and
-# mediapipie/examples/ios/facedetectioncpu.
-
-# Images on GPU coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Throttles the images flowing downstream for flow control. It passes through
-# the very first incoming image unaltered, and waits for
-# TfLiteTensorsToDetectionsCalculator downstream in the graph to finish
-# generating the corresponding detections before it passes through another
-# image. All images that come in while waiting are dropped, limiting the number
-# of in-flight images between this calculator and
-# TfLiteTensorsToDetectionsCalculator to 1. This prevents the nodes in between
-# from queuing up incoming images and data excessively, which leads to increased
-# latency and memory usage, unwanted in real-time mobile applications. It also
-# eliminates unnecessarily computation, e.g., a transformed image produced by
-# ImageTransformationCalculator may get dropped downstream if the subsequent
-# TfLiteConverterCalculator or TfLiteInferenceCalculator is still busy
-# processing previous inputs.
-node {
-  calculator: "FlowLimiterCalculator"
-  input_stream: "input_video"
-  input_stream: "FINISHED:detections"
-  input_stream_info: {
-    tag_index: "FINISHED"
-    back_edge: true
-  }
-  output_stream: "throttled_input_video"
-}
-
-# Transfers the input image from GPU to CPU memory for the purpose of
-# demonstrating a CPU-based pipeline. Note that the input image on GPU has the
-# origin defined at the bottom-left corner (OpenGL convention). As a result,
-# the transferred image on CPU also shares the same representation.
-node: {
-  calculator: "GpuBufferToImageFrameCalculator"
-  input_stream: "throttled_input_video"
-  output_stream: "input_video_cpu"
-}
-
-# Transforms the input image on CPU to a 128x128 image. To scale the input
-# image, the scale_mode option is set to FIT to preserve the aspect ratio,
-# resulting in potential letterboxing in the transformed image.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE:input_video_cpu"
-  output_stream: "IMAGE:transformed_input_video_cpu"
-  output_stream: "LETTERBOX_PADDING:letterbox_padding"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 128
-      output_height: 128
-      scale_mode: FIT
-    }
-  }
-}
-
-# Converts the transformed input image on CPU into an image tensor stored as a
-# TfLiteTensor.
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE:transformed_input_video_cpu"
-  output_stream: "TENSORS:image_tensor"
-}
-
-# Runs a TensorFlow Lite model on CPU that takes an image tensor and outputs a
-# vector of tensors representing, for instance, detection boxes/keypoints and
-# scores.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS:image_tensor"
-  output_stream: "TENSORS:detection_tensors"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "mediapipe/models/face_detection_front.tflite"
-    }
-  }
-}
-
-# Generates a single side packet containing a vector of SSD anchors based on
-# the specification in the options.
-node {
-  calculator: "SsdAnchorsCalculator"
-  output_side_packet: "anchors"
-  node_options: {
-    [type.googleapis.com/mediapipe.SsdAnchorsCalculatorOptions] {
-      num_layers: 4
-      min_scale: 0.1484375
-      max_scale: 0.75
-      input_size_height: 128
-      input_size_width: 128
-      anchor_offset_x: 0.5
-      anchor_offset_y: 0.5
-      strides: 8
-      strides: 16
-      strides: 16
-      strides: 16
-      aspect_ratios: 1.0
-      fixed_anchor_size: true
-    }
-  }
-}
-
-# Decodes the detection tensors generated by the TensorFlow Lite model, based on
-# the SSD anchors and the specification in the options, into a vector of
-# detections. Each detection describes a detected object.
-node {
-  calculator: "TfLiteTensorsToDetectionsCalculator"
-  input_stream: "TENSORS:detection_tensors"
-  input_side_packet: "ANCHORS:anchors"
-  output_stream: "DETECTIONS:detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToDetectionsCalculatorOptions] {
-      num_classes: 1
-      num_boxes: 896
-      num_coords: 16
-      box_coord_offset: 0
-      keypoint_coord_offset: 4
-      num_keypoints: 6
-      num_values_per_keypoint: 2
-      sigmoid_score: true
-      score_clipping_thresh: 100.0
-      reverse_output_order: true
-      x_scale: 128.0
-      y_scale: 128.0
-      h_scale: 128.0
-      w_scale: 128.0
-      min_score_thresh: 0.75
-    }
-  }
-}
-
-# Performs non-max suppression to remove excessive detections.
-node {
-  calculator: "NonMaxSuppressionCalculator"
-  input_stream: "detections"
-  output_stream: "filtered_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.NonMaxSuppressionCalculatorOptions] {
-      min_suppression_threshold: 0.3
-      overlap_type: INTERSECTION_OVER_UNION
-      algorithm: WEIGHTED
-      return_empty_detections: true
-    }
-  }
-}
-
-# Maps detection label IDs to the corresponding label text ("Face"). The label
-# map is provided in the label_map_path option.
-node {
-  calculator: "DetectionLabelIdToTextCalculator"
-  input_stream: "filtered_detections"
-  output_stream: "labeled_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionLabelIdToTextCalculatorOptions] {
-      label_map_path: "mediapipe/models/face_detection_front_labelmap.txt"
-    }
-  }
-}
-
-# Adjusts detection locations (already normalized to [0.f, 1.f]) on the
-# letterboxed image (after image transformation with the FIT scale mode) to the
-# corresponding locations on the same image with the letterbox removed (the
-# input image to the graph before image transformation).
-node {
-  calculator: "DetectionLetterboxRemovalCalculator"
-  input_stream: "DETECTIONS:labeled_detections"
-  input_stream: "LETTERBOX_PADDING:letterbox_padding"
-  output_stream: "DETECTIONS:output_detections"
-}
-
-# Converts the detections to drawing primitives for annotation overlay.
-node {
-  calculator: "DetectionsToRenderDataCalculator"
-  input_stream: "DETECTIONS:output_detections"
-  output_stream: "RENDER_DATA:render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRenderDataCalculatorOptions] {
-      thickness: 4.0
-      color { r: 255 g: 0 b: 0 }
-    }
-  }
-}
-
-# Draws annotations and overlays them on top of the input images.
-node {
-  calculator: "AnnotationOverlayCalculator"
-  input_stream: "IMAGE:input_video_cpu"
-  input_stream: "render_data"
-  output_stream: "IMAGE:output_video_cpu"
-}
-
-# Transfers the annotated image from CPU back to GPU memory, to be sent out of
-# the graph.
-node: {
-  calculator: "ImageFrameToGpuBufferCalculator"
-  input_stream: "output_video_cpu"
-  output_stream: "output_video"
-}
-```
diff --git a/mediapipe/docs/face_detection_mobile_gpu.md b/mediapipe/docs/face_detection_mobile_gpu.md
index b99350e94..8723faeb1 100644
--- a/mediapipe/docs/face_detection_mobile_gpu.md
+++ b/mediapipe/docs/face_detection_mobile_gpu.md
@@ -1,228 +1,2 @@
-# Face Detection (GPU)
-
-This doc focuses on the
-[example graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_detection/face_detection_mobile_gpu.pbtxt)
-that performs face detection with TensorFlow Lite on GPU.
-
-![face_detection_android_gpu_gif](images/mobile/face_detection_android_gpu.gif)
-
-## Android
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectiongpu)
-
-To build and install the app:
-
-```bash
-bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectiongpu
-adb install bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectiongpu/facedetectiongpu.apk
-```
-
-## iOS
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/facedetectiongpu).
-
-See the general [instructions](./building_examples.md#ios) for building iOS
-examples and generating an Xcode project. This will be the FaceDetectionGpuApp
-target.
-
-To build on the command line:
-
-```bash
-bazel build -c opt --config=ios_arm64 mediapipe/examples/ios/facedetectiongpu:FaceDetectionGpuApp
-```
-
-## Graph
-
-![face_detection_mobile_gpu_graph](images/mobile/face_detection_mobile_gpu.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into [MediaPipe Visualizer](https://viz.mediapipe.dev/).
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_detection/face_detection_mobile_gpu.pbtxt)
-
-```bash
-# MediaPipe graph that performs face detection with TensorFlow Lite on GPU.
-# Used in the examples in
-# mediapipie/examples/android/src/java/com/mediapipe/apps/facedetectiongpu and
-# mediapipie/examples/ios/facedetectiongpu.
-
-# Images on GPU coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Throttles the images flowing downstream for flow control. It passes through
-# the very first incoming image unaltered, and waits for
-# TfLiteTensorsToDetectionsCalculator downstream in the graph to finish
-# generating the corresponding detections before it passes through another
-# image. All images that come in while waiting are dropped, limiting the number
-# of in-flight images between this calculator and
-# TfLiteTensorsToDetectionsCalculator to 1. This prevents the nodes in between
-# from queuing up incoming images and data excessively, which leads to increased
-# latency and memory usage, unwanted in real-time mobile applications. It also
-# eliminates unnecessarily computation, e.g., a transformed image produced by
-# ImageTransformationCalculator may get dropped downstream if the subsequent
-# TfLiteConverterCalculator or TfLiteInferenceCalculator is still busy
-# processing previous inputs.
-node {
-  calculator: "FlowLimiterCalculator"
-  input_stream: "input_video"
-  input_stream: "FINISHED:detections"
-  input_stream_info: {
-    tag_index: "FINISHED"
-    back_edge: true
-  }
-  output_stream: "throttled_input_video"
-}
-
-# Transforms the input image on GPU to a 128x128 image. To scale the input
-# image, the scale_mode option is set to FIT to preserve the aspect ratio,
-# resulting in potential letterboxing in the transformed image.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE_GPU:throttled_input_video"
-  output_stream: "IMAGE_GPU:transformed_input_video"
-  output_stream: "LETTERBOX_PADDING:letterbox_padding"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 128
-      output_height: 128
-      scale_mode: FIT
-    }
-  }
-}
-
-# Converts the transformed input image on GPU into an image tensor stored as a
-# TfLiteTensor.
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE_GPU:transformed_input_video"
-  output_stream: "TENSORS_GPU:image_tensor"
-}
-
-# Runs a TensorFlow Lite model on GPU that takes an image tensor and outputs a
-# vector of tensors representing, for instance, detection boxes/keypoints and
-# scores.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS_GPU:image_tensor"
-  output_stream: "TENSORS:detection_tensors"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "face_detection_front.tflite"
-    }
-  }
-}
-
-# Generates a single side packet containing a vector of SSD anchors based on
-# the specification in the options.
-node {
-  calculator: "SsdAnchorsCalculator"
-  output_side_packet: "anchors"
-  node_options: {
-    [type.googleapis.com/mediapipe.SsdAnchorsCalculatorOptions] {
-      num_layers: 4
-      min_scale: 0.1484375
-      max_scale: 0.75
-      input_size_height: 128
-      input_size_width: 128
-      anchor_offset_x: 0.5
-      anchor_offset_y: 0.5
-      strides: 8
-      strides: 16
-      strides: 16
-      strides: 16
-      aspect_ratios: 1.0
-      fixed_anchor_size: true
-    }
-  }
-}
-
-# Decodes the detection tensors generated by the TensorFlow Lite model, based on
-# the SSD anchors and the specification in the options, into a vector of
-# detections. Each detection describes a detected object.
-node {
-  calculator: "TfLiteTensorsToDetectionsCalculator"
-  input_stream: "TENSORS:detection_tensors"
-  input_side_packet: "ANCHORS:anchors"
-  output_stream: "DETECTIONS:detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToDetectionsCalculatorOptions] {
-      num_classes: 1
-      num_boxes: 896
-      num_coords: 16
-      box_coord_offset: 0
-      keypoint_coord_offset: 4
-      num_keypoints: 6
-      num_values_per_keypoint: 2
-      sigmoid_score: true
-      score_clipping_thresh: 100.0
-      reverse_output_order: true
-      x_scale: 128.0
-      y_scale: 128.0
-      h_scale: 128.0
-      w_scale: 128.0
-      min_score_thresh: 0.75
-    }
-  }
-}
-
-# Performs non-max suppression to remove excessive detections.
-node {
-  calculator: "NonMaxSuppressionCalculator"
-  input_stream: "detections"
-  output_stream: "filtered_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.NonMaxSuppressionCalculatorOptions] {
-      min_suppression_threshold: 0.3
-      overlap_type: INTERSECTION_OVER_UNION
-      algorithm: WEIGHTED
-      return_empty_detections: true
-    }
-  }
-}
-
-# Maps detection label IDs to the corresponding label text ("Face"). The label
-# map is provided in the label_map_path option.
-node {
-  calculator: "DetectionLabelIdToTextCalculator"
-  input_stream: "filtered_detections"
-  output_stream: "labeled_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionLabelIdToTextCalculatorOptions] {
-      label_map_path: "face_detection_front_labelmap.txt"
-    }
-  }
-}
-
-# Adjusts detection locations (already normalized to [0.f, 1.f]) on the
-# letterboxed image (after image transformation with the FIT scale mode) to the
-# corresponding locations on the same image with the letterbox removed (the
-# input image to the graph before image transformation).
-node {
-  calculator: "DetectionLetterboxRemovalCalculator"
-  input_stream: "DETECTIONS:labeled_detections"
-  input_stream: "LETTERBOX_PADDING:letterbox_padding"
-  output_stream: "DETECTIONS:output_detections"
-}
-
-# Converts the detections to drawing primitives for annotation overlay.
-node {
-  calculator: "DetectionsToRenderDataCalculator"
-  input_stream: "DETECTIONS:output_detections"
-  output_stream: "RENDER_DATA:render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRenderDataCalculatorOptions] {
-      thickness: 10.0
-      color { r: 255 g: 0 b: 0 }
-    }
-  }
-}
-
-# Draws annotations and overlays them on top of the input images.
-node {
-  calculator: "AnnotationOverlayCalculator"
-  input_stream: "IMAGE_GPU:throttled_input_video"
-  input_stream: "render_data"
-  output_stream: "IMAGE_GPU:output_video"
-}
-```
+Content moved to
+[MediaPipe Face Detection](https://google.github.io/mediapipe/solutions/face_detection)
diff --git a/mediapipe/docs/face_mesh_desktop.md b/mediapipe/docs/face_mesh_desktop.md
deleted file mode 100644
index a2e9bbb34..000000000
--- a/mediapipe/docs/face_mesh_desktop.md
+++ /dev/null
@@ -1,55 +0,0 @@
-## Face Mesh on Desktop with Webcam
-
-This doc focuses on running the **MediaPipe Face Mesh** pipeline to perform 3D
-face landmark estimation in real-time on desktop with webcam input. The pipeline
-internally incorporates TensorFlow Lite models. To know more about the models,
-please refer to the model
-[README file](https://github.com/google/mediapipe/tree/master/mediapipe/models/README.md#face-mesh).
-Moreover, if you are interested in running the same pipeline on Android/iOS,
-please see [Face Mesh on Android/iOS](face_mesh_mobile_gpu.md).
-
--   [Face Mesh on Desktop with Webcam (CPU)](#face-mesh-on-desktop-with-webcam-cpu)
-
--   [Face Mesh on Desktop with Webcam (GPU)](#face-mesh-on-desktop-with-webcam-gpu)
-
-Note: If MediaPipe depends on OpenCV 2, please see the [known issues with OpenCV 2](#known-issues-with-opencv-2) section.
-
-### Face Mesh on Desktop with Webcam (CPU)
-
-To build and run Face Mesh on desktop with webcam (CPU), run:
-
-```bash
-$ bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 \
-    mediapipe/examples/desktop/face_mesh:face_mesh_cpu
-
-# It should print:
-# Target //mediapipe/examples/desktop/face_mesh:face_mesh_cpu up-to-date:
-#  bazel-bin/mediapipe/examples/desktop/face_mesh/face_mesh_cpu
-
-# This will open up your webcam as long as it is connected. Errors are likely
-# due to your webcam being not accessible.
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/face_mesh/face_mesh_cpu \
-    --calculator_graph_config_file=mediapipe/graphs/face_mesh/face_mesh_desktop_live.pbtxt
-```
-
-### Face Mesh on Desktop with Webcam (GPU)
-
-Note: This currently works only on Linux, and please first follow
-[OpenGL ES Setup on Linux Desktop](./gpu.md#opengl-es-setup-on-linux-desktop).
-
-To build and run Face Mesh on desktop with webcam (GPU), run:
-
-```bash
-# This works only for Linux currently
-$ bazel build -c opt --copt -DMESA_EGL_NO_X11_HEADERS --copt -DEGL_NO_X11 \
-    mediapipe/examples/desktop/face_mesh:face_mesh_gpu
-
-# It should print:
-# Target //mediapipe/examples/desktop/face_mesh:face_mesh_gpu up-to-date:
-#  bazel-bin/mediapipe/examples/desktop/face_mesh/face_mesh_gpu
-
-# This will open up your webcam as long as it is connected. Errors are likely
-# due to your webcam being not accessible, or GPU drivers not setup properly.
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/face_mesh/face_mesh_gpu \
-    --calculator_graph_config_file=mediapipe/graphs/face_mesh/face_mesh_desktop_live_gpu.pbtxt
-```
diff --git a/mediapipe/docs/face_mesh_mobile_gpu.md b/mediapipe/docs/face_mesh_mobile_gpu.md
deleted file mode 100644
index d594a26e4..000000000
--- a/mediapipe/docs/face_mesh_mobile_gpu.md
+++ /dev/null
@@ -1,90 +0,0 @@
-# Face Mesh (GPU)
-
-This example focuses on running the **MediaPipe Face Mesh** pipeline on mobile
-devices to perform 3D face landmark estimation in real-time, utilizing GPU
-acceleration. The pipeline internally incorporates TensorFlow Lite models. To
-know more about the models, please refer to the model
-[README file](https://github.com/google/mediapipe/tree/master/mediapipe/models/README.md#face-mesh).
-The pipeline is related to the
-[face detection example](./face_detection_mobile_gpu.md) as it internally
-utilizes face detection and performs landmark estimation only within the
-detected region.
-
-![face_mesh_android_gpu.gif](images/mobile/face_mesh_android_gpu.gif)
-
-**MediaPipe Face Mesh** generates 468 3D face landmarks in real-time on mobile
-devices. In the visualization above, the red dots represent the landmarks, and
-the green lines connecting landmarks illustrate the contours around the eyes,
-eyebrows, lips and the entire face.
-
-## Android
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facemeshgpu)
-
-A prebuilt arm64 APK can be
-[downloaded here](https://drive.google.com/open?id=1pUmd7CXCL_onYMbsZo5p91cH0oNnR4gi).
-
-To build the app yourself, run:
-
-```bash
-bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/facemeshgpu
-```
-
-Once the app is built, install it on Android device with:
-
-```bash
-adb install bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facemeshgpu/facemeshgpu.apk
-```
-
-## iOS
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/facemeshgpu).
-
-See the general [instructions](./building_examples.md#ios) for building iOS
-examples and generating an Xcode project. This will be the FaceMeshGpuApp
-target.
-
-To build on the command line:
-
-```bash
-bazel build -c opt --config=ios_arm64 mediapipe/examples/ios/facemeshgpu:FaceMeshGpuApp
-```
-
-## Graph
-
-The face mesh [main graph](#main-graph) utilizes a
-[face landmark subgraph](#face-landmark-subgraph) from the
-[face landmark module](https://github.com/google/mediapipe/tree/master/mediapipe/modules/face_landmark),
-and renders using a dedicated [face renderer subgraph](#face-renderer-subgraph).
-
-The subgraphs show up in the main graph visualization as nodes colored in
-purple, and the subgraph itself can also be visualized just like a regular
-graph. For more information on how to visualize a graph that includes subgraphs,
-see the Visualizing Subgraphs section in the
-[visualizer documentation](./visualizer.md).
-
-### Main Graph
-
-![face_mesh_mobile_graph](images/mobile/face_mesh_mobile.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_mesh/face_mesh_mobile.pbtxt)
-
-### Face Landmark Subgraph
-
-The
-[face landmark module](https://github.com/google/mediapipe/tree/master/mediapipe/modules/face_landmark)
-contains several subgraphs that can be used to detect and track face landmarks.
-In particular, in this example the
-[FaceLandmarkFrontGPU](https://github.com/google/mediapipe/tree/master/mediapipe/modules/face_landmark/face_landmark_front_gpu.pbtxt)
-subgraph, suitable for images from front-facing cameras (i.e., selfie images)
-and utilizing GPU acceleration, is selected.
-
-![face_landmark_front_gpu_subgraph](images/mobile/face_landmark_front_gpu_subgraph.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/modules/face_landmark/face_landmark_front_gpu.pbtxt)
-
-### Face Renderer Subgraph
-
-![face_renderer_gpu_subgraph](images/mobile/face_renderer_gpu_subgraph.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/face_mesh/subgraphs/face_renderer_gpu.pbtxt)
diff --git a/mediapipe/docs/framework_concepts.md b/mediapipe/docs/framework_concepts.md
deleted file mode 100644
index 6279b1685..000000000
--- a/mediapipe/docs/framework_concepts.md
+++ /dev/null
@@ -1,334 +0,0 @@
-## Framework Concepts
-
-- [CalculatorBase](#calculatorbase)
-- [Life of a Calculator](#life-of-a-calculator)
-- [Identifying inputs and outputs](#identifying-inputs-and-outputs)
-- [Processing](#processing)
-- [GraphConfig](#graphconfig)
-- [Subgraph](#subgraph)
-
-Each calculator is a node of a graph. We describe how to create a new
-calculator, how to initialize a calculator, how to perform its calculations,
-input and output streams, timestamps, and options. Each node in the graph is
-implemented as a `Calculator`. The bulk of graph execution happens inside its
-calculators. A calculator may receive zero or more input streams and/or side
-packets and produces zero or more output streams and/or side packets.
-
-### CalculatorBase
-
-A calculator is created by defining a new sub-class of the
-[`CalculatorBase`](https://github.com/google/mediapipe/tree/master/mediapipe/framework/calculator_base.cc)
-class, implementing a number of methods, and registering the new sub-class with
-Mediapipe. At a minimum, a new calculator must implement the below four methods
-
-* `GetContract()`
-  * Calculator authors can specify the expected types of inputs and outputs of a calculator in GetContract(). When a graph is initialized, the framework calls a static method to verify if the packet types of the connected inputs and outputs match the information in this specification.
-* `Open()`
-  * After a graph starts, the framework calls `Open()`. The input side packets are available to the calculator at this point. `Open()` interprets the node configuration operations (see Section [GraphConfig](#graphconfig)) and prepares the calculator's per-graph-run state. This function may also write packets to calculator outputs. An error during `Open()` can terminate the graph run.
-* `Process()`
-  * For a calculator with inputs, the framework calls `Process()` repeatedly whenever at least one input stream has a packet available. The framework by default guarantees that all inputs have the same timestamp (see [Framework Architecture](scheduling_sync.md) for more information). Multiple `Process()` calls can be invoked simultaneously when parallel execution is enabled. If an error occurs during `Process()`, the framework calls `Close()` and the graph run terminates.
-* `Close()`
-  * After all calls to `Process()` finish or when all input streams close, the framework calls `Close()`. This function is always called if `Open()` was called and succeeded and even if the graph run terminated because of an error. No inputs are available via any input streams during `Close()`, but it still has access to input side packets and therefore may write outputs. After `Close()` returns, the calculator should be considered a dead node. The calculator object is destroyed as soon as the graph finishes running.
-
-The following are code snippets from
-[CalculatorBase.h](https://github.com/google/mediapipe/tree/master/mediapipe/framework/calculator_base.h).
-
-```c++
-class CalculatorBase {
- public:
-  ...
-
-  // The subclasses of CalculatorBase must implement GetContract.
-  // ...
-  static ::MediaPipe::Status GetContract(CalculatorContract* cc);
-
-  // Open is called before any Process() calls, on a freshly constructed
-  // calculator.  Subclasses may override this method to perform necessary
-  // setup, and possibly output Packets and/or set output streams' headers.
-  // ...
-  virtual ::MediaPipe::Status Open(CalculatorContext* cc) {
-    return ::MediaPipe::OkStatus();
-  }
-
-  // Processes the incoming inputs. May call the methods on cc to access
-  // inputs and produce outputs.
-  // ...
-  virtual ::MediaPipe::Status Process(CalculatorContext* cc) = 0;
-
-  // Is called if Open() was called and succeeded.  Is called either
-  // immediately after processing is complete or after a graph run has ended
-  // (if an error occurred in the graph).  ...
-  virtual ::MediaPipe::Status Close(CalculatorContext* cc) {
-    return ::MediaPipe::OkStatus();
-  }
-
-  ...
-};
-```
-### Life of a calculator
-
-During initialization of a MediaPipe graph, the framework calls a
-`GetContract()` static method to determine what kinds of packets are expected.
-
-The framework constructs and destroys the entire calculator for each graph run (e.g. once per video or once per image). Expensive or large objects that remain constant across graph runs should be supplied as input side packets so the calculations are not repeated on subsequent runs.
-
-After initialization, for each run of the graph, the following sequence occurs:
-
-* `Open()`
-* `Process()` (repeatedly)
-* `Close()`
-
-The framework calls `Open()` to initialize the calculator. `Open()` should interpret any options and set up the calculator's per-graph-run state. `Open()` may obtain input side packets and write packets to calculator outputs. If appropriate, it should call `SetOffset()` to reduce potential packet buffering of input streams.
-
-If an error occurs during `Open()` or `Process()` (as indicated by one of them returning a non-`Ok ` status), the graph run is terminated with no further calls to the calculator's methods, and the calculator is destroyed.
-
-For a calculator with inputs, the framework calls `Process()` whenever at least one input has a packet available. The framework guarantees that inputs all have the same timestamp, that timestamps increase with each call to `Process()` and that all packets are delivered. As a consequence, some inputs may not have any packets when `Process()` is called. An input whose packet is missing appears to produce an empty packet (with no timestamp).
-
-The framework calls `Close()` after all calls to `Process()`. All inputs will have been exhausted, but `Close()` has access to input side packets and may write outputs. After Close returns, the calculator is destroyed.
-
-Calculators with no inputs are referred to as sources. A source calculator continues to have `Process()` called as long as it returns an `Ok` status. A source calculator indicates that it is exhausted by returning a stop status (i.e. MediaPipe::tool::StatusStop).
-
-### Identifying inputs and outputs
-
-The public interface to a calculator consists of a set of input streams and
-output streams. In a CalculatorGraphConfiguration, the outputs from some
-calculators are connected to the inputs of other calculators using named
-streams. Stream names are normally lowercase, while input and output tags are
-normally UPPERCASE. In the example below, the output with tag name `VIDEO` is
-connected to the input with tag name `VIDEO_IN` using the stream named
-`video_stream`.
-
-```proto
-# Graph describing calculator SomeAudioVideoCalculator
-node {
-  calculator: "SomeAudioVideoCalculator"
-  input_stream: "INPUT:combined_input"
-  output_stream: "VIDEO:video_stream"
-}
-node {
-  calculator: "SomeVideoCalculator"
-  input_stream: "VIDEO_IN:video_stream"
-  output_stream: "VIDEO_OUT:processed_video"
-}
-```
-
-Input and output streams can be identified by index number, by tag name, or by a
-combination of tag name and index number. You can see some examples of input and
-output identifiers in the example below. `SomeAudioVideoCalculator` identifies
-its video output by tag and its audio outputs by the combination of tag and
-index. The input with tag `VIDEO` is connected to the stream named
-`video_stream`. The outputs with tag `AUDIO` and indices `0` and `1` are
-connected to the streams named `audio_left` and `audio_right`.
-`SomeAudioCalculator` identifies its audio inputs by index only (no tag needed).
-
-```proto
-# Graph describing calculator SomeAudioVideoCalculator
-node {
-  calculator: "SomeAudioVideoCalculator"
-  input_stream: "combined_input"
-  output_stream: "VIDEO:video_stream"
-  output_stream: "AUDIO:0:audio_left"
-  output_stream: "AUDIO:1:audio_right"
-}
-
-node {
-  calculator: "SomeAudioCalculator"
-  input_stream: "audio_left"
-  input_stream: "audio_right"
-  output_stream: "audio_energy"
-}
-```
-
-In the calculator implementation, inputs and outputs are also identified by tag
-name and index number.  In the function below input are output are identified:
-
-*   By index number: The combined input stream is identified simply by index
-    `0`.
-*   By tag name: The video output stream is identified by tag name "VIDEO".
-*   By tag name and index number: The output audio streams are identified by the
-    combination of the tag name `AUDIO` and the index numbers `0` and `1`.
-
-```c++
-// c++ Code snippet describing the SomeAudioVideoCalculator GetContract() method
-class SomeAudioVideoCalculator : public CalculatorBase {
- public:
-  static ::mediapipe::Status GetContract(CalculatorContract* cc) {
-    cc->Inputs().Index(0).SetAny();
-    // SetAny() is used to specify that whatever the type of the
-    // stream is, it's acceptable.  This does not mean that any
-    // packet is acceptable.  Packets in the stream still have a
-    // particular type.  SetAny() has the same effect as explicitly
-    // setting the type to be the stream's type.
-    cc->Outputs().Tag("VIDEO").Set<ImageFrame>();
-    cc->Outputs().Get("AUDIO", 0).Set<Matrix>;
-    cc->Outputs().Get("AUDIO", 1).Set<Matrix>;
-    return ::mediapipe::OkStatus();
-  }
-```
-
-### Processing
-
-`Process()` called on a non-source node must return `::mediapipe::OkStatus()` to
-indicate that all went well, or any other status code to signal an error
-
-If a non-source calculator returns `tool::StatusStop()`, then this signals the
-graph is being cancelled early. In this case, all source calculators and graph
-input streams will be closed (and remaining Packets will propagate through the
-graph).
-
-A source node in a graph will continue to have `Process()` called on it as long
-as it returns `::mediapipe::OkStatus(`). To indicate that there is no more data
-to be generated return `tool::StatusStop()`. Any other status indicates an error
-has occurred.
-
-`Close()` returns `::mediapipe::OkStatus()` to indicate success. Any other
-status indicates a failure.
-
-Here is the basic `Process()` function. It uses the `Input()` method (which can
-be used only if the calculator has a single input) to request its input data. It
-then uses `std::unique_ptr` to allocate the memory needed for the output packet,
-and does the calculations. When done it releases the pointer when adding it to
-the output stream.
-
-```c++
-::util::Status MyCalculator::Process() {
-  const Matrix& input = Input()->Get<Matrix>();
-  std::unique_ptr<Matrix> output(new Matrix(input.rows(), input.cols()));
-  // do your magic here....
-  //    output->row(n) =  ...
-  Output()->Add(output.release(), InputTimestamp());
-  return ::mediapipe::OkStatus();
-}
-```
-
-### GraphConfig
-
-A `GraphConfig` is a specification that describes the topology and functionality
-of a MediaPipe graph. In the specification, a node in the graph represents an
-instance of a particular calculator. All the necessary configurations of the
-node, such its type, inputs and outputs must be described in the specification.
-Description of the node can also include several optional fields, such as
-node-specific options, input policy and executor, discussed in
-[Framework Architecture](scheduling_sync.md).
-
-`GraphConfig` has several other fields to configure the global graph-level
-settings, eg, graph executor configs, number of threads, and maximum queue size
-of input streams. Several graph-level settings are useful for tuning the
-performance of the graph on different platforms (eg, desktop v.s. mobile). For
-instance, on mobile, attaching a heavy model-inference calculator to a separate
-executor can improve the performance of a real-time application since this
-enables thread locality.
-
-Below is a trivial `GraphConfig` example where we have series of passthrough
-calculators :
-
-```proto
-# This graph named main_pass_throughcals_nosubgraph.pbtxt contains 4
-# passthrough calculators.
-input_stream: "in"
-node {
-    calculator: "PassThroughCalculator"
-    input_stream: "in"
-    output_stream: "out1"
-}
-node {
-    calculator: "PassThroughCalculator"
-    input_stream: "out1"
-    output_stream: "out2"
-}
-node {
-    calculator: "PassThroughCalculator"
-    input_stream: "out2"
-    output_stream: "out3"
-}
-node {
-    calculator: "PassThroughCalculator"
-    input_stream: "out3"
-    output_stream: "out4"
-}
-```
-
-### Subgraph
-
-To modularize a `CalculatorGraphConfig` into sub-modules and assist with re-use
-of perception solutions, a MediaPipe graph can be defined as a `Subgraph`. The
-public interface of a subgraph consists of a set of input and output streams
-similar to a calculator's public interface. The subgraph can then be
-included in an `CalculatorGraphConfig` as if it were a calculator. When a
-MediaPipe graph is loaded from a `CalculatorGraphConfig`, each subgraph node is
-replaced by the corresponding graph of calculators. As a result, the semantics
-and performance of the subgraph is identical to the corresponding graph of
-calculators.
-
-Below is an example of how to create a subgraph named `TwoPassThroughSubgraph`.
-
-1.  Defining the subgraph.
-
-    ```proto
-    # This subgraph is defined in two_pass_through_subgraph.pbtxt
-    # and is registered as "TwoPassThroughSubgraph"
-
-    type: "TwoPassThroughSubgraph"
-    input_stream: "out1"
-    output_stream: "out3"
-
-    node {
-        calculator: "PassThroughculator"
-        input_stream: "out1"
-        output_stream: "out2"
-    }
-    node {
-        calculator: "PassThroughculator"
-        input_stream: "out2"
-        output_stream: "out3"
-    }
-    ```
-
-    The public interface to the subgraph consists of:
-
-    *   Graph input streams
-    *   Graph output streams
-    *   Graph input side packets
-    *   Graph output side packets
-
-2.  Register the subgraph using BUILD rule `mediapipe_simple_subgraph`. The
-    parameter `register_as` defines the component name for the new subgraph.
-
-    ```proto
-    # Small section of BUILD file for registering the "TwoPassThroughSubgraph"
-    # subgraph for use by main graph main_pass_throughcals.pbtxt
-
-    mediapipe_simple_subgraph(
-        name = "twopassthrough_subgraph",
-        graph = "twopassthrough_subgraph.pbtxt",
-        register_as = "TwoPassThroughSubgraph",
-        deps = [
-                "//mediapipe/calculators/core:pass_through_calculator",
-                "//mediapipe/framework:calculator_graph",
-        ],
-    )
-    ```
-
-3.  Use the subgraph in the main graph.
-
-    ```proto
-    # This main graph is defined in main_pass_throughcals.pbtxt
-    # using subgraph called "TwoPassThroughSubgraph"
-
-    input_stream: "in"
-    node {
-        calculator: "PassThroughCalculator"
-        input_stream: "in"
-        output_stream: "out1"
-    }
-    node {
-        calculator: "TwoPassThroughSubgraph"
-        input_stream: "out1"
-        output_stream: "out3"
-    }
-    node {
-        calculator: "PassThroughCalculator"
-        input_stream: "out3"
-        output_stream: "out4"
-    }
-    ```
diff --git a/mediapipe/docs/hair_segmentation_desktop.md b/mediapipe/docs/hair_segmentation_desktop.md
deleted file mode 100644
index 607ce9725..000000000
--- a/mediapipe/docs/hair_segmentation_desktop.md
+++ /dev/null
@@ -1,207 +0,0 @@
-## Hair Segmentation on Desktop
-
-This is an example of using MediaPipe to run hair segmentation models
-(TensorFlow Lite) and render a color to the detected hair. To know more about
-the hair segmentation models, please refer to the model [`README file`].
-Moreover, if you are interested in running the same TensorfFlow Lite model on
-Android/iOS, please see the
-[Hair Segmentation on GPU on Android/iOS](hair_segmentation_mobile_gpu.md) and
-
-We show the hair segmentation demos with TensorFlow Lite model using the Webcam:
-
--   [TensorFlow Lite Hair Segmentation Demo with Webcam (GPU)](#tensorflow-lite-hair-segmentation-demo-with-webcam-gpu)
-
-Note: If MediaPipe depends on OpenCV 2, please see the
-[known issues with OpenCV 2](./object_detection_desktop.md#known-issues-with-opencv-2)
-section.
-
-### TensorFlow Lite Hair Segmentation Demo with Webcam (GPU)
-
-Note: This currently works only on Linux, and please first follow
-[OpenGL ES Setup on Linux Desktop](./gpu.md#opengl-es-setup-on-linux-desktop).
-
-To build and run the TensorFlow Lite example on desktop (GPU) with Webcam, run:
-
-```bash
-# Video from webcam running on desktop GPU
-# This works only for Linux currently
-$ bazel build -c opt --copt -DMESA_EGL_NO_X11_HEADERS --copt -DEGL_NO_X11 \
-    mediapipe/examples/desktop/hair_segmentation:hair_segmentation_gpu
-
-# It should print:
-#INFO: Found 1 target...
-#Target //mediapipe/examples/desktop/hair_segmentation:hair_segmentation_gpu up-to-date:
-#  bazel-bin/mediapipe/examples/desktop/hair_segmentation/hair_segmentation_gpu
-#INFO: Build completed successfully, 12210 total actions
-
-# This will open up your webcam as long as it is connected and on
-# Any errors is likely due to your webcam being not accessible,
-# or GPU drivers not setup properly.
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/hair_segmentation/hair_segmentation_gpu \
-    --calculator_graph_config_file=mediapipe/graphs/hair_segmentation/hair_segmentation_mobile_gpu.pbtxt
-```
-
-#### Graph
-
-![hair_segmentation_mobile_gpu_graph](images/mobile/hair_segmentation_mobile_gpu.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into
-[MediaPipe Visualizer](https://viz.mediapipe.dev).
-
-```bash
-# MediaPipe graph that performs hair segmentation with TensorFlow Lite on GPU.
-# Used in the example in
-# mediapipe/examples/android/src/java/com/mediapipe/apps/hairsegmentationgpu.
-
-# Images on GPU coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Throttles the images flowing downstream for flow control. It passes through
-# the very first incoming image unaltered, and waits for
-# TfLiteTensorsToSegmentationCalculator downstream in the graph to finish
-# generating the corresponding hair mask before it passes through another
-# image. All images that come in while waiting are dropped, limiting the number
-# of in-flight images between this calculator and
-# TfLiteTensorsToSegmentationCalculator to 1. This prevents the nodes in between
-# from queuing up incoming images and data excessively, which leads to increased
-# latency and memory usage, unwanted in real-time mobile applications. It also
-# eliminates unnecessarily computation, e.g., a transformed image produced by
-# ImageTransformationCalculator may get dropped downstream if the subsequent
-# TfLiteConverterCalculator or TfLiteInferenceCalculator is still busy
-# processing previous inputs.
-node {
-  calculator: "FlowLimiterCalculator"
-  input_stream: "input_video"
-  input_stream: "FINISHED:hair_mask"
-  input_stream_info: {
-    tag_index: "FINISHED"
-    back_edge: true
-  }
-  output_stream: "throttled_input_video"
-}
-
-# Transforms the input image on GPU to a 512x512 image. To scale the image, by
-# default it uses the STRETCH scale mode that maps the entire input image to the
-# entire transformed image. As a result, image aspect ratio may be changed and
-# objects in the image may be deformed (stretched or squeezed), but the hair
-# segmentation model used in this graph is agnostic to that deformation.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE_GPU:throttled_input_video"
-  output_stream: "IMAGE_GPU:transformed_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 512
-      output_height: 512
-    }
-  }
-}
-
-# Caches a mask fed back from the previous round of hair segmentation, and upon
-# the arrival of the next input image sends out the cached mask with the
-# timestamp replaced by that of the input image, essentially generating a packet
-# that carries the previous mask. Note that upon the arrival of the very first
-# input image, an empty packet is sent out to jump start the feedback loop.
-node {
-  calculator: "PreviousLoopbackCalculator"
-  input_stream: "MAIN:throttled_input_video"
-  input_stream: "LOOP:hair_mask"
-  input_stream_info: {
-    tag_index: "LOOP"
-    back_edge: true
-  }
-  output_stream: "PREV_LOOP:previous_hair_mask"
-}
-
-# Embeds the hair mask generated from the previous round of hair segmentation
-# as the alpha channel of the current input image.
-node {
-  calculator: "SetAlphaCalculator"
-  input_stream: "IMAGE_GPU:transformed_input_video"
-  input_stream: "ALPHA_GPU:previous_hair_mask"
-  output_stream: "IMAGE_GPU:mask_embedded_input_video"
-}
-
-# Converts the transformed input image on GPU into an image tensor stored in
-# tflite::gpu::GlBuffer. The zero_center option is set to false to normalize the
-# pixel values to [0.f, 1.f] as opposed to [-1.f, 1.f]. With the
-# max_num_channels option set to 4, all 4 RGBA channels are contained in the
-# image tensor.
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE_GPU:mask_embedded_input_video"
-  output_stream: "TENSORS_GPU:image_tensor"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteConverterCalculatorOptions] {
-      zero_center: false
-      max_num_channels: 4
-    }
-  }
-}
-
-# Generates a single side packet containing a TensorFlow Lite op resolver that
-# supports custom ops needed by the model used in this graph.
-node {
-  calculator: "TfLiteCustomOpResolverCalculator"
-  output_side_packet: "op_resolver"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteCustomOpResolverCalculatorOptions] {
-      use_gpu: true
-    }
-  }
-}
-
-# Runs a TensorFlow Lite model on GPU that takes an image tensor and outputs a
-# tensor representing the hair segmentation, which has the same width and height
-# as the input image tensor.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS_GPU:image_tensor"
-  output_stream: "TENSORS_GPU:segmentation_tensor"
-  input_side_packet: "CUSTOM_OP_RESOLVER:op_resolver"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "mediapipe/models/hair_segmentation.tflite"
-      use_gpu: true
-    }
-  }
-}
-
-# Decodes the segmentation tensor generated by the TensorFlow Lite model into a
-# mask of values in [0.f, 1.f], stored in the R channel of a GPU buffer. It also
-# takes the mask generated previously as another input to improve the temporal
-# consistency.
-node {
-  calculator: "TfLiteTensorsToSegmentationCalculator"
-  input_stream: "TENSORS_GPU:segmentation_tensor"
-  input_stream: "PREV_MASK_GPU:previous_hair_mask"
-  output_stream: "MASK_GPU:hair_mask"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToSegmentationCalculatorOptions] {
-      tensor_width: 512
-      tensor_height: 512
-      tensor_channels: 2
-      combine_with_previous_ratio: 0.9
-      output_layer_index: 1
-    }
-  }
-}
-
-# Colors the hair segmentation with the color specified in the option.
-node {
-  calculator: "RecolorCalculator"
-  input_stream: "IMAGE_GPU:throttled_input_video"
-  input_stream: "MASK_GPU:hair_mask"
-  output_stream: "IMAGE_GPU:output_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.RecolorCalculatorOptions] {
-      color { r: 0 g: 0 b: 255 }
-      mask_channel: RED
-    }
-  }
-}
-```
-
-[`README file`]:https://github.com/google/mediapipe/tree/master/mediapipe/README.md
diff --git a/mediapipe/docs/hair_segmentation_mobile_gpu.md b/mediapipe/docs/hair_segmentation_mobile_gpu.md
index 602a27847..945e84071 100644
--- a/mediapipe/docs/hair_segmentation_mobile_gpu.md
+++ b/mediapipe/docs/hair_segmentation_mobile_gpu.md
@@ -1,182 +1,2 @@
-# Hair Segmentation (GPU)
-
-This doc focuses on the
-[example graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hair_segmentation/hair_segmentation_mobile_gpu.pbtxt)
-that performs hair segmentation with TensorFlow Lite on GPU.
-
-![hair_segmentation_android_gpu_gif](images/mobile/hair_segmentation_android_gpu.gif)
-
-## Android
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/hairsegmentationgpu)
-
-To build and install the app:
-
-```bash
-bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/hairsegmentationgpu
-adb install bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/hairsegmentationgpu/hairsegmentationgpu.apk
-```
-
-## Graph
-
-![hair_segmentation_mobile_gpu_graph](images/mobile/hair_segmentation_mobile_gpu.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into [MediaPipe Visualizer](https://viz.mediapipe.dev/).
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hair_segmentation/hair_segmentation_mobile_gpu.pbtxt)
-
-```bash
-# MediaPipe graph that performs hair segmentation with TensorFlow Lite on GPU.
-# Used in the example in
-# mediapipe/examples/android/src/java/com/mediapipe/apps/hairsegmentationgpu.
-
-# Images on GPU coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Throttles the images flowing downstream for flow control. It passes through
-# the very first incoming image unaltered, and waits for
-# TfLiteTensorsToSegmentationCalculator downstream in the graph to finish
-# generating the corresponding hair mask before it passes through another
-# image. All images that come in while waiting are dropped, limiting the number
-# of in-flight images between this calculator and
-# TfLiteTensorsToSegmentationCalculator to 1. This prevents the nodes in between
-# from queuing up incoming images and data excessively, which leads to increased
-# latency and memory usage, unwanted in real-time mobile applications. It also
-# eliminates unnecessarily computation, e.g., a transformed image produced by
-# ImageTransformationCalculator may get dropped downstream if the subsequent
-# TfLiteConverterCalculator or TfLiteInferenceCalculator is still busy
-# processing previous inputs.
-node {
-  calculator: "FlowLimiterCalculator"
-  input_stream: "input_video"
-  input_stream: "FINISHED:hair_mask"
-  input_stream_info: {
-    tag_index: "FINISHED"
-    back_edge: true
-  }
-  output_stream: "throttled_input_video"
-}
-
-# Transforms the input image on GPU to a 512x512 image. To scale the image, by
-# default it uses the STRETCH scale mode that maps the entire input image to the
-# entire transformed image. As a result, image aspect ratio may be changed and
-# objects in the image may be deformed (stretched or squeezed), but the hair
-# segmentation model used in this graph is agnostic to that deformation.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE_GPU:throttled_input_video"
-  output_stream: "IMAGE_GPU:transformed_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 512
-      output_height: 512
-    }
-  }
-}
-
-# Caches a mask fed back from the previous round of hair segmentation, and upon
-# the arrival of the next input image sends out the cached mask with the
-# timestamp replaced by that of the input image, essentially generating a packet
-# that carries the previous mask. Note that upon the arrival of the very first
-# input image, an empty packet is sent out to jump start the feedback loop.
-node {
-  calculator: "PreviousLoopbackCalculator"
-  input_stream: "MAIN:throttled_input_video"
-  input_stream: "LOOP:hair_mask"
-  input_stream_info: {
-    tag_index: "LOOP"
-    back_edge: true
-  }
-  output_stream: "PREV_LOOP:previous_hair_mask"
-}
-
-# Embeds the hair mask generated from the previous round of hair segmentation
-# as the alpha channel of the current input image.
-node {
-  calculator: "SetAlphaCalculator"
-  input_stream: "IMAGE_GPU:transformed_input_video"
-  input_stream: "ALPHA_GPU:previous_hair_mask"
-  output_stream: "IMAGE_GPU:mask_embedded_input_video"
-}
-
-# Converts the transformed input image on GPU into an image tensor stored in
-# tflite::gpu::GlBuffer. The zero_center option is set to false to normalize the
-# pixel values to [0.f, 1.f] as opposed to [-1.f, 1.f]. With the
-# max_num_channels option set to 4, all 4 RGBA channels are contained in the
-# image tensor.
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE_GPU:mask_embedded_input_video"
-  output_stream: "TENSORS_GPU:image_tensor"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteConverterCalculatorOptions] {
-      zero_center: false
-      max_num_channels: 4
-    }
-  }
-}
-
-# Generates a single side packet containing a TensorFlow Lite op resolver that
-# supports custom ops needed by the model used in this graph.
-node {
-  calculator: "TfLiteCustomOpResolverCalculator"
-  output_side_packet: "op_resolver"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteCustomOpResolverCalculatorOptions] {
-      use_gpu: true
-    }
-  }
-}
-
-# Runs a TensorFlow Lite model on GPU that takes an image tensor and outputs a
-# tensor representing the hair segmentation, which has the same width and height
-# as the input image tensor.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS_GPU:image_tensor"
-  output_stream: "TENSORS_GPU:segmentation_tensor"
-  input_side_packet: "CUSTOM_OP_RESOLVER:op_resolver"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "hair_segmentation.tflite"
-      use_gpu: true
-    }
-  }
-}
-
-# Decodes the segmentation tensor generated by the TensorFlow Lite model into a
-# mask of values in [0.f, 1.f], stored in the R channel of a GPU buffer. It also
-# takes the mask generated previously as another input to improve the temporal
-# consistency.
-node {
-  calculator: "TfLiteTensorsToSegmentationCalculator"
-  input_stream: "TENSORS_GPU:segmentation_tensor"
-  input_stream: "PREV_MASK_GPU:previous_hair_mask"
-  output_stream: "MASK_GPU:hair_mask"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToSegmentationCalculatorOptions] {
-      tensor_width: 512
-      tensor_height: 512
-      tensor_channels: 2
-      combine_with_previous_ratio: 0.9
-      output_layer_index: 1
-    }
-  }
-}
-
-# Colors the hair segmentation with the color specified in the option.
-node {
-  calculator: "RecolorCalculator"
-  input_stream: "IMAGE_GPU:throttled_input_video"
-  input_stream: "MASK_GPU:hair_mask"
-  output_stream: "IMAGE_GPU:output_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.RecolorCalculatorOptions] {
-      color { r: 0 g: 0 b: 255 }
-      mask_channel: RED
-    }
-  }
-}
-```
+Content moved to
+[MediaPipe Hair Segmentation](https://google.github.io/mediapipe/solutions/hair_segmentation)
diff --git a/mediapipe/docs/hand_detection_mobile_gpu.md b/mediapipe/docs/hand_detection_mobile_gpu.md
deleted file mode 100644
index a052de0b3..000000000
--- a/mediapipe/docs/hand_detection_mobile_gpu.md
+++ /dev/null
@@ -1,350 +0,0 @@
-# Hand Detection (GPU)
-
-This doc focuses on the
-[example graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/hand_detection_mobile.pbtxt)
-that performs hand detection with TensorFlow Lite on GPU. It is related to the
-[hand tracking example](./hand_tracking_mobile_gpu.md).
-
-For overall context on hand detection and hand tracking, please read this
-[Google AI Blog post](https://mediapipe.page.link/handgoogleaiblog).
-
-![hand_detection_android_gpu_gif](images/mobile/hand_detection_android_gpu.gif)
-
-In the visualization above, green boxes represent the results of palm detection,
-and the red box represents the extended hand rectangle designed to cover the
-entire hand. The palm detection ML model (see also
-[model card](https://mediapipe.page.link/handmc)) supports detection of multiple
-palms, and this example selects only the one with the highest detection
-confidence score to generate the hand rectangle, to be further utilized in the
-[hand tracking example](./hand_tracking_mobile_gpu.md).
-
-## Android
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handdetectiongpu)
-
-An arm64 APK can be
-[downloaded here](https://drive.google.com/open?id=1qUlTtH7Ydg-wl_H6VVL8vueu2UCTu37E).
-
-To build the app yourself:
-
-```bash
-bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/handdetectiongpu
-```
-
-Once the app is built, install it on Android device with:
-
-```bash
-adb install bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handdetectiongpu/handdetectiongpu.apk
-```
-
-## iOS
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/handdetectiongpu).
-
-See the general [instructions](./building_examples.md#ios) for building iOS
-examples and generating an Xcode project. This will be the HandDetectionGpuApp
-target.
-
-To build on the command line:
-
-```bash
-bazel build -c opt --config=ios_arm64 mediapipe/examples/ios/handdetectiongpu:HandDetectionGpuApp
-```
-
-## Graph
-
-The hand detection [main graph](#main-graph) internally utilizes a
-[hand detection subgraph](#hand-detection-subgraph). The subgraph shows up in
-the main graph visualization as the `HandDetection` node colored in purple, and
-the subgraph itself can also be visualized just like a regular graph. For more
-information on how to visualize a graph that includes subgraphs, see the
-Visualizing Subgraphs section in the
-[visualizer documentation](./visualizer.md).
-
-### Main Graph
-
-![hand_detection_mobile_graph](images/mobile/hand_detection_mobile.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/hand_detection_mobile.pbtxt)
-
-```bash
-# MediaPipe graph that performs hand detection with TensorFlow Lite on GPU.
-# Used in the examples in
-# mediapipie/examples/android/src/java/com/mediapipe/apps/handdetectiongpu and
-# mediapipie/examples/ios/handdetectiongpu.
-
-# Images coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Throttles the images flowing downstream for flow control. It passes through
-# the very first incoming image unaltered, and waits for HandDetectionSubgraph
-# downstream in the graph to finish its tasks before it passes through another
-# image. All images that come in while waiting are dropped, limiting the number
-# of in-flight images in HandDetectionSubgraph to 1. This prevents the nodes in
-# HandDetectionSubgraph from queuing up incoming images and data excessively,
-# which leads to increased latency and memory usage, unwanted in real-time
-# mobile applications. It also eliminates unnecessarily computation, e.g., the
-# output produced by a node in the subgraph may get dropped downstream if the
-# subsequent nodes are still busy processing previous inputs.
-node {
-  calculator: "FlowLimiterCalculator"
-  input_stream: "input_video"
-  input_stream: "FINISHED:hand_rect_from_palm_detections"
-  input_stream_info: {
-    tag_index: "FINISHED"
-    back_edge: true
-  }
-  output_stream: "throttled_input_video"
-}
-
-# Subgraph that detections hands (see hand_detection_gpu.pbtxt).
-node {
-  calculator: "HandDetectionSubgraph"
-  input_stream: "throttled_input_video"
-  output_stream: "DETECTIONS:palm_detections"
-  output_stream: "NORM_RECT:hand_rect_from_palm_detections"
-}
-
-# Converts detections to drawing primitives for annotation overlay.
-node {
-  calculator: "DetectionsToRenderDataCalculator"
-  input_stream: "DETECTIONS:palm_detections"
-  output_stream: "RENDER_DATA:detection_render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRenderDataCalculatorOptions] {
-      thickness: 4.0
-      color { r: 0 g: 255 b: 0 }
-    }
-  }
-}
-
-# Converts normalized rects to drawing primitives for annotation overlay.
-node {
-  calculator: "RectToRenderDataCalculator"
-  input_stream: "NORM_RECT:hand_rect_from_palm_detections"
-  output_stream: "RENDER_DATA:rect_render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.RectToRenderDataCalculatorOptions] {
-      filled: false
-      color { r: 255 g: 0 b: 0 }
-      thickness: 4.0
-    }
-  }
-}
-
-# Draws annotations and overlays them on top of the input images.
-node {
-  calculator: "AnnotationOverlayCalculator"
-  input_stream: "IMAGE_GPU:throttled_input_video"
-  input_stream: "detection_render_data"
-  input_stream: "rect_render_data"
-  output_stream: "IMAGE_GPU:output_video"
-}
-```
-
-### Hand Detection Subgraph
-
-![hand_detection_gpu_subgraph](images/mobile/hand_detection_gpu_subgraph.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/subgraphs/hand_detection_gpu.pbtxt)
-
-```bash
-# MediaPipe hand detection subgraph.
-
-type: "HandDetectionSubgraph"
-
-input_stream: "input_video"
-output_stream: "DETECTIONS:palm_detections"
-output_stream: "NORM_RECT:hand_rect_from_palm_detections"
-
-# Transforms the input image on GPU to a 256x256 image. To scale the input
-# image, the scale_mode option is set to FIT to preserve the aspect ratio,
-# resulting in potential letterboxing in the transformed image.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE_GPU:input_video"
-  output_stream: "IMAGE_GPU:transformed_input_video"
-  output_stream: "LETTERBOX_PADDING:letterbox_padding"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 256
-      output_height: 256
-      scale_mode: FIT
-    }
-  }
-}
-
-# Generates a single side packet containing a TensorFlow Lite op resolver that
-# supports custom ops needed by the model used in this graph.
-node {
-  calculator: "TfLiteCustomOpResolverCalculator"
-  output_side_packet: "opresolver"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteCustomOpResolverCalculatorOptions] {
-      use_gpu: true
-    }
-  }
-}
-
-# Converts the transformed input image on GPU into an image tensor stored as a
-# TfLiteTensor.
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE_GPU:transformed_input_video"
-  output_stream: "TENSORS_GPU:image_tensor"
-}
-
-# Runs a TensorFlow Lite model on GPU that takes an image tensor and outputs a
-# vector of tensors representing, for instance, detection boxes/keypoints and
-# scores.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS_GPU:image_tensor"
-  output_stream: "TENSORS:detection_tensors"
-  input_side_packet: "CUSTOM_OP_RESOLVER:opresolver"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "palm_detection.tflite"
-      use_gpu: true
-    }
-  }
-}
-
-# Generates a single side packet containing a vector of SSD anchors based on
-# the specification in the options.
-node {
-  calculator: "SsdAnchorsCalculator"
-  output_side_packet: "anchors"
-  node_options: {
-    [type.googleapis.com/mediapipe.SsdAnchorsCalculatorOptions] {
-      num_layers: 5
-      min_scale: 0.1171875
-      max_scale: 0.75
-      input_size_height: 256
-      input_size_width: 256
-      anchor_offset_x: 0.5
-      anchor_offset_y: 0.5
-      strides: 8
-      strides: 16
-      strides: 32
-      strides: 32
-      strides: 32
-      aspect_ratios: 1.0
-      fixed_anchor_size: true
-    }
-  }
-}
-
-# Decodes the detection tensors generated by the TensorFlow Lite model, based on
-# the SSD anchors and the specification in the options, into a vector of
-# detections. Each detection describes a detected object.
-node {
-  calculator: "TfLiteTensorsToDetectionsCalculator"
-  input_stream: "TENSORS:detection_tensors"
-  input_side_packet: "ANCHORS:anchors"
-  output_stream: "DETECTIONS:detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToDetectionsCalculatorOptions] {
-      num_classes: 1
-      num_boxes: 2944
-      num_coords: 18
-      box_coord_offset: 0
-      keypoint_coord_offset: 4
-      num_keypoints: 7
-      num_values_per_keypoint: 2
-      sigmoid_score: true
-      score_clipping_thresh: 100.0
-      reverse_output_order: true
-
-      x_scale: 256.0
-      y_scale: 256.0
-      h_scale: 256.0
-      w_scale: 256.0
-      min_score_thresh: 0.7
-    }
-  }
-}
-
-# Performs non-max suppression to remove excessive detections.
-node {
-  calculator: "NonMaxSuppressionCalculator"
-  input_stream: "detections"
-  output_stream: "filtered_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.NonMaxSuppressionCalculatorOptions] {
-      min_suppression_threshold: 0.3
-      overlap_type: INTERSECTION_OVER_UNION
-      algorithm: WEIGHTED
-      return_empty_detections: true
-    }
-  }
-}
-
-# Maps detection label IDs to the corresponding label text ("Palm"). The label
-# map is provided in the label_map_path option.
-node {
-  calculator: "DetectionLabelIdToTextCalculator"
-  input_stream: "filtered_detections"
-  output_stream: "labeled_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionLabelIdToTextCalculatorOptions] {
-      label_map_path: "palm_detection_labelmap.txt"
-    }
-  }
-}
-
-# Adjusts detection locations (already normalized to [0.f, 1.f]) on the
-# letterboxed image (after image transformation with the FIT scale mode) to the
-# corresponding locations on the same image with the letterbox removed (the
-# input image to the graph before image transformation).
-node {
-  calculator: "DetectionLetterboxRemovalCalculator"
-  input_stream: "DETECTIONS:labeled_detections"
-  input_stream: "LETTERBOX_PADDING:letterbox_padding"
-  output_stream: "DETECTIONS:palm_detections"
-}
-
-# Extracts image size from the input images.
-node {
-  calculator: "ImagePropertiesCalculator"
-  input_stream: "IMAGE_GPU:input_video"
-  output_stream: "SIZE:image_size"
-}
-
-# Converts results of palm detection into a rectangle (normalized by image size)
-# that encloses the palm and is rotated such that the line connecting center of
-# the wrist and MCP of the middle finger is aligned with the Y-axis of the
-# rectangle.
-node {
-  calculator: "DetectionsToRectsCalculator"
-  input_stream: "DETECTIONS:palm_detections"
-  input_stream: "IMAGE_SIZE:image_size"
-  output_stream: "NORM_RECT:palm_rect"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRectsCalculatorOptions] {
-      rotation_vector_start_keypoint_index: 0  # Center of wrist.
-      rotation_vector_end_keypoint_index: 2  # MCP of middle finger.
-      rotation_vector_target_angle_degrees: 90
-      output_zero_rect_for_empty_detections: true
-    }
-  }
-}
-
-# Expands and shifts the rectangle that contains the palm so that it's likely
-# to cover the entire hand.
-node {
-  calculator: "RectTransformationCalculator"
-  input_stream: "NORM_RECT:palm_rect"
-  input_stream: "IMAGE_SIZE:image_size"
-  output_stream: "hand_rect_from_palm_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.RectTransformationCalculatorOptions] {
-      scale_x: 2.6
-      scale_y: 2.6
-      shift_y: -0.5
-      square_long: true
-    }
-  }
-}
-```
diff --git a/mediapipe/docs/hand_tracking_desktop.md b/mediapipe/docs/hand_tracking_desktop.md
index f48008109..7cbd74181 100644
--- a/mediapipe/docs/hand_tracking_desktop.md
+++ b/mediapipe/docs/hand_tracking_desktop.md
@@ -1,181 +1 @@
-## Hand Tracking on Desktop
-
-This is an example of using MediaPipe to run hand tracking models (TensorFlow
-Lite) and render bounding boxes on the detected hand (one hand only). To know
-more about the hand tracking models, please refer to the model [`README file`].
-Moreover, if you are interested in running the same TensorfFlow Lite model on
-Android/iOS, please see the
-[Hand Tracking on GPU on Android/iOS](hand_tracking_mobile_gpu.md) and
-
-We show the hand tracking demos with TensorFlow Lite model using the Webcam:
-
--   [TensorFlow Lite Hand Tracking Demo with Webcam (CPU)](#tensorflow-lite-hand-tracking-demo-with-webcam-cpu)
-
--   [TensorFlow Lite Hand Tracking Demo with Webcam (GPU)](#tensorflow-lite-hand-tracking-demo-with-webcam-gpu)
-
-Note: If MediaPipe depends on OpenCV 2, please see the
-[known issues with OpenCV 2](./object_detection_desktop.md#known-issues-with-opencv-2)
-section.
-
-### TensorFlow Lite Hand Tracking Demo with Webcam (CPU)
-
-To build and run the TensorFlow Lite example on desktop (CPU) with Webcam, run:
-
-```bash
-# Video from webcam running on desktop CPU
-$ bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 \
-    mediapipe/examples/desktop/hand_tracking:hand_tracking_cpu
-
-# It should print:
-#Target //mediapipe/examples/desktop/hand_tracking:hand_tracking_cpu up-to-date:
-#  bazel-bin/mediapipe/examples/desktop/hand_tracking/hand_tracking_cpu
-#INFO: Build completed successfully, 12517 total actions
-
-# This will open up your webcam as long as it is connected and on
-# Any errors is likely due to your webcam being not accessible
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/hand_tracking/hand_tracking_cpu \
-    --calculator_graph_config_file=mediapipe/graphs/hand_tracking/hand_tracking_desktop_live.pbtxt
-```
-
-### TensorFlow Lite Hand Tracking Demo with Webcam (GPU)
-
-Note: This currently works only on Linux, and please first follow
-[OpenGL ES Setup on Linux Desktop](./gpu.md#opengl-es-setup-on-linux-desktop).
-
-To build and run the TensorFlow Lite example on desktop (GPU) with Webcam, run:
-
-```bash
-# Video from webcam running on desktop GPU
-# This works only for Linux currently
-$ bazel build -c opt --copt -DMESA_EGL_NO_X11_HEADERS --copt -DEGL_NO_X11 \
-    mediapipe/examples/desktop/hand_tracking:hand_tracking_gpu
-
-# It should print:
-# Target //mediapipe/examples/desktop/hand_tracking:hand_tracking_gpu up-to-date:
-#  bazel-bin/mediapipe/examples/desktop/hand_tracking/hand_tracking_gpu
-#INFO: Build completed successfully, 22455 total actions
-
-# This will open up your webcam as long as it is connected and on
-# Any errors is likely due to your webcam being not accessible,
-# or GPU drivers not setup properly.
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/hand_tracking/hand_tracking_gpu \
-    --calculator_graph_config_file=mediapipe/graphs/hand_tracking/hand_tracking_mobile.pbtxt
-```
-
-#### Graph
-
-![graph visualization](images/hand_tracking_desktop.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into
-[MediaPipe Visualizer](https://viz.mediapipe.dev).
-
-```bash
-# MediaPipe graph that performs hand tracking on desktop with TensorFlow Lite
-# on CPU & GPU.
-# Used in the example in
-# mediapipe/examples/desktop/hand_tracking:hand_tracking_cpu.
-
-# Images coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Caches a hand-presence decision fed back from HandLandmarkSubgraph, and upon
-# the arrival of the next input image sends out the cached decision with the
-# timestamp replaced by that of the input image, essentially generating a packet
-# that carries the previous hand-presence decision. Note that upon the arrival
-# of the very first input image, an empty packet is sent out to jump start the
-# feedback loop.
-node {
-  calculator: "PreviousLoopbackCalculator"
-  input_stream: "MAIN:input_video"
-  input_stream: "LOOP:hand_presence"
-  input_stream_info: {
-    tag_index: "LOOP"
-    back_edge: true
-  }
-  output_stream: "PREV_LOOP:prev_hand_presence"
-}
-
-# Drops the incoming image if HandLandmarkSubgraph was able to identify hand
-# presence in the previous image. Otherwise, passes the incoming image through
-# to trigger a new round of hand detection in HandDetectionSubgraph.
-node {
-  calculator: "GateCalculator"
-  input_stream: "input_video"
-  input_stream: "DISALLOW:prev_hand_presence"
-  output_stream: "hand_detection_input_video"
-
-  node_options: {
-    [type.googleapis.com/mediapipe.GateCalculatorOptions] {
-      empty_packets_as_allow: true
-    }
-  }
-}
-
-# Subgraph that detections hands (see hand_detection_cpu.pbtxt).
-node {
-  calculator: "HandDetectionSubgraph"
-  input_stream: "hand_detection_input_video"
-  output_stream: "DETECTIONS:palm_detections"
-  output_stream: "NORM_RECT:hand_rect_from_palm_detections"
-}
-
-# Subgraph that localizes hand landmarks (see hand_landmark_cpu.pbtxt).
-node {
-  calculator: "HandLandmarkSubgraph"
-  input_stream: "IMAGE:input_video"
-  input_stream: "NORM_RECT:hand_rect"
-  output_stream: "LANDMARKS:hand_landmarks"
-  output_stream: "NORM_RECT:hand_rect_from_landmarks"
-  output_stream: "PRESENCE:hand_presence"
-  output_stream: "HANDEDNESS:handedness"
-}
-
-# Caches a hand rectangle fed back from HandLandmarkSubgraph, and upon the
-# arrival of the next input image sends out the cached rectangle with the
-# timestamp replaced by that of the input image, essentially generating a packet
-# that carries the previous hand rectangle. Note that upon the arrival of the
-# very first input image, an empty packet is sent out to jump start the
-# feedback loop.
-node {
-  calculator: "PreviousLoopbackCalculator"
-  input_stream: "MAIN:input_video"
-  input_stream: "LOOP:hand_rect_from_landmarks"
-  input_stream_info: {
-    tag_index: "LOOP"
-    back_edge: true
-  }
-  output_stream: "PREV_LOOP:prev_hand_rect_from_landmarks"
-}
-
-# Merges a stream of hand rectangles generated by HandDetectionSubgraph and that
-# generated by HandLandmarkSubgraph into a single output stream by selecting
-# between one of the two streams. The former is selected if the incoming packet
-# is not empty, i.e., hand detection is performed on the current image by
-# HandDetectionSubgraph (because HandLandmarkSubgraph could not identify hand
-# presence in the previous image). Otherwise, the latter is selected, which is
-# never empty because HandLandmarkSubgraphs processes all images (that went
-# through FlowLimiterCaculator).
-node {
-  calculator: "MergeCalculator"
-  input_stream: "hand_rect_from_palm_detections"
-  input_stream: "prev_hand_rect_from_landmarks"
-  output_stream: "hand_rect"
-}
-
-# Subgraph that renders annotations and overlays them on top of the input
-# images (see renderer_cpu.pbtxt).
-node {
-  calculator: "RendererSubgraph"
-  input_stream: "IMAGE:input_video"
-  input_stream: "LANDMARKS:hand_landmarks"
-  input_stream: "NORM_RECT:hand_rect"
-  input_stream: "DETECTIONS:palm_detections"
-  input_stream: "HANDEDNESS:handedness"
-  output_stream: "IMAGE:output_video"
-}
-
-```
-
-[`README file`]:https://github.com/google/mediapipe/tree/master/mediapipe/README.md
+Content moved to [MediaPipe Hand](https://google.github.io/mediapipe/solutions/hand)
diff --git a/mediapipe/docs/hand_tracking_mobile_gpu.md b/mediapipe/docs/hand_tracking_mobile_gpu.md
index b81a77187..7cbd74181 100644
--- a/mediapipe/docs/hand_tracking_mobile_gpu.md
+++ b/mediapipe/docs/hand_tracking_mobile_gpu.md
@@ -1,154 +1 @@
-# MediaPipe Hand
-
-## Overview
-
-The ability to perceive the shape and motion of hands can be a vital component
-in improving the user experience across a variety of technological domains and
-platforms. For example, it can form the basis for sign language understanding
-and hand gesture control, and can also enable the overlay of digital content and
-information on top of the physical world in augmented reality. While coming
-naturally to people, robust real-time hand perception is a decidedly challenging
-computer vision task, as hands often occlude themselves or each other (e.g.
-finger/palm occlusions and hand shakes) and lack high contrast patterns.
-
-MediaPipe Hand is a high-fidelity hand and finger tracking solution. It employs
-machine learning (ML) to infer 21 3D landmarks of a hand from just a single
-frame. Whereas current state-of-the-art approaches rely primarily on powerful
-desktop environments for inference, our method achieves real-time performance on
-a mobile phone, and even scales to multiple hands. We hope that providing this
-hand perception functionality to the wider research and development community
-will result in an emergence of creative use cases, stimulating new applications
-and new research avenues.
-
-![hand_tracking_3d_android_gpu.gif](images/mobile/hand_tracking_3d_android_gpu.gif)
-
-*Fig 1. Tracked 3D hand landmarks are represented by dots in different shades,
-with the brighter ones denoting landmarks closer to the camera.*
-
-## ML Pipeline
-
-MediaPipe Hand utilizes an ML pipeline consisting of multiple models working
-together: A palm detection model that operates on the full image and returns an
-oriented hand bounding box. A hand landmark model that operates on the cropped
-image region defined by the palm detector and returns high-fidelity 3D hand
-keypoints. This architecture is similar to that employed by our recently
-released [MediaPipe Face Mesh](./face_mesh_mobile_gpu.md) solution.
-
-Providing the accurately cropped hand image to the hand landmark model
-drastically reduces the need for data augmentation (e.g. rotations, translation
-and scale) and instead allows the network to dedicate most of its capacity
-towards coordinate prediction accuracy. In addition, in our pipeline the crops
-can also be generated based on the hand landmarks identified in the previous
-frame, and only when the landmark model could no longer identify hand presence
-is palm detection invoked to relocalize the hand.
-
-The pipeline is implemented as a MediaPipe
-[graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/hand_tracking_mobile.pbtxt),
-which internally utilizes a
-[palm/hand detection subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/subgraphs/hand_detection_gpu.pbtxt),
-a
-[hand landmark subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/subgraphs/hand_landmark_gpu.pbtxt)
-and a
-[renderer subgraph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/subgraphs/renderer_gpu.pbtxt).
-For more information on how to visualize a graph and its associated subgraphs,
-please see the [visualizer documentation](./visualizer.md).
-
-## Models
-
-### Palm Detection Model
-
-To detect initial hand locations, we designed a
-[single-shot detector](https://arxiv.org/abs/1512.02325) model optimized for
-mobile real-time uses in a manner similar to the face detection model in
-[MediaPipe Face Mesh](./face_mesh_mobile_gpu.md). Detecting hands is a decidedly
-complex task: our model has to work across a variety of hand sizes with a large
-scale span (~20x) relative to the image frame and be able to detect occluded and
-self-occluded hands. Whereas faces have high contrast patterns, e.g., in the eye
-and mouth region, the lack of such features in hands makes it comparatively
-difficult to detect them reliably from their visual features alone. Instead,
-providing additional context, like arm, body, or person features, aids accurate
-hand localization.
-
-Our method addresses the above challenges using different strategies. First, we
-train a palm detector instead of a hand detector, since estimating bounding
-boxes of rigid objects like palms and fists is significantly simpler than
-detecting hands with articulated fingers. In addition, as palms are smaller
-objects, the non-maximum suppression algorithm works well even for two-hand
-self-occlusion cases, like handshakes. Moreover, palms can be modelled using
-square bounding boxes (anchors in ML terminology) ignoring other aspect ratios,
-and therefore reducing the number of anchors by a factor of 3-5. Second, an
-encoder-decoder feature extractor is used for bigger scene context awareness
-even for small objects (similar to the RetinaNet approach). Lastly, we minimize
-the focal loss during training to support a large amount of anchors resulting
-from the high scale variance.
-
-With the above techniques, we achieve an average precision of 95.7% in palm
-detection. Using a regular cross entropy loss and no decoder gives a baseline of
-just 86.22%.
-
-### Hand Landmark Model
-
-After the palm detection over the whole image our subsequent hand landmark model
-performs precise keypoint localization of 21 3D hand-knuckle coordinates inside
-the detected hand regions via regression, that is direct coordinate prediction.
-The model learns a consistent internal hand pose representation and is robust
-even to partially visible hands and self-occlusions.
-
-To obtain ground truth data, we have manually annotated ~30K real-world images
-with 21 3D coordinates, as shown below (we take Z-value from image depth map, if
-it exists per corresponding coordinate). To better cover the possible hand poses
-and provide additional supervision on the nature of hand geometry, we also
-render a high-quality synthetic hand model over various backgrounds and map it
-to the corresponding 3D coordinates.
-
-![hand_crops.png](images/mobile/hand_crops.png)
-
-*Fig 2. Top: Aligned hand crops passed to the tracking network with ground truth
-annotation. Bottom: Rendered synthetic hand images with ground truth
-annotation.*
-
-## Example Apps
-
-Please see the [general instructions](./building_examples.md) for how to build
-MediaPipe examples for different platforms.
-
-#### Main Example
-
-*   Android:
-    [Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handtrackinggpu),
-    [Prebuilt ARM64 APK](https://drive.google.com/open?id=1uCjS0y0O0dTDItsMh8x2cf4-l3uHW1vE)
-*   iOS:
-    [Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/handtrackinggpu)
-*   Desktop:
-    [Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/hand_tracking)
-
-#### With Multi-hand Support
-
-*   Android:
-    [Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/multihandtrackinggpu),
-    [Prebuilt ARM64 APK](https://drive.google.com/open?id=1Wk6V9EVaz1ks_MInPqqVGvvJD01SGXDc)
-*   iOS:
-    [Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/multihandtrackinggpu)
-*   Desktop:
-    [Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/multi_hand_tracking)
-
-#### Palm/Hand Detection Only (no landmarks)
-
-*   Android:
-    [Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handdetectionggpu),
-    [Prebuilt ARM64 APK](https://drive.google.com/open?id=1qUlTtH7Ydg-wl_H6VVL8vueu2UCTu37E)
-*   iOS:
-    [Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/handdetectiongpu)
-
-## Resources
-
-*   [Google AI Blog: On-Device, Real-Time Hand Tracking with MediaPipe](https://ai.googleblog.com/2019/08/on-device-real-time-hand-tracking-with.html)
-*   [TensorFlow Blog: Face and hand tracking in the browser with MediaPipe and
-    TensorFlow.js](https://blog.tensorflow.org/2020/03/face-and-hand-tracking-in-browser-with-mediapipe-and-tensorflowjs.html)
-*   Palm detection model:
-    [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/palm_detection.tflite),
-    [TF.js model](https://tfhub.dev/mediapipe/handdetector/1)
-*   Hand landmark model:
-    [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/hand_landmark.tflite),
-    [TF.js model](https://tfhub.dev/mediapipe/handskeleton/1)
-*   [Model card](https://mediapipe.page.link/handmc)
+Content moved to [MediaPipe Hand](https://google.github.io/mediapipe/solutions/hand)
diff --git a/mediapipe/docs/images/iris_tracking_desktop.png b/mediapipe/docs/images/iris_tracking_desktop.png
deleted file mode 100644
index a0dd91fcd..000000000
Binary files a/mediapipe/docs/images/iris_tracking_desktop.png and /dev/null differ
diff --git a/mediapipe/docs/measure_performance.md b/mediapipe/docs/measure_performance.md
deleted file mode 100644
index e4b2bde58..000000000
--- a/mediapipe/docs/measure_performance.md
+++ /dev/null
@@ -1,18 +0,0 @@
-# Measuring Performance
-
-*Coming soon.*
-
-MediaPipe includes APIs for gathering aggregate performance data and
-event timing data for CPU and GPU operations.  These API's can be found at:
-
-<!-- TODO: Update the source code URL's to local or public URL's -->
-
-   * [`GraphProfiler`](https://github.com/google/mediapipe/tree/master/mediapipe/framework/profiler/graph_profiler.h):
-     Accumulates for each running calculator a histogram of latencies for
-     Process calls.
-   * [`GraphTracer`](https://github.com/google/mediapipe/tree/master/mediapipe/framework/profiler/graph_tracer.h):
-     Records for each running calculator and each processed packet a series
-     of timed events including the start and finish of each Process call.
-
-Future mediapipe releases will include tools for visualizing and analysing
-the latency histograms and timed events captured by these API's.
diff --git a/mediapipe/docs/multi_hand_tracking_desktop.md b/mediapipe/docs/multi_hand_tracking_desktop.md
deleted file mode 100644
index b9edb08d3..000000000
--- a/mediapipe/docs/multi_hand_tracking_desktop.md
+++ /dev/null
@@ -1,177 +0,0 @@
-## Multi-Hand Tracking on Desktop
-
-This is an example of using MediaPipe to run hand tracking models (TensorFlow
-Lite) and render bounding boxes on the detected hand instances (for multiple
-hands). To know more about the hand tracking models, please refer to the model
-[`README file`]. Moreover, if you are interested in running the same TensorfFlow
-Lite model on Android/iOS, please see the
-[Mulit-Hand Tracking on GPU on Android/iOS](multi_hand_tracking_mobile_gpu.md)
-and
-
-We show the hand tracking demos with TensorFlow Lite model using the Webcam:
-
--   [TensorFlow Lite Multi-Hand Tracking Demo with Webcam (CPU)](#tensorflow-lite-multi-hand-tracking-demo-with-webcam-cpu)
-
--   [TensorFlow Lite Multi-Hand Tracking Demo with Webcam (GPU)](#tensorflow-lite-multi-hand-tracking-demo-with-webcam-gpu)
-
-Note: If MediaPipe depends on OpenCV 2, please see the
-[known issues with OpenCV 2](./object_detection_desktop.md#known-issues-with-opencv-2)
-section.
-
-### TensorFlow Lite Multi-Hand Tracking Demo with Webcam (CPU)
-
-To build and run the TensorFlow Lite example on desktop (CPU) with Webcam, run:
-
-```bash
-# Video from webcam running on desktop CPU
-$ bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 \
-    mediapipe/examples/desktop/multi_hand_tracking:multi_hand_tracking_cpu
-
-# It should print:
-#Target //mediapipe/examples/desktop/multi_hand_tracking:multi_hand_tracking_cpu up-to-date:
-#  bazel-bin/mediapipe/examples/desktop/multi_hand_tracking/multi_hand_tracking_cpu
-
-# This will open up your webcam as long as it is connected and on
-# Any errors is likely due to your webcam being not accessible
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/multi_hand_tracking/multi_hand_tracking_cpu \
-    --calculator_graph_config_file=mediapipe/graphs/hand_tracking/multi_hand_tracking_desktop_live.pbtxt
-```
-
-### TensorFlow Lite Multi-Hand Tracking Demo with Webcam (GPU)
-
-Note: This currently works only on Linux, and please first follow
-[OpenGL ES Setup on Linux Desktop](./gpu.md#opengl-es-setup-on-linux-desktop).
-
-To build and run the TensorFlow Lite example on desktop (GPU) with Webcam, run:
-
-```bash
-# Video from webcam running on desktop GPU
-# This works only for Linux currently
-$ bazel build -c opt --copt -DMESA_EGL_NO_X11_HEADERS --copt -DEGL_NO_X11 \
-    mediapipe/examples/desktop/multi_hand_tracking:multi_hand_tracking_gpu
-
-# It should print:
-# Target //mediapipe/examples/desktop/multi_hand_tracking:multi_hand_tracking_gpu up-to-date:
-#  bazel-bin/mediapipe/examples/desktop/multi_hand_tracking/multi_hand_tracking_gpu
-
-# This will open up your webcam as long as it is connected and on
-# Any errors is likely due to your webcam being not accessible,
-# or GPU drivers not setup properly.
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/multi_hand_tracking/multi_hand_tracking_gpu \
-    --calculator_graph_config_file=mediapipe/graphs/hand_tracking/multi_hand_tracking_mobile.pbtxt
-```
-
-#### Graph
-
-![graph visualization](images/multi_hand_tracking_desktop.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into [MediaPipe Visualizer](https://viz.mediapipe.dev).
-
-```bash
-# MediaPipe graph that performs multi-hand tracking on desktop with TensorFlow
-# Lite on CPU.
-# Used in the example in
-# mediapipie/examples/desktop/multi_hand_tracking:multi_hand_tracking_cpu.
-
-# Images coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Determines if an input vector of NormalizedRect has a size greater than or
-# equal to the provided min_size.
-node {
-  calculator: "NormalizedRectVectorHasMinSizeCalculator"
-  input_stream: "ITERABLE:prev_multi_hand_rects_from_landmarks"
-  output_stream: "prev_has_enough_hands"
-  node_options: {
-    [type.googleapis.com/mediapipe.CollectionHasMinSizeCalculatorOptions] {
-      # This value can be changed to support tracking arbitrary number of hands.
-      # Please also remember to modify max_vec_size in
-      # ClipVectorSizeCalculatorOptions in
-      # mediapipe/graphs/hand_tracking/subgraphs/multi_hand_detection_gpu.pbtxt
-      min_size: 2
-    }
-  }
-}
-
-# Drops the incoming image if the previous frame had at least N hands.
-# Otherwise, passes the incoming image through to trigger a new round of hand
-# detection in MultiHandDetectionSubgraph.
-node {
-  calculator: "GateCalculator"
-  input_stream: "input_video"
-  input_stream: "DISALLOW:prev_has_enough_hands"
-  output_stream: "multi_hand_detection_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.GateCalculatorOptions] {
-      empty_packets_as_allow: true
-    }
-  }
-}
-
-# Subgraph that detections hands (see multi_hand_detection_cpu.pbtxt).
-node {
-  calculator: "MultiHandDetectionSubgraph"
-  input_stream: "multi_hand_detection_input_video"
-  output_stream: "DETECTIONS:multi_palm_detections"
-  output_stream: "NORM_RECTS:multi_palm_rects"
-}
-
-# Subgraph that localizes hand landmarks for multiple hands (see
-# multi_hand_landmark.pbtxt).
-node {
-  calculator: "MultiHandLandmarkSubgraph"
-  input_stream: "IMAGE:input_video"
-  input_stream: "NORM_RECTS:multi_hand_rects"
-  output_stream: "LANDMARKS:multi_hand_landmarks"
-  output_stream: "NORM_RECTS:multi_hand_rects_from_landmarks"
-}
-
-# Caches a hand rectangle fed back from MultiHandLandmarkSubgraph, and upon the
-# arrival of the next input image sends out the cached rectangle with the
-# timestamp replaced by that of the input image, essentially generating a packet
-# that carries the previous hand rectangle. Note that upon the arrival of the
-# very first input image, an empty packet is sent out to jump start the
-# feedback loop.
-node {
-  calculator: "PreviousLoopbackCalculator"
-  input_stream: "MAIN:input_video"
-  input_stream: "LOOP:multi_hand_rects_from_landmarks"
-  input_stream_info: {
-    tag_index: "LOOP"
-    back_edge: true
-  }
-  output_stream: "PREV_LOOP:prev_multi_hand_rects_from_landmarks"
-}
-
-# Performs association between NormalizedRect vector elements from previous
-# frame and those from the current frame if MultiHandDetectionSubgraph runs.
-# This calculator ensures that the output multi_hand_rects vector doesn't
-# contain overlapping regions based on the specified min_similarity_threshold.
-node {
-  calculator: "AssociationNormRectCalculator"
-  input_stream: "prev_multi_hand_rects_from_landmarks"
-  input_stream: "multi_palm_rects"
-  output_stream: "multi_hand_rects"
-  node_options: {
-    [type.googleapis.com/mediapipe.AssociationCalculatorOptions] {
-      min_similarity_threshold: 0.5
-    }
-  }
-}
-
-# Subgraph that renders annotations and overlays them on top of the input
-# images (see multi_hand_renderer_cpu.pbtxt).
-node {
-  calculator: "MultiHandRendererSubgraph"
-  input_stream: "IMAGE:input_video"
-  input_stream: "DETECTIONS:multi_palm_detections"
-  input_stream: "LANDMARKS:multi_hand_landmarks"
-  input_stream: "NORM_RECTS:0:multi_palm_rects"
-  input_stream: "NORM_RECTS:1:multi_hand_rects"
-  output_stream: "IMAGE:output_video"
-}
-```
-
-[`README file`]:https://github.com/google/mediapipe/tree/master/mediapipe/README.md
diff --git a/mediapipe/docs/multi_hand_tracking_mobile_gpu.md b/mediapipe/docs/multi_hand_tracking_mobile_gpu.md
index 8665f2546..7cbd74181 100644
--- a/mediapipe/docs/multi_hand_tracking_mobile_gpu.md
+++ b/mediapipe/docs/multi_hand_tracking_mobile_gpu.md
@@ -1,743 +1 @@
-# Multi-Hand Tracking (GPU)
-
-This doc focuses on the
-[example graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/multi_hand_tracking_mobile.pbtxt)
-that performs multi-hand tracking with TensorFlow Lite on GPU. It is related to
-the [hand_tracking_example](./hand_tracking_mobile_gpu.md), and we recommend
-users to review the (single) hand tracking example first.
-
-![multi_hand_tracking_android_gpu.gif](images/mobile/multi_hand_tracking_android_gpu.gif)
-
-In the visualization above, the red dots represent the hand landmarks and the
-green lines are simply connections between selected landmark paris for
-visualization of the hand skeleton. When there are fewer than `N` hands (`N=2`
-in the graphs here), the purple box represents a hand rectangle that covers the
-entire hand, derived from hand detection (see
-[hand_detection_example](./hand_detection_mobile_gpu.md)). When there are `N`
-hands (i.e. 2 hands for the graphs here), the red boxes represent hand
-rectangles for each of the hands, derived from the previous round of hand
-landmark localization using an ML model (see also
-[model card](https://mediapipe.page.link/handmc)). Hand landmark localization
-for each hand is performed only within the hand rectangle for computational
-efficiency and accuracy. Hand detection is only invoked whenever there are fewer
-than `N` hands in the previous iteration.
-
-This example can also run a model that localizes hand landmarks in 3D (i.e.,
-estimating an extra z coordinate):
-
-![multi_hand_tracking_3d_android_gpu.gif](images/mobile/multi_hand_tracking_3d_android_gpu.gif)
-
-In the visualization above, the localized hand landmarks are represented by dots
-in different shades, with the brighter ones denoting landmarks closer to the
-camera.
-
-## Android
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/multihandtrackinggpu)
-
-To build the app yourself, run:
-
-```bash
-bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/multihandtrackinggpu
-```
-
-Once the app is built, install it on Android device with:
-
-```bash
-adb install bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/multihandtrackinggpu/multihandtrackinggpu.apk
-```
-
-## iOS
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/multihandtrackinggpu).
-
-See the general [instructions](./building_examples.md#ios) for building iOS
-examples and generating an Xcode project. This will be the HandDetectionGpuApp
-target.
-
-To build on the command line:
-
-```bash
-bazel build -c opt --config=ios_arm64 mediapipe/examples/ios/multihandtrackinggpu:MultiHandTrackingGpuApp
-```
-
-## Graph
-
-The multi-hand tracking [main graph](#main-graph) internal utilizes a
-[multi_hand_detection_subgraph](#multi-hand-detection-subgraph), a
-[multi_hand_landmark_subgraph](#multi-hand-landmark-subgraph), and a
-[multi_hand_renderer_subgraph](#multi-hand-renderer-subgraph).
-
-The subgraphs show up in the main graph visualization as nodes colored in
-purple, and the subgraph itself can also be visualized just like a regular
-graph. For more information on how to visualize a graph that includes subgraphs,
-see the Visualizing Subgraphs section in the
-[visualizer documentation](./visualizer.md).
-
-### Main Graph
-
-![multi_hand_tracking_mobile_graph](images/mobile/multi_hand_tracking_mobile.png)
-
-There are two key differences between this graph and the
-[single_hand_tracking_mobile_graph](./hand_tracking_mobile_gpu.md).
-
-1.  There is a `NormalizedRectVectorHasMinSize` calculator, that checks if in
-    input vector of `NormalizedRect` objects has a minimum size equal to `N`. In
-    this graph, if the vector contains fewer than `N` objects,
-    `MultiHandDetection` subgraph runs. Otherwise, the `GateCalculator` doesn't
-    send any image packets to the `MultiHandDetection` subgraph. This way, the
-    main graph is efficient in that it avoids running the costly hand detection
-    step when there are already `N` hands in the frame.
-2.  The `MergeCalculator` has been replaced by the `AssociationNormRect`
-    calculator. This `AssociationNormRect` takes as input a vector of
-    `NormalizedRect` objects from the `MultiHandDetection` subgraph on the
-    current frame, and a vector of `NormalizedRect` objects from the
-    `MultiHandLandmark` subgraph from the previous frame, and performs an
-    association operation between these objects. This calculator ensures that
-    the output vector doesn't contain overlapping regions based on the specified
-    `min_similarity_threshold`.
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/multi_hand_tracking_mobile.pbtxt)
-
-```bash
-# MediaPipe graph that performs multi-hand tracking with TensorFlow Lite on GPU.
-# Used in the examples in
-# mediapipie/examples/android/src/java/com/mediapipe/apps/multihandtrackinggpu.
-
-# Images coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Throttles the images flowing downstream for flow control. It passes through
-# the very first incoming image unaltered, and waits for downstream nodes
-# (calculators and subgraphs) in the graph to finish their tasks before it
-# passes through another image. All images that come in while waiting are
-# dropped, limiting the number of in-flight images in most part of the graph to
-# 1. This prevents the downstream nodes from queuing up incoming images and data
-# excessively, which leads to increased latency and memory usage, unwanted in
-# real-time mobile applications. It also eliminates unnecessarily computation,
-# e.g., the output produced by a node may get dropped downstream if the
-# subsequent nodes are still busy processing previous inputs.
-node {
-  calculator: "FlowLimiterCalculator"
-  input_stream: "input_video"
-  input_stream: "FINISHED:multi_hand_rects"
-  input_stream_info: {
-    tag_index: "FINISHED"
-    back_edge: true
-  }
-  output_stream: "throttled_input_video"
-}
-
-# Determines if an input vector of NormalizedRect has a size greater than or
-# equal to the provided min_size.
-node {
-  calculator: "NormalizedRectVectorHasMinSizeCalculator"
-  input_stream: "ITERABLE:prev_multi_hand_rects_from_landmarks"
-  output_stream: "prev_has_enough_hands"
-  node_options: {
-    [type.googleapis.com/mediapipe.CollectionHasMinSizeCalculatorOptions] {
-      # This value can be changed to support tracking arbitrary number of hands.
-      # Please also remember to modify max_vec_size in
-      # ClipVectorSizeCalculatorOptions in
-      # mediapipe/graphs/hand_tracking/subgraphs/multi_hand_detection_gpu.pbtxt
-      min_size: 2
-    }
-  }
-}
-
-# Drops the incoming image if the previous frame had at least N hands.
-# Otherwise, passes the incoming image through to trigger a new round of hand
-# detection in MultiHandDetectionSubgraph.
-node {
-  calculator: "GateCalculator"
-  input_stream: "throttled_input_video"
-  input_stream: "DISALLOW:prev_has_enough_hands"
-  output_stream: "multi_hand_detection_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.GateCalculatorOptions] {
-      empty_packets_as_allow: true
-    }
-  }
-}
-
-# Subgraph that detections hands (see multi_hand_detection_gpu.pbtxt).
-node {
-  calculator: "MultiHandDetectionSubgraph"
-  input_stream: "multi_hand_detection_input_video"
-  output_stream: "DETECTIONS:multi_palm_detections"
-  output_stream: "NORM_RECTS:multi_palm_rects"
-}
-
-# Subgraph that localizes hand landmarks for multiple hands (see
-# multi_hand_landmark.pbtxt).
-node {
-  calculator: "MultiHandLandmarkSubgraph"
-  input_stream: "IMAGE:throttled_input_video"
-  input_stream: "NORM_RECTS:multi_hand_rects"
-  output_stream: "LANDMARKS:multi_hand_landmarks"
-  output_stream: "NORM_RECTS:multi_hand_rects_from_landmarks"
-}
-
-# Caches a hand rectangle fed back from MultiHandLandmarkSubgraph, and upon the
-# arrival of the next input image sends out the cached rectangle with the
-# timestamp replaced by that of the input image, essentially generating a packet
-# that carries the previous hand rectangle. Note that upon the arrival of the
-# very first input image, an empty packet is sent out to jump start the
-# feedback loop.
-node {
-  calculator: "PreviousLoopbackCalculator"
-  input_stream: "MAIN:throttled_input_video"
-  input_stream: "LOOP:multi_hand_rects_from_landmarks"
-  input_stream_info: {
-    tag_index: "LOOP"
-    back_edge: true
-  }
-  output_stream: "PREV_LOOP:prev_multi_hand_rects_from_landmarks"
-}
-
-# Performs association between NormalizedRect vector elements from previous
-# frame and those from the current frame if MultiHandDetectionSubgraph runs.
-# This calculator ensures that the output multi_hand_rects vector doesn't
-# contain overlapping regions based on the specified min_similarity_threshold.
-node {
-  calculator: "AssociationNormRectCalculator"
-  input_stream: "prev_multi_hand_rects_from_landmarks"
-  input_stream: "multi_palm_rects"
-  output_stream: "multi_hand_rects"
-  node_options: {
-    [type.googleapis.com/mediapipe.AssociationCalculatorOptions] {
-      min_similarity_threshold: 0.5
-    }
-  }
-}
-
-# Subgraph that renders annotations and overlays them on top of the input
-# images (see multi_hand_renderer_gpu.pbtxt).
-node {
-  calculator: "MultiHandRendererSubgraph"
-  input_stream: "IMAGE:throttled_input_video"
-  input_stream: "DETECTIONS:multi_palm_detections"
-  input_stream: "LANDMARKS:multi_hand_landmarks"
-  input_stream: "NORM_RECTS:0:multi_palm_rects"
-  input_stream: "NORM_RECTS:1:multi_hand_rects"
-  output_stream: "IMAGE:output_video"
-}
-```
-
-### Multi-Hand Detection Subgraph
-
-![multi_hand_detection_gpu_subgraph](images/mobile/multi_hand_detection_gpu_subgraph.png)
-
-This graph outputs a vector of `NormalizedRect` objects corresponding to each of
-the hand instances visible in the frame. Note that at the end of this graph,
-there is a `ClipNormalizedRectVectorSizeCalculator`. This calculator clips the
-size of the input vector to a maximum size `N`. This implies that the
-`MultiHandDetection` subgraph outputs a vector of maximum `N` hand instance
-locations.
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/subgraphs/multi_hand_detection_gpu.pbtxt)
-
-```bash
-# MediaPipe multi-hand detection subgraph.
-
-type: "MultiHandDetectionSubgraph"
-
-input_stream: "input_video"
-output_stream: "DETECTIONS:palm_detections"
-output_stream: "NORM_RECTS:clipped_hand_rects_from_palm_detections"
-
-# Transforms the input image on GPU to a 256x256 image. To scale the input
-# image, the scale_mode option is set to FIT to preserve the aspect ratio,
-# resulting in potential letterboxing in the transformed image.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE_GPU:input_video"
-  output_stream: "IMAGE_GPU:transformed_input_video"
-  output_stream: "LETTERBOX_PADDING:letterbox_padding"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 256
-      output_height: 256
-      scale_mode: FIT
-    }
-  }
-}
-
-# Generates a single side packet containing a TensorFlow Lite op resolver that
-# supports custom ops needed by the model used in this graph.
-node {
-  calculator: "TfLiteCustomOpResolverCalculator"
-  output_side_packet: "opresolver"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteCustomOpResolverCalculatorOptions] {
-      use_gpu: true
-    }
-  }
-}
-
-# Converts the transformed input image on GPU into an image tensor stored as a
-# TfLiteTensor.
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE_GPU:transformed_input_video"
-  output_stream: "TENSORS_GPU:image_tensor"
-}
-
-# Runs a TensorFlow Lite model on GPU that takes an image tensor and outputs a
-# vector of tensors representing, for instance, detection boxes/keypoints and
-# scores.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS_GPU:image_tensor"
-  output_stream: "TENSORS_GPU:detection_tensors"
-  input_side_packet: "CUSTOM_OP_RESOLVER:opresolver"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "mediapipe/models/palm_detection.tflite"
-      use_gpu: true
-    }
-  }
-}
-
-# Generates a single side packet containing a vector of SSD anchors based on
-# the specification in the options.
-node {
-  calculator: "SsdAnchorsCalculator"
-  output_side_packet: "anchors"
-  node_options: {
-    [type.googleapis.com/mediapipe.SsdAnchorsCalculatorOptions] {
-      num_layers: 5
-      min_scale: 0.1171875
-      max_scale: 0.75
-      input_size_height: 256
-      input_size_width: 256
-      anchor_offset_x: 0.5
-      anchor_offset_y: 0.5
-      strides: 8
-      strides: 16
-      strides: 32
-      strides: 32
-      strides: 32
-      aspect_ratios: 1.0
-      fixed_anchor_size: true
-    }
-  }
-}
-
-# Decodes the detection tensors generated by the TensorFlow Lite model, based on
-# the SSD anchors and the specification in the options, into a vector of
-# detections. Each detection describes a detected object.
-node {
-  calculator: "TfLiteTensorsToDetectionsCalculator"
-  input_stream: "TENSORS_GPU:detection_tensors"
-  input_side_packet: "ANCHORS:anchors"
-  output_stream: "DETECTIONS:detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToDetectionsCalculatorOptions] {
-      num_classes: 1
-      num_boxes: 2944
-      num_coords: 18
-      box_coord_offset: 0
-      keypoint_coord_offset: 4
-      num_keypoints: 7
-      num_values_per_keypoint: 2
-      sigmoid_score: true
-      score_clipping_thresh: 100.0
-      reverse_output_order: true
-
-      x_scale: 256.0
-      y_scale: 256.0
-      h_scale: 256.0
-      w_scale: 256.0
-      min_score_thresh: 0.7
-    }
-  }
-}
-
-# Performs non-max suppression to remove excessive detections.
-node {
-  calculator: "NonMaxSuppressionCalculator"
-  input_stream: "detections"
-  output_stream: "filtered_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.NonMaxSuppressionCalculatorOptions] {
-      min_suppression_threshold: 0.3
-      overlap_type: INTERSECTION_OVER_UNION
-      algorithm: WEIGHTED
-      return_empty_detections: true
-    }
-  }
-}
-
-# Maps detection label IDs to the corresponding label text ("Palm"). The label
-# map is provided in the label_map_path option.
-node {
-  calculator: "DetectionLabelIdToTextCalculator"
-  input_stream: "filtered_detections"
-  output_stream: "labeled_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionLabelIdToTextCalculatorOptions] {
-      label_map_path: "mediapipe/models/palm_detection_labelmap.txt"
-    }
-  }
-}
-
-# Adjusts detection locations (already normalized to [0.f, 1.f]) on the
-# letterboxed image (after image transformation with the FIT scale mode) to the
-# corresponding locations on the same image with the letterbox removed (the
-# input image to the graph before image transformation).
-node {
-  calculator: "DetectionLetterboxRemovalCalculator"
-  input_stream: "DETECTIONS:labeled_detections"
-  input_stream: "LETTERBOX_PADDING:letterbox_padding"
-  output_stream: "DETECTIONS:palm_detections"
-}
-
-# Extracts image size from the input images.
-node {
-  calculator: "ImagePropertiesCalculator"
-  input_stream: "IMAGE_GPU:input_video"
-  output_stream: "SIZE:image_size"
-}
-
-# Converts each palm detection into a rectangle (normalized by image size)
-# that encloses the palm and is rotated such that the line connecting center of
-# the wrist and MCP of the middle finger is aligned with the Y-axis of the
-# rectangle.
-node {
-  calculator: "DetectionsToRectsCalculator"
-  input_stream: "DETECTIONS:palm_detections"
-  input_stream: "IMAGE_SIZE:image_size"
-  output_stream: "NORM_RECTS:palm_rects"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRectsCalculatorOptions] {
-      rotation_vector_start_keypoint_index: 0  # Center of wrist.
-      rotation_vector_end_keypoint_index: 2  # MCP of middle finger.
-      rotation_vector_target_angle_degrees: 90
-      output_zero_rect_for_empty_detections: true
-    }
-  }
-}
-
-# Expands and shifts the rectangle that contains the palm so that it's likely
-# to cover the entire hand.
-node {
-  calculator: "RectTransformationCalculator"
-  input_stream: "NORM_RECTS:palm_rects"
-  input_stream: "IMAGE_SIZE:image_size"
-  output_stream: "hand_rects_from_palm_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.RectTransformationCalculatorOptions] {
-      scale_x: 2.6
-      scale_y: 2.6
-      shift_y: -0.5
-      square_long: true
-    }
-  }
-}
-
-# Clips the size of the input vector to the provided max_vec_size. This
-# determines the maximum number of hand instances this graph outputs.
-# Note that the performance gain of clipping detections earlier in this graph is
-# minimal because NMS will minimize overlapping detections and the number of
-# detections isn't expected to exceed 5-10.
-node {
-  calculator: "ClipNormalizedRectVectorSizeCalculator"
-  input_stream: "hand_rects_from_palm_detections"
-  output_stream: "clipped_hand_rects_from_palm_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.ClipVectorSizeCalculatorOptions] {
-      # This value can be changed to support tracking arbitrary number of hands.
-      # Please also remember to modify min_size in
-      # CollectionHsMinSizeCalculatorOptions in
-      # mediapipe/graphs/hand_tracking/multi_hand_tracking_mobile.pbtxt and
-      # mediapipe/graphs/hand_tracking/multi_hand_tracking_desktop_live.pbtxt.
-      max_vec_size: 2
-    }
-  }
-}
-```
-
-### Multi-Hand Landmark Subgraph
-
-![multi_hand_landmark_subgraph.pbtxt](images/mobile/multi_hand_landmark_subgraph.png)
-
-This graph accepts as input a vector of `NormalizedRect` objects, corresponding
-the the region of each hand instance in the input image. For each
-`NormalizedRect` object, the graph runs the existing `HandLandmark` subgraph and
-collect the outputs of this subgraph into vectors. This is enabled by
-`BeginLoop` and `EndLoop` calculators.
-
-The `BeginLoop` calculator accepts as input a packet containing an iterable
-collection of elements. This calculator is templatized (see
-[begin_loop_calculator.h](https://github.com/google/mediapipe/tree/master/mediapipe/calculators/core/begin_loop_calculator.h)).
-If the input packet arrived at a timestamp `ts`, this calculator outputs each
-element in the collection at a fake timestamp `internal_ts`. At the end of the
-collection, the calculator outputs the arrival timestamp `ts` in the output
-stream tagged with `BATCH_END`.
-
-The nodes between the `BeginLoop` calculator and the corresponding `EndLoop`
-calculator process individual packets at the fake timestamps `internal_ts`.
-After each element is processed, it is sent to the `EndLoop` calculator (see
-[end_loop_calculator.h](https://github.com/google/mediapipe/tree/master/mediapipe/calculators/core/end_loop_calculator.h)),
-which collects these elements in an output collection. The `EndLoop` calculator
-listens for packets from the `BATCH_END` output stream of the `BeginLoop`
-calculator. When the `BATCH_END` packet containing the real timestamp `ts`
-arrives at the `EndLoop` calculator, the `EndLoop` calculator outputs a packet
-containing the collection of processed elements at the real timestamp `ts`.
-
-In the multi-hand landmark subgraph, the `EndLoop` calculators collect the
-output vector of hand landmarks per hand instance, the boolean values indicating
-the presence of each hand and the `NormalizedRect` objects corresponding to the
-regions surrounding each hand into vectors.
-
-Finally, based on the hand presence boolean value, the graph filters the
-collections of hand landmarks and `NormalizdRect` objects corresponding to each
-hand instance.
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/subgraphs/multi_hand_landmark.pbtxt)
-
-```bash
-# MediaPipe hand landmark localization subgraph.
-
-type: "MultiHandLandmarkSubgraph"
-
-input_stream: "IMAGE:input_video"
-# A vector of NormalizedRect, one per each hand detected.
-input_stream: "NORM_RECTS:multi_hand_rects"
-# A vector of NormalizedLandmarks, one set per each hand.
-output_stream: "LANDMARKS:filtered_multi_hand_landmarks"
-# A vector of NormalizedRect, one per each hand.
-output_stream: "NORM_RECTS:filtered_multi_hand_rects_for_next_frame"
-
-# Outputs each element of multi_hand_rects at a fake timestamp for the rest
-# of the graph to process. Clones the input_video packet for each
-# single_hand_rect at the fake timestamp. At the end of the loop,
-# outputs the BATCH_END timestamp for downstream calculators to inform them
-# that all elements in the vector have been processed.
-node {
-  calculator: "BeginLoopNormalizedRectCalculator"
-  input_stream: "ITERABLE:multi_hand_rects"
-  input_stream: "CLONE:input_video"
-  output_stream: "ITEM:single_hand_rect"
-  output_stream: "CLONE:input_video_cloned"
-  output_stream: "BATCH_END:single_hand_rect_timestamp"
-}
-
-node {
-  calculator: "HandLandmarkSubgraph"
-  input_stream: "IMAGE:input_video_cloned"
-  input_stream: "NORM_RECT:single_hand_rect"
-  output_stream: "LANDMARKS:single_hand_landmarks"
-  output_stream: "NORM_RECT:single_hand_rect_from_landmarks"
-  output_stream: "PRESENCE:single_hand_presence"
-}
-
-# Collects the boolean presence value for each single hand into a vector. Upon
-# receiving the BATCH_END timestamp, outputs a vector of boolean values at the
-# BATCH_END timestamp.
-node {
-  calculator: "EndLoopBooleanCalculator"
-  input_stream: "ITEM:single_hand_presence"
-  input_stream: "BATCH_END:single_hand_rect_timestamp"
-  output_stream: "ITERABLE:multi_hand_presence"
-}
-
-# Collects a set of landmarks for each hand into a vector. Upon receiving the
-# BATCH_END timestamp, outputs the vector of landmarks at the BATCH_END
-# timestamp.
-node {
-  calculator: "EndLoopNormalizedLandmarkListVectorCalculator"
-  input_stream: "ITEM:single_hand_landmarks"
-  input_stream: "BATCH_END:single_hand_rect_timestamp"
-  output_stream: "ITERABLE:multi_hand_landmarks"
-}
-
-# Collects a NormalizedRect for each hand into a vector. Upon receiving the
-# BATCH_END timestamp, outputs the vector of NormalizedRect at the BATCH_END
-# timestamp.
-node {
-  calculator: "EndLoopNormalizedRectCalculator"
-  input_stream: "ITEM:single_hand_rect_from_landmarks"
-  input_stream: "BATCH_END:single_hand_rect_timestamp"
-  output_stream: "ITERABLE:multi_hand_rects_for_next_frame"
-}
-
-# Filters the input vector of landmarks based on hand presence value for each
-# hand. If the hand presence for hand #i is false, the set of landmarks
-# corresponding to that hand are dropped from the vector.
-node {
-  calculator: "FilterLandmarkListCollectionCalculator"
-  input_stream: "ITERABLE:multi_hand_landmarks"
-  input_stream: "CONDITION:multi_hand_presence"
-  output_stream: "ITERABLE:filtered_multi_hand_landmarks"
-}
-
-# Filters the input vector of NormalizedRect based on hand presence value for
-# each hand. If the hand presence for hand #i is false, the NormalizedRect
-# corresponding to that hand are dropped from the vector.
-node {
-  calculator: "FilterNormalizedRectCollectionCalculator"
-  input_stream: "ITERABLE:multi_hand_rects_for_next_frame"
-  input_stream: "CONDITION:multi_hand_presence"
-  output_stream: "ITERABLE:filtered_multi_hand_rects_for_next_frame"
-}
-```
-
-### Multi-Hand Renderer Subgraph
-
-![multi_hand_renderer_gpu_subgraph.pbtxt](images/mobile/multi_hand_renderer_gpu_subgraph.png)
-
-This graph also uses `BeginLoop` and `EndLoop` calculators to iteratively
-convert a set of hand landmarks per hand instance into corresponding
-`RenderData` objects.
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/hand_tracking/subgraphs/multi_hand_renderer_gpu.pbtxt)
-
-```bash
-# MediaPipe multi-hand tracking rendering subgraph.
-
-type: "MultiHandRendererSubgraph"
-
-input_stream: "IMAGE:input_image"
-# A vector of NormalizedLandmarks, one for each hand.
-input_stream: "LANDMARKS:multi_hand_landmarks"
-# A vector of NormalizedRect, one for each hand.
-input_stream: "NORM_RECTS:0:multi_palm_rects"
-# A vector of NormalizedRect, one for each hand.
-input_stream: "NORM_RECTS:1:multi_hand_rects"
-# A vector of Detection, one for each hand.
-input_stream: "DETECTIONS:palm_detections"
-output_stream: "IMAGE:output_image"
-
-# Converts detections to drawing primitives for annotation overlay.
-node {
-  calculator: "DetectionsToRenderDataCalculator"
-  input_stream: "DETECTIONS:palm_detections"
-  output_stream: "RENDER_DATA:detection_render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRenderDataCalculatorOptions] {
-      thickness: 4.0
-      color { r: 0 g: 255 b: 0 }
-    }
-  }
-}
-
-# Converts normalized rects to drawing primitives for annotation overlay.
-node {
-  calculator: "RectToRenderDataCalculator"
-  input_stream: "NORM_RECTS:multi_hand_rects"
-  output_stream: "RENDER_DATA:multi_hand_rects_render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.RectToRenderDataCalculatorOptions] {
-      filled: false
-      color { r: 255 g: 0 b: 0 }
-      thickness: 4.0
-    }
-  }
-}
-
-# Converts normalized rects to drawing primitives for annotation overlay.
-node {
-  calculator: "RectToRenderDataCalculator"
-  input_stream: "NORM_RECTS:multi_palm_rects"
-  output_stream: "RENDER_DATA:multi_palm_rects_render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.RectToRenderDataCalculatorOptions] {
-      filled: false
-      color { r: 125 g: 0 b: 122 }
-      thickness: 4.0
-    }
-  }
-}
-
-# Outputs each element of multi_palm_landmarks at a fake timestamp for the rest
-# of the graph to process. At the end of the loop, outputs the BATCH_END
-# timestamp for downstream calculators to inform them that all elements in the
-# vector have been processed.
-node {
-  calculator: "BeginLoopNormalizedLandmarkListVectorCalculator"
-  input_stream: "ITERABLE:multi_hand_landmarks"
-  output_stream: "ITEM:single_hand_landmarks"
-  output_stream: "BATCH_END:landmark_timestamp"
-}
-
-# Converts landmarks to drawing primitives for annotation overlay.
-node {
-  calculator: "LandmarksToRenderDataCalculator"
-  input_stream: "NORM_LANDMARKS:single_hand_landmarks"
-  output_stream: "RENDER_DATA:single_hand_landmark_render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.LandmarksToRenderDataCalculatorOptions] {
-      landmark_connections: 0
-      landmark_connections: 1
-      landmark_connections: 1
-      landmark_connections: 2
-      landmark_connections: 2
-      landmark_connections: 3
-      landmark_connections: 3
-      landmark_connections: 4
-      landmark_connections: 0
-      landmark_connections: 5
-      landmark_connections: 5
-      landmark_connections: 6
-      landmark_connections: 6
-      landmark_connections: 7
-      landmark_connections: 7
-      landmark_connections: 8
-      landmark_connections: 5
-      landmark_connections: 9
-      landmark_connections: 9
-      landmark_connections: 10
-      landmark_connections: 10
-      landmark_connections: 11
-      landmark_connections: 11
-      landmark_connections: 12
-      landmark_connections: 9
-      landmark_connections: 13
-      landmark_connections: 13
-      landmark_connections: 14
-      landmark_connections: 14
-      landmark_connections: 15
-      landmark_connections: 15
-      landmark_connections: 16
-      landmark_connections: 13
-      landmark_connections: 17
-      landmark_connections: 0
-      landmark_connections: 17
-      landmark_connections: 17
-      landmark_connections: 18
-      landmark_connections: 18
-      landmark_connections: 19
-      landmark_connections: 19
-      landmark_connections: 20
-      landmark_color { r: 255 g: 0 b: 0 }
-      connection_color { r: 0 g: 255 b: 0 }
-      thickness: 4.0
-    }
-  }
-}
-
-# Collects a RenderData object for each hand into a vector. Upon receiving the
-# BATCH_END timestamp, outputs the vector of RenderData at the BATCH_END
-# timestamp.
-node {
-  calculator: "EndLoopRenderDataCalculator"
-  input_stream: "ITEM:single_hand_landmark_render_data"
-  input_stream: "BATCH_END:landmark_timestamp"
-  output_stream: "ITERABLE:multi_hand_landmarks_render_data"
-}
-
-# Draws annotations and overlays them on top of the input images. Consumes
-# a vector of RenderData objects and draws each of them on the input frame.
-node {
-  calculator: "AnnotationOverlayCalculator"
-  input_stream: "IMAGE_GPU:input_image"
-  input_stream: "detection_render_data"
-  input_stream: "multi_hand_rects_render_data"
-  input_stream: "multi_palm_rects_render_data"
-  input_stream: "VECTOR:0:multi_hand_landmarks_render_data"
-  output_stream: "IMAGE_GPU:output_image"
-}
-```
+Content moved to [MediaPipe Hand](https://google.github.io/mediapipe/solutions/hand)
diff --git a/mediapipe/docs/object_detection_coral_devboard.md b/mediapipe/docs/object_detection_coral_devboard.md
deleted file mode 100644
index 4275860ca..000000000
--- a/mediapipe/docs/object_detection_coral_devboard.md
+++ /dev/null
@@ -1,23 +0,0 @@
-## Object Detection on Coral with Webcam
-
-MediaPipe is able to run cross platform across device types like desktop, mobile
-and edge devices. Here is an example of running MediaPipe
-[object detection pipeline](./object_detection_desktop.md) on edge device like
-the [Coral Dev Board](https://coral.ai/products/dev-board).
-
-This MediaPipe Coral object
-detection pipeline is running [coral specific quantized version](https://github.com/google/mediapipe/blob/master/mediapipe/examples/coral/models/object-detector-quantized_edgetpu.tflite)
-of the [MediaPipe object detection TFLite model](https://github.com/google/mediapipe/blob/master/mediapipe/models/object_detection_front.tflite)
-accelerated on Edge TPU.
-
-### Cross compilation of MediaPipe Coral binaries in Docker
-
-We recommend building the MediaPipe binaries not on the edge device due to
-limited compute resulting in long build times. Instead, we will build MediaPipe
-binaries using Docker containers on a more powerful host machine.
-
-For step by
-step details of cross compiling and running MediaPipe binaries on the Coral Dev
-Board, please refer to [README.md in MediaPipe Coral example folder](https://github.com/google/mediapipe/tree/master/mediapipe/examples/coral).
-
-![Object Detection running on Coral](images/object_detection_demo_coral.jpg)
diff --git a/mediapipe/docs/object_detection_desktop.md b/mediapipe/docs/object_detection_desktop.md
index 0dbbb9a3b..cdf2e0b8d 100644
--- a/mediapipe/docs/object_detection_desktop.md
+++ b/mediapipe/docs/object_detection_desktop.md
@@ -1,461 +1,2 @@
-## Object Detection on Desktop
-
-This is an example of using MediaPipe to run object detection models (TensorFlow
-and TensorFlow Lite) and render bounding boxes on the detected objects. To know
-more about the object detection models and TensorFlow-to-TFLite model
-conversion, please refer to the model [`README file`]. Moreover, if you are
-interested in running the same TensorfFlow Lite model on Android, please see the
-[Object Detection on GPU on Android](object_detection_android_gpu.md) and
-[Object Detection on CPU on Android](object_detection_android_cpu.md) examples.
-
-We show the object detection demo with both TensorFlow model and TensorFlow Lite model:
-
--   [TensorFlow Object Detection Demo](#tensorflow-object-detection-demo)
--   [TensorFlow Lite Object Detection Demo](#tensorflow-lite-object-detection-demo)
--   [TensorFlow Lite Object Detection Demo with Webcam (CPU)](#tensorflow-lite-object-detection-demo-with-webcam-cpu)
-
-Note: If MediaPipe depends on OpenCV 2, please see the [known issues with OpenCV 2](#known-issues-with-opencv-2) section.
-
-### TensorFlow Object Detection Demo
-
-Note: If you would like to run TensorFlow inference on GPU on Linux, please
-follow
-[TensorFlow CUDA Support and Setup on Linux Desktop](gpu.md#tensorflow-cuda-support-and-setup-on-linux-desktop)
-instead.
-
-To build and run the TensorFlow inference example on CPU on desktop, run:
-
-```bash
-# Note that this command also builds TensorFlow targets from scratch, it may
-# take a long time (e.g., up to 30 mins) to build for the first time.
-$ bazel build -c opt \
-    --define MEDIAPIPE_DISABLE_GPU=1 \
-    --define no_aws_support=true \
-    --linkopt=-s \
-    mediapipe/examples/desktop/object_detection:object_detection_tensorflow
-
-# It should print:
-# Target //mediapipe/examples/desktop/object_detection:object_detection_tensorflow up-to-date:
-#   bazel-bin/mediapipe/examples/desktop/object_detection/object_detection_tensorflow
-# INFO: Elapsed time: 172.262s, Critical Path: 125.68s
-# INFO: 2675 processes: 2673 linux-sandbox, 2 local.
-# INFO: Build completed successfully, 2807 total actions
-
-# Replace <input video path> and <output video path>.
-# You can find a test video in mediapipe/examples/desktop/object_detection.
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/object_detection/object_detection_tensorflow \
-  --calculator_graph_config_file=mediapipe/graphs/object_detection/object_detection_desktop_tensorflow_graph.pbtxt \
-  --input_side_packets=input_video_path=<input video path>,output_video_path=<output video path>
-```
-
-#### Graph
-
-![graph visualization](images/object_detection_desktop_tensorflow.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into
-[MediaPipe Visualizer](https://viz.mediapipe.dev).
-
-```bash
-# MediaPipe graph that performs object detection on desktop with TensorFlow
-# on CPU.
-# Used in the example in
-# mediapipe/examples/desktop/object_detection:object_detection_tensorflow.
-
-# Decodes an input video file into images and a video header.
-node {
-  calculator: "OpenCvVideoDecoderCalculator"
-  input_side_packet: "INPUT_FILE_PATH:input_video_path"
-  output_stream: "VIDEO:input_video"
-  output_stream: "VIDEO_PRESTREAM:input_video_header"
-}
-
-# Converts the input image into an image tensor as a tensorflow::Tensor.
-node {
-  calculator: "ImageFrameToTensorCalculator"
-  input_stream: "input_video"
-  output_stream: "image_tensor"
-}
-
-# Generates a single side packet containing a TensorFlow session from a saved
-# model. The directory path that contains the saved model is specified in the
-# saved_model_path option, and the name of the saved model file has to be
-# "saved_model.pb".
-node {
-  calculator: "TensorFlowSessionFromSavedModelCalculator"
-  output_side_packet: "SESSION:object_detection_session"
-  node_options: {
-    [type.googleapis.com/mediapipe.TensorFlowSessionFromSavedModelCalculatorOptions]: {
-      saved_model_path: "mediapipe/models/object_detection_saved_model"
-    }
-  }
-}
-
-# Runs a TensorFlow session (specified as an input side packet) that takes an
-# image tensor and outputs multiple tensors that describe the objects detected
-# in the image. The batch_size option is set to 1 to disable batching entirely.
-# Note that the particular TensorFlow model used in this session handles image
-# scaling internally before the object-detection inference, and therefore no
-# additional calculator for image transformation is needed in this MediaPipe
-# graph.
-node: {
-  calculator: "TensorFlowInferenceCalculator"
-  input_side_packet: "SESSION:object_detection_session"
-  input_stream: "INPUTS:image_tensor"
-  output_stream: "DETECTION_BOXES:detection_boxes_tensor"
-  output_stream: "DETECTION_CLASSES:detection_classes_tensor"
-  output_stream: "DETECTION_SCORES:detection_scores_tensor"
-  output_stream: "NUM_DETECTIONS:num_detections_tensor"
-  node_options: {
-    [type.googleapis.com/mediapipe.TensorFlowInferenceCalculatorOptions]: {
-      batch_size: 1
-    }
-  }
-}
-
-# Decodes the detection tensors from the TensorFlow model into a vector of
-# detections. Each detection describes a detected object.
-node {
-  calculator: "ObjectDetectionTensorsToDetectionsCalculator"
-  input_stream: "BOXES:detection_boxes_tensor"
-  input_stream: "SCORES:detection_scores_tensor"
-  input_stream: "CLASSES:detection_classes_tensor"
-  input_stream: "NUM_DETECTIONS:num_detections_tensor"
-  output_stream: "DETECTIONS:detections"
-}
-
-# Performs non-max suppression to remove excessive detections.
-node {
-  calculator: "NonMaxSuppressionCalculator"
-  input_stream: "detections"
-  output_stream: "filtered_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.NonMaxSuppressionCalculatorOptions] {
-      min_suppression_threshold: 0.4
-      min_score_threshold: 0.6
-      max_num_detections: 10
-      overlap_type: INTERSECTION_OVER_UNION
-    }
-  }
-}
-
-# Maps detection label IDs to the corresponding label text. The label map is
-# provided in the label_map_path option.
-node {
-  calculator: "DetectionLabelIdToTextCalculator"
-  input_stream: "filtered_detections"
-  output_stream: "output_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionLabelIdToTextCalculatorOptions] {
-      label_map_path: "mediapipe/models/ssdlite_object_detection_labelmap.txt"
-    }
-  }
-}
-
-# Converts the detections to drawing primitives for annotation overlay.
-node {
-  calculator: "DetectionsToRenderDataCalculator"
-  input_stream: "DETECTION_VECTOR:output_detections"
-  output_stream: "RENDER_DATA:render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRenderDataCalculatorOptions] {
-      thickness: 4.0
-      color { r: 255 g: 0 b: 0 }
-    }
-  }
-}
-
-# Draws annotations and overlays them on top of the original image coming into
-# the graph.
-node {
-  calculator: "AnnotationOverlayCalculator"
-  input_stream: "IMAGE:input_video"
-  input_stream: "render_data"
-  output_stream: "IMAGE:output_video"
-}
-
-# Encodes the annotated images into a video file, adopting properties specified
-# in the input video header, e.g., video framerate.
-node {
-  calculator: "OpenCvVideoEncoderCalculator"
-  input_stream: "VIDEO:output_video"
-  input_stream: "VIDEO_PRESTREAM:input_video_header"
-  input_side_packet: "OUTPUT_FILE_PATH:output_video_path"
-  node_options: {
-    [type.googleapis.com/mediapipe.OpenCvVideoEncoderCalculatorOptions]: {
-      codec: "avc1"
-      video_format: "mp4"
-    }
-  }
-}
-```
-
-### TensorFlow Lite Object Detection Demo
-
-To build and run the TensorFlow Lite example on desktop, run:
-
-```bash
-$ bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 \
-    mediapipe/examples/desktop/object_detection:object_detection_tflite
-
-# It should print:
-# Target //mediapipe/examples/desktop/object_detection:object_detection_tflite up-to-date:
-#   bazel-bin/mediapipe/examples/desktop/object_detection/object_detection_tflite
-# INFO: Elapsed time: 36.417s, Critical Path: 23.22s
-# INFO: 711 processes: 710 linux-sandbox, 1 local.
-# INFO: Build completed successfully, 734 total actions
-
-# Replace <input video path> and <output video path>.
-# You can find a test video in mediapipe/examples/desktop/object_detection.
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/object_detection/object_detection_tflite \
-    --calculator_graph_config_file=mediapipe/graphs/object_detection/object_detection_desktop_tflite_graph.pbtxt \
-    --input_side_packets=input_video_path=<input video path>,output_video_path=<output video path>
-```
-
-### TensorFlow Lite Object Detection Demo with Webcam (CPU)
-
-To build and run the TensorFlow Lite example on desktop (CPU) with Webcam, run:
-
-```bash
-# Video from webcam running on desktop CPU
-$ bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 \
-    mediapipe/examples/desktop/object_detection:object_detection_cpu
-# It should print:
-#Target //mediapipe/examples/desktop/object_detection:object_detection_cpu up-to-date:
-#  bazel-bin/mediapipe/examples/desktop/object_detection/object_detection_cpu
-#INFO: Build completed successfully, 12154 total actions
-
-# This will open up your webcam as long as it is connected and on
-# Any errors is likely due to your webcam being not accessible
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/object_detection/object_detection_cpu \
-    --calculator_graph_config_file=mediapipe/graphs/object_detection/object_detection_desktop_live.pbtxt
-```
-
-#### Graph
-
-![graph visualization](images/object_detection_desktop_tflite.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into
-[MediaPipe Visualizer](https://viz.mediapipe.dev).
-
-```bash
-# MediaPipe graph that performs object detection on desktop with TensorFlow Lite
-# on CPU.
-# Used in the example in
-# mediapipe/examples/desktop/object_detection:object_detection_tflite.
-
-# max_queue_size limits the number of packets enqueued on any input stream
-# by throttling inputs to the graph. This makes the graph only process one
-# frame per time.
-max_queue_size: 1
-
-# Decodes an input video file into images and a video header.
-node {
-  calculator: "OpenCvVideoDecoderCalculator"
-  input_side_packet: "INPUT_FILE_PATH:input_video_path"
-  output_stream: "VIDEO:input_video"
-  output_stream: "VIDEO_PRESTREAM:input_video_header"
-}
-
-# Transforms the input image on CPU to a 320x320 image. To scale the image, by
-# default it uses the STRETCH scale mode that maps the entire input image to the
-# entire transformed image. As a result, image aspect ratio may be changed and
-# objects in the image may be deformed (stretched or squeezed), but the object
-# detection model used in this graph is agnostic to that deformation.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE:input_video"
-  output_stream: "IMAGE:transformed_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 320
-      output_height: 320
-    }
-  }
-}
-
-# Converts the transformed input image on CPU into an image tensor as a
-# TfLiteTensor. The zero_center option is set to true to normalize the
-# pixel values to [-1.f, 1.f] as opposed to [0.f, 1.f].
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE:transformed_input_video"
-  output_stream: "TENSORS:image_tensor"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteConverterCalculatorOptions] {
-      zero_center: true
-    }
-  }
-}
-
-# Runs a TensorFlow Lite model on CPU that takes an image tensor and outputs a
-# vector of tensors representing, for instance, detection boxes/keypoints and
-# scores.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS:image_tensor"
-  output_stream: "TENSORS:detection_tensors"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "mediapipe/models/ssdlite_object_detection.tflite"
-    }
-  }
-}
-
-# Generates a single side packet containing a vector of SSD anchors based on
-# the specification in the options.
-node {
-  calculator: "SsdAnchorsCalculator"
-  output_side_packet: "anchors"
-  node_options: {
-    [type.googleapis.com/mediapipe.SsdAnchorsCalculatorOptions] {
-      num_layers: 6
-      min_scale: 0.2
-      max_scale: 0.95
-      input_size_height: 320
-      input_size_width: 320
-      anchor_offset_x: 0.5
-      anchor_offset_y: 0.5
-      strides: 16
-      strides: 32
-      strides: 64
-      strides: 128
-      strides: 256
-      strides: 512
-      aspect_ratios: 1.0
-      aspect_ratios: 2.0
-      aspect_ratios: 0.5
-      aspect_ratios: 3.0
-      aspect_ratios: 0.3333
-      reduce_boxes_in_lowest_layer: true
-    }
-  }
-}
-
-# Decodes the detection tensors generated by the TensorFlow Lite model, based on
-# the SSD anchors and the specification in the options, into a vector of
-# detections. Each detection describes a detected object.
-node {
-  calculator: "TfLiteTensorsToDetectionsCalculator"
-  input_stream: "TENSORS:detection_tensors"
-  input_side_packet: "ANCHORS:anchors"
-  output_stream: "DETECTIONS:detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToDetectionsCalculatorOptions] {
-      num_classes: 91
-      num_boxes: 2034
-      num_coords: 4
-      ignore_classes: 0
-      apply_exponential_on_box_size: true
-
-      x_scale: 10.0
-      y_scale: 10.0
-      h_scale: 5.0
-      w_scale: 5.0
-    }
-  }
-}
-
-# Performs non-max suppression to remove excessive detections.
-node {
-  calculator: "NonMaxSuppressionCalculator"
-  input_stream: "detections"
-  output_stream: "filtered_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.NonMaxSuppressionCalculatorOptions] {
-      min_suppression_threshold: 0.4
-      min_score_threshold: 0.6
-      max_num_detections: 5
-      overlap_type: INTERSECTION_OVER_UNION
-    }
-  }
-}
-
-# Maps detection label IDs to the corresponding label text. The label map is
-# provided in the label_map_path option.
-node {
-  calculator: "DetectionLabelIdToTextCalculator"
-  input_stream: "filtered_detections"
-  output_stream: "output_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionLabelIdToTextCalculatorOptions] {
-      label_map_path: "mediapipe/models/ssdlite_object_detection_labelmap.txt"
-    }
-  }
-}
-
-# Converts the detections to drawing primitives for annotation overlay.
-node {
-  calculator: "DetectionsToRenderDataCalculator"
-  input_stream: "DETECTION_VECTOR:output_detections"
-  output_stream: "RENDER_DATA:render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRenderDataCalculatorOptions] {
-      thickness: 4.0
-      color { r: 255 g: 0 b: 0 }
-    }
-  }
-}
-
-# Draws annotations and overlays them on top of the original image coming into
-# the graph.
-node {
-  calculator: "AnnotationOverlayCalculator"
-  input_stream: "IMAGE:input_video"
-  input_stream: "render_data"
-  output_stream: "IMAGE:output_video"
-}
-
-# Encodes the annotated images into a video file, adopting properties specified
-# in the input video header, e.g., video framerate.
-node {
-  calculator: "OpenCvVideoEncoderCalculator"
-  input_stream: "VIDEO:output_video"
-  input_stream: "VIDEO_PRESTREAM:input_video_header"
-  input_side_packet: "OUTPUT_FILE_PATH:output_video_path"
-  node_options: {
-    [type.googleapis.com/mediapipe.OpenCvVideoEncoderCalculatorOptions]: {
-      codec: "avc1"
-      video_format: "mp4"
-    }
-  }
-}
-```
-
-### Known issues with OpenCV 2
-
-Note that OpenCV 2 may not be able to render an mp4 file and returns the
-following error message:
-
-```
-[libx264 @ 0x7fe6eadf49a0] broken ffmpeg default settings detected
-[libx264 @ 0x7fe6eadf49a0] use an encoding preset (e.g. -vpre medium)
-[libx264 @ 0x7fe6eadf49a0] preset usage: -vpre <speed> -vpre <profile>
-[libx264 @ 0x7fe6eadf49a0] speed presets are listed in x264 --help
-[libx264 @ 0x7fe6eadf49a0] profile is optional; x264 defaults to high
-Could not open codec 'libx264': Unspecified errorE0612 19:40:09.067003  2089 simple_run_graph_main.cc:64] Fail to run the graph: CalculatorGraph::Run() failed in Run:
-Calculator::Process() for node "[OpenCvVideoEncoderCalculator, OpenCvVideoEncoderCalculator with node ID: 7 and input streams: <decorated_frames,video_prestream>]" failed: ; Fail to open file at ...
-```
-
-In that case, please change the OpenCvVideoEncoderCalculator option in either
-the [`TensorFlow graph`] or the [`TensorFlow Lite graph`] to the following and
-in the command line specify the output video to be a .mkv file.
-
-```bash
-node {
-  calculator: "OpenCvVideoEncoderCalculator"
-  input_stream: "VIDEO:output_video"
-  input_stream: "VIDEO_PRESTREAM:input_video_header"
-  input_side_packet: "OUTPUT_FILE_PATH:output_video_path"
-  node_options {
-    [type.googleapis.com/mediapipe.OpenCvVideoEncoderCalculatorOptions]: {
-      codec: "MPEG"
-     video_format: "mkv"
-  }
-}
-```
-
-[`README file`]:https://github.com/google/mediapipe/tree/master/mediapipe/models/object_detection_saved_model/README.md
-[`TensorFlow graph`]: https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_desktop_tensorflow_graph.pbtxt
-[`TensorFlow Lite graph`]: https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_desktop_tflite_graph.pbtxt
+Content moved to
+[MediaPipe Object Detection](https://google.github.io/mediapipe/solutions/object_detection)
diff --git a/mediapipe/docs/object_detection_mobile_cpu.md b/mediapipe/docs/object_detection_mobile_cpu.md
deleted file mode 100644
index c167315c2..000000000
--- a/mediapipe/docs/object_detection_mobile_cpu.md
+++ /dev/null
@@ -1,245 +0,0 @@
-# Object Detection (CPU)
-
-This doc focuses on the
-[example graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_mobile_cpu.pbtxt)
-that performs object detection with TensorFlow Lite on CPU.
-
-This is very similar to the
-[Object Detection on GPU on Android](object_detection_android_gpu.md) example
-except that at the beginning and the end of the graph it performs GPU-to-CPU and
-CPU-to-GPU image transfer respectively. As a result, the rest of graph, which
-shares the same configuration as the
-[GPU graph](images/mobile/object_detection_mobile_gpu.png), runs entirely on
-CPU.
-
-![object_detection_android_cpu_gif](images/mobile/object_detection_android_cpu.gif)
-
-## Android
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectioncpu)
-
-To build and install the app:
-
-```bash
-bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectioncpu
-adb install bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectioncpu/objectdetectioncpu.apk
-```
-
-## iOS
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/handdetectiongpu).
-
-See the general [instructions](./building_examples.md#ios) for building iOS
-examples and generating an Xcode project. This will be the ObjectDetectionCpuApp
-target.
-
-To build on the command line:
-
-```bash
-bazel build -c opt --config=ios_arm64 mediapipe/examples/ios/objectdetectioncpu:ObjectDetectionCpuApp
-```
-
-## Graph
-
-![object_detection_mobile_cpu_graph](images/mobile/object_detection_mobile_cpu.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into [MediaPipe Visualizer](https://viz.mediapipe.dev/).
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_mobile_cpu.pbtxt)
-
-```bash
-# MediaPipe graph that performs object detection with TensorFlow Lite on CPU.
-# Used in the examples in
-# mediapipie/examples/android/src/java/com/mediapipe/apps/objectdetectioncpu and
-# mediapipie/examples/ios/objectdetectioncpu.
-
-# Images on GPU coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Transfers the input image from GPU to CPU memory for the purpose of
-# demonstrating a CPU-based pipeline. Note that the input image on GPU has the
-# origin defined at the bottom-left corner (OpenGL convention). As a result,
-# the transferred image on CPU also shares the same representation.
-node: {
-  calculator: "GpuBufferToImageFrameCalculator"
-  input_stream: "input_video"
-  output_stream: "input_video_cpu"
-}
-
-# Throttles the images flowing downstream for flow control. It passes through
-# the very first incoming image unaltered, and waits for
-# TfLiteTensorsToDetectionsCalculator downstream in the graph to finish
-# generating the corresponding detections before it passes through another
-# image. All images that come in while waiting are dropped, limiting the number
-# of in-flight images between this calculator and
-# TfLiteTensorsToDetectionsCalculator to 1. This prevents the nodes in between
-# from queuing up incoming images and data excessively, which leads to increased
-# latency and memory usage, unwanted in real-time mobile applications. It also
-# eliminates unnecessarily computation, e.g., a transformed image produced by
-# ImageTransformationCalculator may get dropped downstream if the subsequent
-# TfLiteConverterCalculator or TfLiteInferenceCalculator is still busy
-# processing previous inputs.
-node {
-  calculator: "FlowLimiterCalculator"
-  input_stream: "input_video_cpu"
-  input_stream: "FINISHED:detections"
-  input_stream_info: {
-    tag_index: "FINISHED"
-    back_edge: true
-  }
-  output_stream: "throttled_input_video_cpu"
-}
-
-# Transforms the input image on CPU to a 320x320 image. To scale the image, by
-# default it uses the STRETCH scale mode that maps the entire input image to the
-# entire transformed image. As a result, image aspect ratio may be changed and
-# objects in the image may be deformed (stretched or squeezed), but the object
-# detection model used in this graph is agnostic to that deformation.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE:throttled_input_video_cpu"
-  output_stream: "IMAGE:transformed_input_video_cpu"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 320
-      output_height: 320
-    }
-  }
-}
-
-# Converts the transformed input image on CPU into an image tensor stored as a
-# TfLiteTensor.
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE:transformed_input_video_cpu"
-  output_stream: "TENSORS:image_tensor"
-}
-
-# Runs a TensorFlow Lite model on CPU that takes an image tensor and outputs a
-# vector of tensors representing, for instance, detection boxes/keypoints and
-# scores.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS:image_tensor"
-  output_stream: "TENSORS:detection_tensors"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "ssdlite_object_detection.tflite"
-    }
-  }
-}
-
-# Generates a single side packet containing a vector of SSD anchors based on
-# the specification in the options.
-node {
-  calculator: "SsdAnchorsCalculator"
-  output_side_packet: "anchors"
-  node_options: {
-    [type.googleapis.com/mediapipe.SsdAnchorsCalculatorOptions] {
-      num_layers: 6
-      min_scale: 0.2
-      max_scale: 0.95
-      input_size_height: 320
-      input_size_width: 320
-      anchor_offset_x: 0.5
-      anchor_offset_y: 0.5
-      strides: 16
-      strides: 32
-      strides: 64
-      strides: 128
-      strides: 256
-      strides: 512
-      aspect_ratios: 1.0
-      aspect_ratios: 2.0
-      aspect_ratios: 0.5
-      aspect_ratios: 3.0
-      aspect_ratios: 0.3333
-      reduce_boxes_in_lowest_layer: true
-    }
-  }
-}
-
-# Decodes the detection tensors generated by the TensorFlow Lite model, based on
-# the SSD anchors and the specification in the options, into a vector of
-# detections. Each detection describes a detected object.
-node {
-  calculator: "TfLiteTensorsToDetectionsCalculator"
-  input_stream: "TENSORS:detection_tensors"
-  input_side_packet: "ANCHORS:anchors"
-  output_stream: "DETECTIONS:detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToDetectionsCalculatorOptions] {
-      num_classes: 91
-      num_boxes: 2034
-      num_coords: 4
-      ignore_classes: 0
-      sigmoid_score: true
-      apply_exponential_on_box_size: true
-      x_scale: 10.0
-      y_scale: 10.0
-      h_scale: 5.0
-      w_scale: 5.0
-      min_score_thresh: 0.6
-    }
-  }
-}
-
-# Performs non-max suppression to remove excessive detections.
-node {
-  calculator: "NonMaxSuppressionCalculator"
-  input_stream: "detections"
-  output_stream: "filtered_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.NonMaxSuppressionCalculatorOptions] {
-      min_suppression_threshold: 0.4
-      max_num_detections: 3
-      overlap_type: INTERSECTION_OVER_UNION
-      return_empty_detections: true
-    }
-  }
-}
-
-# Maps detection label IDs to the corresponding label text. The label map is
-# provided in the label_map_path option.
-node {
-  calculator: "DetectionLabelIdToTextCalculator"
-  input_stream: "filtered_detections"
-  output_stream: "output_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionLabelIdToTextCalculatorOptions] {
-      label_map_path: "ssdlite_object_detection_labelmap.txt"
-    }
-  }
-}
-
-# Converts the detections to drawing primitives for annotation overlay.
-node {
-  calculator: "DetectionsToRenderDataCalculator"
-  input_stream: "DETECTIONS:output_detections"
-  output_stream: "RENDER_DATA:render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRenderDataCalculatorOptions] {
-      thickness: 4.0
-      color { r: 255 g: 0 b: 0 }
-    }
-  }
-}
-
-# Draws annotations and overlays them on top of the input images.
-node {
-  calculator: "AnnotationOverlayCalculator"
-  input_stream: "IMAGE:throttled_input_video_cpu"
-  input_stream: "render_data"
-  output_stream: "IMAGE:output_video_cpu"
-}
-
-# Transfers the annotated image from CPU back to GPU memory, to be sent out of
-# the graph.
-node: {
-  calculator: "ImageFrameToGpuBufferCalculator"
-  input_stream: "output_video_cpu"
-  output_stream: "output_video"
-}
-```
diff --git a/mediapipe/docs/object_detection_mobile_gpu.md b/mediapipe/docs/object_detection_mobile_gpu.md
index 159ef6be7..cdf2e0b8d 100644
--- a/mediapipe/docs/object_detection_mobile_gpu.md
+++ b/mediapipe/docs/object_detection_mobile_gpu.md
@@ -1,219 +1,2 @@
-# Object Detection (GPU)
-
-This doc focuses on the
-[below example graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_mobile_gpu.pbtxt)
-that performs object detection with TensorFlow Lite on GPU.
-
-![object_detection_android_gpu_gif](images/mobile/object_detection_android_gpu.gif)
-
-## Android
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectiongpu)
-
-To build and install the app:
-
-```bash
-bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectiongpu
-adb install bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectiongpu/objectdetectiongpu.apk
-```
-
-## iOS
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/ios/objectdetectiongpu).
-
-See the general [instructions](./building_examples.md#ios) for building iOS
-examples and generating an Xcode project. This will be the ObjectDetectionGpuApp
-target.
-
-To build on the command line:
-
-```bash
-bazel build -c opt --config=ios_arm64 mediapipe/examples/ios/objectdetectiongpu:ObjectDetectionGpuApp
-```
-
-## Graph
-
-![object_detection_mobile_gpu_graph](images/mobile/object_detection_mobile_gpu.png)
-
-To visualize the graph as shown above, copy the text specification of the graph
-below and paste it into [MediaPipe Visualizer](https://viz.mediapipe.dev/).
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_mobile_gpu.pbtxt)
-
-```bash
-# MediaPipe graph that performs object detection with TensorFlow Lite on GPU.
-# Used in the examples in
-# mediapipie/examples/android/src/java/com/mediapipe/apps/objectdetectiongpu and
-# mediapipie/examples/ios/objectdetectiongpu.
-
-# Images on GPU coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Throttles the images flowing downstream for flow control. It passes through
-# the very first incoming image unaltered, and waits for
-# TfLiteTensorsToDetectionsCalculator downstream in the graph to finish
-# generating the corresponding detections before it passes through another
-# image. All images that come in while waiting are dropped, limiting the number
-# of in-flight images between this calculator and
-# TfLiteTensorsToDetectionsCalculator to 1. This prevents the nodes in between
-# from queuing up incoming images and data excessively, which leads to increased
-# latency and memory usage, unwanted in real-time mobile applications. It also
-# eliminates unnecessarily computation, e.g., a transformed image produced by
-# ImageTransformationCalculator may get dropped downstream if the subsequent
-# TfLiteConverterCalculator or TfLiteInferenceCalculator is still busy
-# processing previous inputs.
-node {
-  calculator: "FlowLimiterCalculator"
-  input_stream: "input_video"
-  input_stream: "FINISHED:detections"
-  input_stream_info: {
-    tag_index: "FINISHED"
-    back_edge: true
-  }
-  output_stream: "throttled_input_video"
-}
-
-# Transforms the input image on GPU to a 320x320 image. To scale the image, by
-# default it uses the STRETCH scale mode that maps the entire input image to the
-# entire transformed image. As a result, image aspect ratio may be changed and
-# objects in the image may be deformed (stretched or squeezed), but the object
-# detection model used in this graph is agnostic to that deformation.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE_GPU:throttled_input_video"
-  output_stream: "IMAGE_GPU:transformed_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 320
-      output_height: 320
-    }
-  }
-}
-
-# Converts the transformed input image on GPU into an image tensor stored as a
-# TfLiteTensor.
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE_GPU:transformed_input_video"
-  output_stream: "TENSORS_GPU:image_tensor"
-}
-
-# Runs a TensorFlow Lite model on GPU that takes an image tensor and outputs a
-# vector of tensors representing, for instance, detection boxes/keypoints and
-# scores.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS_GPU:image_tensor"
-  output_stream: "TENSORS:detection_tensors"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "ssdlite_object_detection.tflite"
-    }
-  }
-}
-
-# Generates a single side packet containing a vector of SSD anchors based on
-# the specification in the options.
-node {
-  calculator: "SsdAnchorsCalculator"
-  output_side_packet: "anchors"
-  node_options: {
-    [type.googleapis.com/mediapipe.SsdAnchorsCalculatorOptions] {
-      num_layers: 6
-      min_scale: 0.2
-      max_scale: 0.95
-      input_size_height: 320
-      input_size_width: 320
-      anchor_offset_x: 0.5
-      anchor_offset_y: 0.5
-      strides: 16
-      strides: 32
-      strides: 64
-      strides: 128
-      strides: 256
-      strides: 512
-      aspect_ratios: 1.0
-      aspect_ratios: 2.0
-      aspect_ratios: 0.5
-      aspect_ratios: 3.0
-      aspect_ratios: 0.3333
-      reduce_boxes_in_lowest_layer: true
-    }
-  }
-}
-
-# Decodes the detection tensors generated by the TensorFlow Lite model, based on
-# the SSD anchors and the specification in the options, into a vector of
-# detections. Each detection describes a detected object.
-node {
-  calculator: "TfLiteTensorsToDetectionsCalculator"
-  input_stream: "TENSORS:detection_tensors"
-  input_side_packet: "ANCHORS:anchors"
-  output_stream: "DETECTIONS:detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToDetectionsCalculatorOptions] {
-      num_classes: 91
-      num_boxes: 2034
-      num_coords: 4
-      ignore_classes: 0
-      sigmoid_score: true
-      apply_exponential_on_box_size: true
-      x_scale: 10.0
-      y_scale: 10.0
-      h_scale: 5.0
-      w_scale: 5.0
-      min_score_thresh: 0.6
-    }
-  }
-}
-
-# Performs non-max suppression to remove excessive detections.
-node {
-  calculator: "NonMaxSuppressionCalculator"
-  input_stream: "detections"
-  output_stream: "filtered_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.NonMaxSuppressionCalculatorOptions] {
-      min_suppression_threshold: 0.4
-      max_num_detections: 3
-      overlap_type: INTERSECTION_OVER_UNION
-      return_empty_detections: true
-    }
-  }
-}
-
-# Maps detection label IDs to the corresponding label text. The label map is
-# provided in the label_map_path option.
-node {
-  calculator: "DetectionLabelIdToTextCalculator"
-  input_stream: "filtered_detections"
-  output_stream: "output_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionLabelIdToTextCalculatorOptions] {
-      label_map_path: "ssdlite_object_detection_labelmap.txt"
-    }
-  }
-}
-
-# Converts the detections to drawing primitives for annotation overlay.
-node {
-  calculator: "DetectionsToRenderDataCalculator"
-  input_stream: "DETECTIONS:output_detections"
-  output_stream: "RENDER_DATA:render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRenderDataCalculatorOptions] {
-      thickness: 4.0
-      color { r: 255 g: 0 b: 0 }
-    }
-  }
-}
-
-# Draws annotations and overlays them on top of the input images.
-node {
-  calculator: "AnnotationOverlayCalculator"
-  input_stream: "IMAGE_GPU:throttled_input_video"
-  input_stream: "render_data"
-  output_stream: "IMAGE_GPU:output_video"
-}
-```
+Content moved to
+[MediaPipe Object Detection](https://google.github.io/mediapipe/solutions/object_detection)
diff --git a/mediapipe/docs/object_tracking_mobile_gpu.md b/mediapipe/docs/object_tracking_mobile_gpu.md
index aaac36386..6dc594d0f 100644
--- a/mediapipe/docs/object_tracking_mobile_gpu.md
+++ b/mediapipe/docs/object_tracking_mobile_gpu.md
@@ -1,492 +1,2 @@
-# Object Detection and Tracking
-
-This doc focuses on the
-[below example graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/object_detection_tracking_mobile_gpu.pbtxt)
-that performs object detection and tracking.
-Note that object detection is using TensorFlow Lite on GPU while tracking is using CPU.
-
-For overall context on object detection and tracking, please read this
-[Google Developers Blog](https://mediapipe.page.link/objecttrackingblog).
-
-![object_tracking_android_gpu_gif](images/mobile/object_tracking_android_gpu.gif)
-
-## Android
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objecttrackinggpu)
-
-To build and install the app:
-
-```bash
-bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/objecttrackinggpu
-```
-
-Once the app is built, install it on Android device with:
-
-```bash
-adb install bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objecttrackinggpu/objecttrackinggpu.apk
-```
-
-## Graph
-The object detection and tracking [main graph](#main-graph) internally utilizes a
-[object detection subgraph](#object-detection-subgraph), a
-[object tracking subgraph](#object-tracking-subgraph) and a
-[renderer subgraph](#renderer-subgraph).
-
-
-The subgraphs show up in the main graph visualization as nodes colored in
-purple, and the subgraph itself can also be visualized just like a regular
-graph. For more information on how to visualize a graph that includes subgraphs,
-see the Visualizing Subgraphs section in the
-[visualizer documentation](./visualizer.md).
-
-### Main Graph
-
-
-![object_detection_mobile_gpu_graph](images/mobile/object_tracking_mobile_gpu.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection/object_detection_mobile_gpu.pbtxt)
-
-```bash
-# MediaPipe graph that performs object detection and tracking.
-# Used in the examples in
-# mediapipie/examples/android/src/java/com/mediapipe/apps/objecttrackinggpu
-
-# Images on GPU coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Resamples the images by specific frame rate. This calculator is used to
-# control the frequecy of subsequent calculators/subgraphs, e.g. less power
-# consumption for expensive process.
-node {
-  calculator: "PacketResamplerCalculator"
-  input_stream: "DATA:input_video"
-  output_stream: "DATA:throttled_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.PacketResamplerCalculatorOptions] {
-      frame_rate: 0.5
-    }
-  }
-}
-
-# Subgraph that detections objects (see object_detection_gpu.pbtxt).
-node {
-  calculator: "ObjectDetectionSubgraph"
-  input_stream: "IMAGE:throttled_input_video"
-  output_stream: "DETECTIONS:output_detections"
-}
-
-# Subgraph that tracks objects (see object_tracking.pbtxt).
-node {
-  calculator: "ObjectTrackingSubgraph"
-  input_stream: "VIDEO:input_video"
-  input_stream: "DETECTIONS:output_detections"
-  output_stream: "DETECTIONS:tracked_detections"
-}
-
-# Subgraph that renders annotations and overlays them on top of the input
-# images (see renderer_gpu.pbtxt).
-node {
-  calculator: "RendererSubgraph"
-  input_stream: "IMAGE:input_video"
-  input_stream: "DETECTIONS:tracked_detections"
-  output_stream: "IMAGE:output_video"
-}
-```
-
-### Object Detection Subgraph
-
-![object_detection_gpu_subgraph](images/mobile/object_detection_gpu_subgraph.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/subgraphs/object_detection_gpu.pbtxt)
-
-```bash
-# MediaPipe object detection subgraph.
-
-type: "ObjectDetectionSubgraph"
-
-input_stream: "IMAGE:input_video"
-output_stream: "DETECTIONS:output_detections"
-
-# Transforms the input image on GPU to a 320x320 image. To scale the image, by
-# default it uses the STRETCH scale mode that maps the entire input image to the
-# entire transformed image. As a result, image aspect ratio may be changed and
-# objects in the image may be deformed (stretched or squeezed), but the object
-# detection model used in this graph is agnostic to that deformation.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE_GPU:input_video"
-  output_stream: "IMAGE_GPU:transformed_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 320
-      output_height: 320
-    }
-  }
-}
-
-# Converts the transformed input image on GPU into an image tensor stored as a
-# TfLiteTensor.
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE_GPU:transformed_input_video"
-  output_stream: "TENSORS_GPU:image_tensor"
-}
-
-# Runs a TensorFlow Lite model on GPU that takes an image tensor and outputs a
-# vector of tensors representing, for instance, detection boxes/keypoints and
-# scores.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS_GPU:image_tensor"
-  output_stream: "TENSORS_GPU:detection_tensors"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "mediapipe/models/ssdlite_object_detection.tflite"
-    }
-  }
-}
-
-# Generates a single side packet containing a vector of SSD anchors based on
-# the specification in the options.
-node {
-  calculator: "SsdAnchorsCalculator"
-  output_side_packet: "anchors"
-  node_options: {
-    [type.googleapis.com/mediapipe.SsdAnchorsCalculatorOptions] {
-      num_layers: 6
-      min_scale: 0.2
-      max_scale: 0.95
-      input_size_height: 320
-      input_size_width: 320
-      anchor_offset_x: 0.5
-      anchor_offset_y: 0.5
-      strides: 16
-      strides: 32
-      strides: 64
-      strides: 128
-      strides: 256
-      strides: 512
-      aspect_ratios: 1.0
-      aspect_ratios: 2.0
-      aspect_ratios: 0.5
-      aspect_ratios: 3.0
-      aspect_ratios: 0.3333
-      reduce_boxes_in_lowest_layer: true
-    }
-  }
-}
-
-# Decodes the detection tensors generated by the TensorFlow Lite model, based on
-# the SSD anchors and the specification in the options, into a vector of
-# detections. Each detection describes a detected object.
-node {
-  calculator: "TfLiteTensorsToDetectionsCalculator"
-  input_stream: "TENSORS_GPU:detection_tensors"
-  input_side_packet: "ANCHORS:anchors"
-  output_stream: "DETECTIONS:detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToDetectionsCalculatorOptions] {
-      num_classes: 91
-      num_boxes: 2034
-      num_coords: 4
-      ignore_classes: 0
-      sigmoid_score: true
-      apply_exponential_on_box_size: true
-      x_scale: 10.0
-      y_scale: 10.0
-      h_scale: 5.0
-      w_scale: 5.0
-      min_score_thresh: 0.6
-    }
-  }
-}
-
-# Performs non-max suppression to remove excessive detections.
-node {
-  calculator: "NonMaxSuppressionCalculator"
-  input_stream: "detections"
-  output_stream: "filtered_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.NonMaxSuppressionCalculatorOptions] {
-      min_suppression_threshold: 0.4
-      max_num_detections: 3
-      overlap_type: INTERSECTION_OVER_UNION
-      return_empty_detections: true
-    }
-  }
-}
-
-# Maps detection label IDs to the corresponding label text. The label map is
-# provided in the label_map_path option.
-node {
-  calculator: "DetectionLabelIdToTextCalculator"
-  input_stream: "filtered_detections"
-  output_stream: "output_detections"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionLabelIdToTextCalculatorOptions] {
-      label_map_path: "mediapipe/models/ssdlite_object_detection_labelmap.txt"
-    }
-  }
-}
-```
-
-### Object Tracking Subgraph
-
-Object tracking subgraph uses a box tracking subgraph which is a generic
-tracking library that can be used for other use cases.
-
-![object_tracking_subgraph](images/mobile/object_tracking_subgraph.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/subgraphs/object_tracking_gpu.pbtxt)
-
-```bash
-# MediaPipe object tracking subgraph.
-
-type: "ObjectTrackingSubgraph"
-
-input_stream: "VIDEO:input_video"
-input_stream: "DETECTIONS:new_detections"
-output_stream: "DETECTIONS:tracked_detections"
-
-# Assigns an unique id for each new detection.
-node {
-  calculator: "DetectionUniqueIdCalculator"
-  input_stream: "DETECTIONS:new_detections"
-  output_stream: "DETECTIONS:detections_with_id"
-}
-
-# Converts detections to TimedBox protos which are used as initial location
-# for tracking.
-node {
-  calculator: "DetectionsToTimedBoxListCalculator"
-  input_stream: "DETECTIONS:detections_with_id"
-  output_stream: "BOXES:start_pos"
-}
-
-# Subgraph that tracks boxes (see box_tracking.pbtxt).
-node {
-  calculator: "BoxTrackingSubgraph"
-  input_stream: "VIDEO:input_video"
-  input_stream: "BOXES:start_pos"
-  input_stream: "CANCEL_ID:cancel_object_id"
-  output_stream: "BOXES:boxes"
-}
-
-# Managers new detected objects and objects that are being tracked.
-# It associates the duplicated detections and updates the locations of
-# detections from tracking.
-node: {
-  calculator: "TrackedDetectionManagerCalculator"
-  input_stream: "DETECTIONS:detections_with_id"
-  input_stream: "TRACKING_BOXES:boxes"
-  output_stream: "DETECTIONS:tracked_detections"
-  output_stream: "CANCEL_OBJECT_ID:cancel_object_id"
-
-  input_stream_handler {
-    input_stream_handler: "SyncSetInputStreamHandler"
-    options {
-      [mediapipe.SyncSetInputStreamHandlerOptions.ext] {
-        sync_set {
-          tag_index: "TRACKING_BOXES"
-        }
-        sync_set {
-          tag_index: "DETECTIONS"
-        }
-      }
-    }
-  }
-}
-
-```
-
-### Box Tracking Subgraph
-
-![box_tracking_subgraph](images/mobile/box_tracking_subgraph.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/subgraphs/box_tracking_gpu.pbtxt)
-
-```bash
-# MediaPipe box tracking subgraph.
-
-type: "BoxTrackingSubgraph"
-
-input_stream: "VIDEO:input_video"
-input_stream: "BOXES:start_pos"
-input_stream: "CANCEL_ID:cancel_object_id"
-output_stream: "BOXES:boxes"
-
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE_GPU:input_video"
-  output_stream: "IMAGE_GPU:downscaled_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 240
-      output_height: 320
-    }
-  }
-}
-
-# Converts GPU buffer to ImageFrame for processing tracking.
-node: {
-  calculator: "GpuBufferToImageFrameCalculator"
-  input_stream: "downscaled_input_video"
-  output_stream: "downscaled_input_video_cpu"
-}
-
-# Performs motion analysis on an incoming video stream.
-node: {
-  calculator: "MotionAnalysisCalculator"
-  input_stream: "VIDEO:downscaled_input_video_cpu"
-  output_stream: "CAMERA:camera_motion"
-  output_stream: "FLOW:region_flow"
-
-  node_options: {
-    [type.googleapis.com/mediapipe.MotionAnalysisCalculatorOptions]: {
-      analysis_options {
-        analysis_policy: ANALYSIS_POLICY_CAMERA_MOBILE
-        flow_options {
-          fast_estimation_min_block_size: 100
-          top_inlier_sets: 1
-          frac_inlier_error_threshold: 3e-3
-          downsample_mode: DOWNSAMPLE_TO_INPUT_SIZE
-          verification_distance: 5.0
-          verify_long_feature_acceleration: true
-          verify_long_feature_trigger_ratio: 0.1
-          tracking_options {
-            max_features: 500
-            adaptive_extraction_levels: 2
-            min_eig_val_settings {
-              adaptive_lowest_quality_level: 2e-4
-            }
-            klt_tracker_implementation: KLT_OPENCV
-          }
-        }
-      }
-    }
-  }
-}
-
-# Reads optical flow fields defined in
-# mediapipe/framework/formats/motion/optical_flow_field.h,
-# returns a VideoFrame with 2 channels (v_x and v_y), each channel is quantized
-# to 0-255.
-node: {
-  calculator: "FlowPackagerCalculator"
-  input_stream: "FLOW:region_flow"
-  input_stream: "CAMERA:camera_motion"
-  output_stream: "TRACKING:tracking_data"
-
-  node_options: {
-    [type.googleapis.com/mediapipe.FlowPackagerCalculatorOptions]: {
-      flow_packager_options: {
-        binary_tracking_data_support: false
-      }
-    }
-  }
-}
-
-# Tracks box positions over time.
-node: {
-  calculator: "BoxTrackerCalculator"
-  input_stream: "TRACKING:tracking_data"
-  input_stream: "TRACK_TIME:input_video"
-  input_stream: "START_POS:start_pos"
-  input_stream: "CANCEL_OBJECT_ID:cancel_object_id"
-  input_stream_info: {
-    tag_index: "CANCEL_OBJECT_ID"
-    back_edge: true
-  }
-  output_stream: "BOXES:boxes"
-
-  input_stream_handler {
-    input_stream_handler: "SyncSetInputStreamHandler"
-    options {
-      [mediapipe.SyncSetInputStreamHandlerOptions.ext] {
-        sync_set {
-          tag_index: "TRACKING"
-          tag_index: "TRACK_TIME"
-        }
-        sync_set {
-          tag_index: "START_POS"
-        }
-        sync_set {
-          tag_index: "CANCEL_OBJECT_ID"
-        }
-      }
-    }
-  }
-
-  node_options: {
-    [type.googleapis.com/mediapipe.BoxTrackerCalculatorOptions]: {
-      tracker_options: {
-        track_step_options {
-          track_object_and_camera: true
-          tracking_degrees: TRACKING_DEGREE_OBJECT_SCALE
-          inlier_spring_force: 0.0
-          static_motion_temporal_ratio: 3e-2
-        }
-      }
-      visualize_tracking_data: false
-      streaming_track_data_cache_size: 100
-    }
-  }
-}
-```
-
-### Renderer Subgraph
-
-![object_tracking_renderer_gpu_subgraph.pbtxt](images/mobile/object_tracking_renderer_gpu_subgraph.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/tracking/subgraphs/renderer_gpu.pbtxt)
-
-```bash
-# MediaPipe object tracking rendering subgraph.
-
-type: "RendererSubgraph"
-
-input_stream: "IMAGE:input_image"
-input_stream: "DETECTIONS:detections"
-output_stream: "IMAGE:output_image"
-
-# Converts the detections to drawing primitives for annotation overlay.
-node {
-  calculator: "DetectionsToRenderDataCalculator"
-  input_stream: "DETECTIONS:detections"
-  output_stream: "RENDER_DATA:detections_render_data"
-  node_options: {
-    [type.googleapis.com/mediapipe.DetectionsToRenderDataCalculatorOptions] {
-      thickness: 4.0
-      color { r: 255 g: 0 b: 0 }
-      render_detection_id: true
-    }
-  }
-}
-
-# Draws annotations and overlays them on top of the input images.
-node {
-  calculator: "AnnotationOverlayCalculator"
-  input_stream: "IMAGE_GPU:input_image"
-  input_stream: "detections_render_data"
-  output_stream: "IMAGE_GPU:output_image"
-}
-
-```
-
-## Desktop
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/desktop/object_tracking)
-
-Note that object detection is using TensorFlow Lite on CPU and tracking is using
-CPU.
-
-To build and run the app:
-
-```bash
-bazel build -c opt mediapipe/examples/desktop/object_tracking:object_tracking_cpu \
-  --define MEDIAPIPE_DISABLE_GPU=1
-
-bazel-bin/mediapipe/examples/desktop/object_tracking/object_tracking_cpu \
-  --calculator_graph_config_file=mediapipe/graphs/tracking/object_detection_tracking_desktop_live.pbtxt
-```
+Content moved to
+[MediaPipe Box Tracking](https://google.github.io/mediapipe/solutions/box_tracking)
diff --git a/mediapipe/docs/objectron_mobile_gpu.md b/mediapipe/docs/objectron_mobile_gpu.md
index e0dda48c2..118438de0 100644
--- a/mediapipe/docs/objectron_mobile_gpu.md
+++ b/mediapipe/docs/objectron_mobile_gpu.md
@@ -1,489 +1,2 @@
-# MediaPipe Objectron (GPU)
-
-This doc focuses on the
-[below example graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection_3d/shoe_classic_occlusion_tracking.pbtxt)
-that performs 3D object detection and tracking with TensorFlow Lite on GPU.
-
-Objectron for shoes                                                             | Objectron for chairs
-:-----------------------------------------------------------------------------: | :------------------:
-![objectron_shoe_android_gpu_gif](images/mobile/objectron_shoe_android_gpu.gif) | ![objectron_chair_android_gpu_gif](images/mobile/objectron_chair_android_gpu.gif)
-
-For overall context on MediaPipe Objectron, please read the
-[Google AI Blog](https://mediapipe.page.link/objectron-aiblog). The Objectron's
-ML model (see also the [model card](https://mediapipe.page.link/objectron-mc))
-estimates a 3D bounding box for the detected object.
-
-## Android
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetection3d)
-
-An arm64 build of Objectron for shoes can be
-[downloaded here](https://drive.google.com/open?id=1S0K4hbWt3o31FfQ4QU3Rz7IHrvOUMx1d),
-and for chairs can be
-[downloaded here](https://drive.google.com/open?id=1MM8K-13bXLCVS1EHQ-KgkVyEahEPrKej).
-
-To build and install the Objectron for shoes:
-
-```bash
-bazel build -c opt --config android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetection3d:objectdetection3d
-```
-
-Similarly to build and install the Objectron for chairs, add **--define
-chair=true** flag to build command.
-
-```bash
-bazel build -c opt --define chair=true --config android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetection3d:objectdetection3d
-```
-
-Once the app is built, install in on Android device with:
-
-```bash
-adb install bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetection3d/objectdetection3d.apk
-```
-
-## Graph
-
-The Objectron main graph internally utilizes the Objectron detection subgraph,
-and the Objectron tracking subgraph. To visualize the graph as shown above, copy
-the text specification of the graph below and paste it into
-[MediaPipe Visualizer](https://viz.mediapipe.dev/).
-
-### Main Graph
-
-This is the main graph for the shoe detector. This graph runs detection and
-tracking and renders the output to the display.
-
-![object_detection_mobile_gpu_graph](images/mobile/object_detection_3d_android_gpu.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection_3d/shoe_classic_occlusion_tracking.pbtxt)
-
-```bash
-# MediaPipe object detection 3D with tracking graph.
-
-# Images on GPU coming into and out of the graph.
-input_stream: "input_video"
-output_stream: "output_video"
-
-# Creates a copy of the input_video stream. At the end of the graph, the
-# GlAnimationOverlayCalculator will consume the input_video texture and draws
-# on top of it.
-node: {
-  calculator: "GlScalerCalculator"
-  input_stream: "VIDEO:input_video"
-  output_stream: "VIDEO:input_video_copy"
-}
-
-# Resamples the images by specific frame rate. This calculator is used to
-# control the frequecy of subsequent calculators/subgraphs, e.g. less power
-# consumption for expensive process.
-node {
-  calculator: "PacketResamplerCalculator"
-  input_stream: "DATA:input_video_copy"
-  output_stream: "DATA:sampled_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.PacketResamplerCalculatorOptions] {
-      frame_rate: 5
-    }
-  }
-}
-
-node {
-  calculator: "ObjectronDetectionSubgraphGpu"
-  input_stream: "IMAGE_GPU:sampled_input_video"
-  output_stream: "ANNOTATIONS:objects"
-}
-
-node {
-  calculator: "ObjectronTrackingSubgraphGpu"
-  input_stream: "FRAME_ANNOTATION:objects"
-  input_stream: "IMAGE_GPU:input_video_copy"
-  output_stream: "LIFTED_FRAME_ANNOTATION:lifted_tracked_objects"
-}
-
-# The rendering nodes:
-# We are rendering two meshes: 1) a 3D bounding box, which we overlay directly
-# on the texture, and 2) a shoe CAD model, which we use as an occlusion mask.
-# These models are designed using different tools, so we supply a transformation
-# to bring both of them to the Objectron's coordinate system.
-
-# Creates a model matrices for the tracked object given the lifted 3D points.
-# This calculator does two things: 1) Estimates object's pose (orientation,
-# translation, and scale) from the 3D vertices, and
-# 2) bring the object from the objectron's coordinate system to the renderer
-# (OpenGL) coordinate system. Since the final goal is to render a mesh file on
-# top of the object, we also supply a transformation to bring the mesh to the
-# objectron's coordinate system, and rescale mesh to the unit size.
-node {
-  calculator: "AnnotationsToModelMatricesCalculator"
-  input_stream: "ANNOTATIONS:lifted_tracked_objects"
-  output_stream: "MODEL_MATRICES:model_matrices"
-  node_options: {
-    [type.googleapis.com/mediapipe.AnnotationsToModelMatricesCalculatorOptions] {
-      # Re-scale the CAD model to the size of a unit box
-      model_scale: 0.05
-      model_scale: 0.05
-      model_scale: 0.05
-      # Bring the box CAD model to objectron's coordinate system. This
-      # is equivalent of -pi/2 rotation along the y-axis (right-hand rule):
-      # Eigen::AngleAxisf(-M_PI / 2., Eigen::Vector3f::UnitY())
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: -1.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 1.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 1.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 1.0
-    }
-  }
-}
-
-# Compute the model matrices for the CAD model of the shoe, to be used as an
-# occlusion mask. The model will be rendered at the exact same location as the
-# bounding box.
-node {
-  calculator: "AnnotationsToModelMatricesCalculator"
-  input_stream: "ANNOTATIONS:lifted_tracked_objects"
-  output_stream: "MODEL_MATRICES:mask_model_matrices"
-  #input_side_packet: "MODEL_SCALE:model_scale"
-  node_options: {
-    [type.googleapis.com/mediapipe.AnnotationsToModelMatricesCalculatorOptions] {
-      # Re-scale the CAD model to the size of a unit box
-      model_scale: 0.45
-      model_scale: 0.25
-      model_scale: 0.15
-      # Bring the shoe CAD model to Deep Pursuit 3D's coordinate system. This
-      # is equivalent of -pi/2 rotation along the x-axis (right-hand rule):
-      # Eigen::AngleAxisf(-M_PI / 2., Eigen::Vector3f::UnitX())
-      model_transformation: 1.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 1.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: -1.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 0.0
-      model_transformation: 1.0
-    }
-  }
-}
-
-# Render everything together. First we render the 3D bounding box animation,
-# then we render the occlusion mask.
-node: {
-  calculator: "GlAnimationOverlayCalculator"
-  input_stream: "VIDEO:input_video"
-  input_stream: "MODEL_MATRICES:model_matrices"
-  input_stream: "MASK_MODEL_MATRICES:mask_model_matrices"
-  output_stream: "output_video"
-  input_side_packet: "TEXTURE:box_texture"
-  input_side_packet: "ANIMATION_ASSET:box_asset_name"
-  input_side_packet: "MASK_TEXTURE:obj_texture"
-  input_side_packet: "MASK_ASSET:obj_asset_name"
-  node_options: {
-    [type.googleapis.com/mediapipe.GlAnimationOverlayCalculatorOptions] {
-      # Output resolution is 480x640 with the aspect ratio of 0.75
-      aspect_ratio: 0.75
-      vertical_fov_degrees: 70.
-      animation_speed_fps: 25
-    }
-  }
-}
-
-```
-
-### Objectron Detection Subgraph
-
-Objectron detection subgraph uses the *TfLiteInferenceCalculator* to run
-inference and decodes the output tensor to *FrameAnnotation* protobuf. The
-*FrameAnnotation* contains nine keypoints: the bounding box's center, as well as
-its eight vertices. The boxes will be passed to the Objectron tracking subgraph.
-
-![object_detection_subgraph](images/mobile/objectron_detection_subgraph.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection_3d/subgraphs/objectron_detection_gpu.pbtxt)
-
-```bash
-# MediaPipe Objectron detection gpu subgraph
-
-type: "ObjectronDetectionSubgraphGpu"
-
-input_stream: "IMAGE_GPU:input_video"
-output_stream: "ANNOTATIONS:objects"
-
-# Transforms the input image on GPU to a 480x640 image. To scale the input
-# image, the scale_mode option is set to FIT to preserve the aspect ratio,
-# resulting in potential letterboxing in the transformed image.
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE_GPU:input_video"
-  output_stream: "IMAGE_GPU:transformed_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 480
-      output_height: 640
-      scale_mode: FIT
-    }
-  }
-}
-
-# Converts the transformed input image on GPU into an image tensor stored as a
-# TfLiteTensor.
-node {
-  calculator: "TfLiteConverterCalculator"
-  input_stream: "IMAGE_GPU:transformed_input_video"
-  output_stream: "TENSORS_GPU:image_tensor"
-}
-
-# Generates a single side packet containing a TensorFlow Lite op resolver that
-# supports custom ops needed by the model used in this graph.
-node {
-  calculator: "TfLiteCustomOpResolverCalculator"
-  output_side_packet: "opresolver"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteCustomOpResolverCalculatorOptions] {
-      use_gpu: true
-    }
-  }
-}
-
-# Runs a TensorFlow Lite model on GPU that takes an image tensor and outputs a
-# vector of tensors representing, for instance, detection boxes/keypoints and
-# scores.
-node {
-  calculator: "TfLiteInferenceCalculator"
-  input_stream: "TENSORS_GPU:image_tensor"
-  output_stream: "TENSORS:detection_tensors"
-  input_side_packet: "CUSTOM_OP_RESOLVER:opresolver"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteInferenceCalculatorOptions] {
-      model_path: "object_detection_3d.tflite"
-    }
-  }
-}
-
-# Decodes the model's output tensor (the heatmap and the distance fields) to 2D
-# keypoints. There are nine 2D keypoints: one center keypoint and eight vertices
-# for the 3D bounding box. The calculator parameters determine's the decoder's
-# sensitivity.
-node {
-  calculator: "TfLiteTensorsToObjectsCalculator"
-  input_stream: "TENSORS:detection_tensors"
-  output_stream: "ANNOTATIONS:objects"
-  node_options: {
-    [type.googleapis.com/mediapipe.TfLiteTensorsToObjectsCalculatorOptions] {
-      num_classes: 1
-      num_keypoints: 9
-      decoder_config {
-        heatmap_threshold: 0.6
-        local_max_distance: 2
-        offset_scale_coef: 1.0
-        voting_radius: 2
-        voting_allowance: 1
-        voting_threshold: 0.2
-      }
-    }
-  }
-}
-```
-
-### Object Tracking Subgraph
-
-Object tracking subgraph uses a *BoxTracker* calculator which is a generic
-tracking library, also used in
-[Mediapipe's 2D Object Detection and Tracking](https://github.com/google/mediapipe/tree/master/mediapipe/g3doc/object_tracking_mobile_gpu.md).
-The tracking runs every frame and when a new detection is available, it
-consolidates the detection and tracking results. The tracker tracks the box with
-its 2D keypoints, so at the end we lift the 2D keypoints to 3D using EPnP
-algorithm in *Lift2DFrameAnnotationTo3D* Calculator.
-
-![object_tracking_subgraph](images/mobile/objectron_tracking_subgraph.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/object_detection_3d/subgraphs/objectron_tracking_gpu.pbtxt)
-
-```bash
-# MediaPipe Objectron tracking gpu subgraph
-
-type: "ObjectronTrackingSubgraphGpu"
-
-input_stream: "FRAME_ANNOTATION:objects"
-input_stream: "IMAGE_GPU:input_video"
-output_stream: "LIFTED_FRAME_ANNOTATION:lifted_tracked_objects"
-
-
-# Converts the detected keypoints to Boxes, used by the tracking subgraph.
-node {
-  calculator: "FrameAnnotationToTimedBoxListCalculator"
-  input_stream: "FRAME_ANNOTATION:objects"
-  output_stream: "BOXES:start_pos"
-}
-
-node: {
-  calculator: "ImageTransformationCalculator"
-  input_stream: "IMAGE_GPU:input_video"
-  output_stream: "IMAGE_GPU:downscaled_input_video"
-  node_options: {
-    [type.googleapis.com/mediapipe.ImageTransformationCalculatorOptions] {
-      output_width: 240
-      output_height: 320
-    }
-  }
-}
-
-# Converts GPU buffer to ImageFrame for processing tracking.
-node: {
-  calculator: "GpuBufferToImageFrameCalculator"
-  input_stream: "downscaled_input_video"
-  output_stream: "downscaled_input_video_cpu"
-}
-
-# Performs motion analysis on an incoming video stream.
-node: {
-  calculator: "MotionAnalysisCalculator"
-  input_stream: "VIDEO:downscaled_input_video_cpu"
-  output_stream: "CAMERA:camera_motion"
-  output_stream: "FLOW:region_flow"
-
-  node_options: {
-    [type.googleapis.com/mediapipe.MotionAnalysisCalculatorOptions]: {
-      analysis_options {
-        analysis_policy: ANALYSIS_POLICY_CAMERA_MOBILE
-        flow_options {
-          fast_estimation_min_block_size: 100
-          top_inlier_sets: 1
-          frac_inlier_error_threshold: 3e-3
-          downsample_mode: DOWNSAMPLE_TO_INPUT_SIZE
-          verification_distance: 5.0
-          verify_long_feature_acceleration: true
-          verify_long_feature_trigger_ratio: 0.1
-          tracking_options {
-            max_features: 500
-            adaptive_extraction_levels: 2
-            min_eig_val_settings {
-              adaptive_lowest_quality_level: 2e-4
-            }
-            klt_tracker_implementation: KLT_OPENCV
-          }
-        }
-      }
-    }
-  }
-}
-
-# Reads optical flow fields defined in
-# mediapipe/framework/formats/motion/optical_flow_field.h,
-# returns a VideoFrame with 2 channels (v_x and v_y), each channel is quantized
-# to 0-255.
-node: {
-  calculator: "FlowPackagerCalculator"
-  input_stream: "FLOW:region_flow"
-  input_stream: "CAMERA:camera_motion"
-  output_stream: "TRACKING:tracking_data"
-
-  node_options: {
-    [type.googleapis.com/mediapipe.FlowPackagerCalculatorOptions]: {
-      flow_packager_options: {
-        binary_tracking_data_support: false
-      }
-    }
-  }
-}
-
-# Tracks box positions over time.
-node: {
-  calculator: "BoxTrackerCalculator"
-  input_stream: "TRACKING:tracking_data"
-  input_stream: "TRACK_TIME:input_video"
-  input_stream: "START_POS:start_pos"
-  input_stream: "CANCEL_OBJECT_ID:cancel_object_id"
-  input_stream_info: {
-    tag_index: "CANCEL_OBJECT_ID"
-    back_edge: true
-  }
-  output_stream: "BOXES:boxes"
-
-  input_stream_handler {
-    input_stream_handler: "SyncSetInputStreamHandler"
-    options {
-      [mediapipe.SyncSetInputStreamHandlerOptions.ext] {
-        sync_set {
-          tag_index: "TRACKING"
-          tag_index: "TRACK_TIME"
-        }
-        sync_set {
-          tag_index: "START_POS"
-        }
-        sync_set {
-          tag_index: "CANCEL_OBJECT_ID"
-        }
-      }
-    }
-  }
-
-  node_options: {
-    [type.googleapis.com/mediapipe.BoxTrackerCalculatorOptions]: {
-      tracker_options: {
-        track_step_options {
-          track_object_and_camera: true
-          tracking_degrees: TRACKING_DEGREE_OBJECT_ROTATION_SCALE
-          inlier_spring_force: 0.0
-          static_motion_temporal_ratio: 3e-2
-        }
-      }
-      visualize_tracking_data: false
-      streaming_track_data_cache_size: 100
-    }
-  }
-}
-
-# Consolidates tracking and detection results.
-node {
-  calculator: "FrameAnnotationTrackerCalculator"
-  input_stream: "FRAME_ANNOTATION:objects"
-  input_stream: "TRACKED_BOXES:boxes"
-  output_stream: "TRACKED_FRAME_ANNOTATION:tracked_objects"
-  output_stream: "CANCEL_OBJECT_ID:cancel_object_id"
-  node_options: {
-    [type.googleapis.com/mediapipe.FrameAnnotationTrackerCalculatorOptions] {
-      img_width: 240
-      img_height: 320
-    }
-  }
-
-  input_stream_handler {
-    input_stream_handler: "SyncSetInputStreamHandler"
-    options {
-      [mediapipe.SyncSetInputStreamHandlerOptions.ext] {
-        sync_set {
-          tag_index: "FRAME_ANNOTATION"
-        }
-        sync_set {
-          tag_index: "TRACKED_BOXES"
-        }
-      }
-    }
-  }
-}
-
-# Lift the tracked 2D keypoints to 3D using EPnP algorithm.
-node {
-  calculator: "Lift2DFrameAnnotationTo3DCalculator"
-  input_stream: "FRAME_ANNOTATION:tracked_objects"
-  output_stream: "LIFTED_FRAME_ANNOTATION:lifted_tracked_objects"
-}
-```
+Content moved to
+[MediaPipe Objectron](https://google.github.io/mediapipe/solutions/objectron)
diff --git a/mediapipe/docs/profiler_config.md b/mediapipe/docs/profiler_config.md
deleted file mode 100644
index 08ce18f6b..000000000
--- a/mediapipe/docs/profiler_config.md
+++ /dev/null
@@ -1,74 +0,0 @@
-# Profiler Configuration Settings
-
-<!--*
-# Document freshness: For more information, see go/fresh-source.
-freshness: { owner: 'mhays' reviewed: '2020-05-08' }
-*-->
-
-[TOC]
-
-The following settings are used when setting up [MediaPipe Tracing](tracer.md)
-Many of them are advanced and not recommended for general usage. Consult
-[MediaPipe Tracing](tracer.md) for a friendlier introduction.
-
-histogram_interval_size_usec :Specifies the size of the runtimes histogram
-intervals (in microseconds) to generate the histogram of the Process() time. The
-last interval extends to +inf. If not specified, the interval is 1000000 usec =
-1 sec.
-
-num_histogram_intervals :Specifies the number of intervals to generate the
-histogram of the `Process()` runtime. If not specified, one interval is used.
-
-enable_profiler
-:   If true, the profiler starts profiling when graph is initialized.
-
-enable_stream_latency
-:   If true, the profiler also profiles the stream latency and input-output
-    latency. No-op if enable_profiler is false.
-
-use_packet_timestamp_for_added_packet
-:   If true, the profiler uses packet timestamp (as production time and source
-    production time) for packets added by calling
-    `CalculatorGraph::AddPacketToInputStream()`. If false, uses the profiler's
-    clock.
-
-trace_log_capacity
-:   The maximum number of trace events buffered in memory. The default value
-    buffers up to 20000 events.
-
-trace_event_types_disabled
-:   Trace event types that are not logged.
-
-trace_log_path
-:   The output directory and base-name prefix for trace log files. Log files are
-    written to: StrCat(trace_log_path, index, "`.binarypb`")
-
-trace_log_count
-:   The number of trace log files retained. The trace log files are named
-    "`trace_0.log`" through "`trace_k.log`". The default value specifies 2
-    output files retained.
-
-trace_log_interval_usec
-:   The interval in microseconds between trace log output. The default value
-    specifies trace log output once every 0.5 sec.
-
-trace_log_margin_usec
-:   The interval in microseconds between TimeNow and the highest times included
-    in trace log output. This margin allows time for events to be appended to
-    the TraceBuffer.
-
-trace_log_duration_events
-:   False specifies an event for each calculator invocation. True specifies a
-    separate event for each start and finish time.
-
-trace_log_interval_count
-:   The number of trace log intervals per file. The total log duration is:
-    `trace_log_interval_usec * trace_log_file_count * trace_log_interval_count`.
-    The default value specifies 10 intervals per file.
-
-trace_log_disabled
-:   An option to turn ON/OFF writing trace files to disk. Saving trace files to
-    disk is enabled by default.
-
-trace_enabled
-:   If true, tracer timing events are recorded and reported.
diff --git a/mediapipe/docs/template_matching_desktop_cpu.md b/mediapipe/docs/template_matching_desktop_cpu.md
deleted file mode 100644
index 97b2cb3f7..000000000
--- a/mediapipe/docs/template_matching_desktop_cpu.md
+++ /dev/null
@@ -1,31 +0,0 @@
-# Template Matching using KNIFT on Desktop
-
-This doc focuses on the
-[example graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/template_matching/template_matching_desktop.pbtxt)
-that performs template matching with KNIFT (Keypoint Neural Invariant Feature
-Transform) on desktop CPU.
-
-If you are interested in more detail about KNIFT or running the example on
-mobile, please see
-[Template Matching using KNIFT on Mobile (CPU)](template_matching_mobile_cpu.md).
-
-To build the desktop app, run:
-
-```bash
-$ bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 \
-    mediapipe/examples/desktop/template_matching:template_matching_tflite
-```
-
-To run the desktop app, please specify a template index file
-([example](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_index.pb)) and a
-video to be matched. For how to build your own index file, please see
-[here](template_matching_mobile_cpu.md#build-index-file).
-
-```bash
-$ GLOG_logtostderr=1 bazel-bin/mediapipe/examples/desktop/template_matching/template_matching_tflite \
-    --calculator_graph_config_file=mediapipe/graphs/template_matching/template_matching_desktop.pbtxt --input_side_packets="input_video_path=<input video path>,output_video_path=<output video path>"
-```
-
-## Graph
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/template_matching/template_matching_desktop.pbtxt)
diff --git a/mediapipe/docs/template_matching_mobile_cpu.md b/mediapipe/docs/template_matching_mobile_cpu.md
index 78d813442..b3b945b8b 100644
--- a/mediapipe/docs/template_matching_mobile_cpu.md
+++ b/mediapipe/docs/template_matching_mobile_cpu.md
@@ -1,94 +1,2 @@
-# Template Matching using KNIFT on Mobile (CPU)
-
-This doc focuses on the
-[example graph](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/template_matching/template_matching_mobile_cpu.pbtxt)
-that performs template matching with KNIFT (Keypoint Neural Invariant Feature
-Transform) on mobile CPU.
-
-![template_matching_mobile_cpu.gif](images/mobile/template_matching_android_cpu.gif)
-
-In the visualization above, the green dots represent detected keypoints on each
-frame and the red box represents the targets matched by templates using KNIFT
-features (see also [model card](https://mediapipe.page.link/knift-mc)). For more
-information, please see
-[Google Developers Blog](https://mediapipe.page.link/knift-blog).
-
-## Build Index Files
-
-In MediaPipe, we've already provided a file in
-[knift_index.pb](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_index.pb),
-pre-computed from the 3 template images (of USD bills) shown below. If you'd
-like to use your own template images, please follow the steps below, or
-otherwise you can jump directly to [Android](#android).
-
-![template_matching_mobile_template.jpg](images/mobile/template_matching_mobile_template.jpg)
-
-### Step 1:
-
-Put all template images in a single directory.
-
-### Step 2:
-
-To build the index file for all templates in the directory, run:
-
-```bash
-$ bazel build -c opt --define MEDIAPIPE_DISABLE_GPU=1 \
-    mediapipe/examples/desktop/template_matching:template_matching_tflite
-$ bazel-bin/mediapipe/examples/desktop/template_matching/template_matching_tflite \
-    --calculator_graph_config_file=mediapipe/graphs/template_matching/index_building.pbtxt \
-    --input_side_packets="file_directory=<template image directory>,file_suffix=png,output_index_filename=<output index filename>"
-```
-
-The output index file includes the extracted KNIFT features.
-
-### Step 3:
-
-Replace
-[mediapipe/models/knift_index.pb](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_index.pb)
-with the index file you generated, and update
-[mediapipe/models/knift_labelmap.txt](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_labelmap.txt)
-with your own template names.
-
-## Android
-
-[Source](https://github.com/google/mediapipe/tree/master/mediapipe/examples/android/src/java/com/google/mediapipe/apps/templatematchingcpu)
-
-A prebuilt arm64 APK can be
-[downloaded here](https://drive.google.com/open?id=1tSWRfes9rAM4NrzmJBplguNQQvaeBZSa).
-
-To build and install the app yourself, run:
-
-Note: MediaPipe uses OpenCV 3 by default. However, because of
-[issues](https://github.com/opencv/opencv/issues/11488) between NDK 17+ and
-OpenCV 3 when using
-[knnMatch](https://docs.opencv.org/3.4/db/d39/classcv_1_1DescriptorMatcher.html#a378f35c9b1a5dfa4022839a45cdf0e89),
-please use the following commands to temporarily switch to OpenCV 4 for the
-template matching exmaple on Android, and switch back to OpenCV 3 afterwards.
-
-```bash
-# Switch to OpenCV 4
-sed -i -e 's:3.4.3/opencv-3.4.3:4.0.1/opencv-4.0.1:g' WORKSPACE
-sed -i -e 's:libopencv_java3:libopencv_java4:g' third_party/opencv_android.BUILD
-
-# Build and install app
-bazel build -c opt --config=android_arm64 mediapipe/examples/android/src/java/com/google/mediapipe/apps/templatematchingcpu:templatematchingcpu
-adb install -r bazel-bin/mediapipe/examples/android/src/java/com/google/mediapipe/apps/templatematchingcpu/templatematchingcpu.apk
-
-# Switch back to OpenCV 3
-sed -i -e 's:4.0.1/opencv-4.0.1:3.4.3/opencv-3.4.3:g' WORKSPACE
-sed -i -e 's:libopencv_java4:libopencv_java3:g' third_party/opencv_android.BUILD
-```
-
-## Use XNNPACK Delegate
-
-The example uses XNNPACK delegate by default. Users can change the
-[option in TfLiteInferenceCalculator](https://github.com/google/mediapipe/tree/master/mediapipe/calculators/tflite/tflite_inference_calculator.proto)
-to use default TF Lite inference.
-
-## Graph
-
-### Main Graph
-
-![template_matching_mobile_graph](images/mobile/template_matching_mobile_graph.png)
-
-[Source pbtxt file](https://github.com/google/mediapipe/tree/master/mediapipe/graphs/template_matching/template_matching_mobile_cpu.pbtxt)
+Content moved to
+[MediaPipe KNIFT](https://google.github.io/mediapipe/solutions/knift)
diff --git a/mediapipe/docs/web.md b/mediapipe/docs/web.md
deleted file mode 100644
index 15c1e2a5f..000000000
--- a/mediapipe/docs/web.md
+++ /dev/null
@@ -1,25 +0,0 @@
-## MediaPipe on the Web
-
-MediaPipe on the Web is an effort to use [WebAssembly](https://webassembly.org/)
-to bring MediaPipe graphs, calculators, and related technologies to the web. The
-aim is to have all the pieces (ML, rendering, and processing) running directly
-in the browser client-side. The official API is under construction, but the core
-technology has been proven effective, and we can already show interactive
-cross-platform demos using your live webcam.
-
-[For more details, read this Google Developer blog post](https://mediapipe.page.link/webdevblog)
-
-![image](images/web_effect.gif) ![image](images/web_segmentation.gif)
-
-### Hand Tracking (with and without SIMD support)
-
-For [Chrome Developer Summit 2019](https://developer.chrome.com/devsummit/), we
-used this technology to showcase the potential for performance improvements
-using Chrome experimental [WebAssembly SIMD](https://github.com/WebAssembly/simd)
-support.  Below are two different versions of the
-[MediaPipe Hand Tracking Example](https://mediapipe.readthedocs.io/en/latest/hand_tracking_desktop.html)
- running on the web:
-
-  1. WebAssembly MVP [demo](https://mediapipe.page.link/cds-ht) running around 5-8 frames per second on Desktop Chrome
-
-  2. WebAssembly SIMD [demo](https://mediapipe.page.link/cds-ht-simd) running around 15-18 frames per second on *Canary* Chrome for Desktop, which must additionally be launched with the option `--js-flags="--experimental-wasm-simd"`
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/AndroidManifest.xml b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/AndroidManifest.xml
index b5318afe3..99288624c 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/AndroidManifest.xml
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/AndroidManifest.xml
@@ -31,5 +31,6 @@
       <meta-data android:name="binaryGraphName" android:value="${binaryGraphName}"/>
       <meta-data android:name="inputVideoStreamName" android:value="${inputVideoStreamName}"/>
       <meta-data android:name="outputVideoStreamName" android:value="${outputVideoStreamName}"/>
+      <meta-data android:name="flipFramesVertically" android:value="${flipFramesVertically}"/>
   </application>
 </manifest>
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/BUILD
index 3c6695414..04e660a7d 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/BUILD
@@ -73,6 +73,7 @@ android_binary(
         "binaryGraphName": "mobile_gpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/MainActivity.java b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/MainActivity.java
index b35fd3c3e..ab2fc47ab 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/MainActivity.java
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/basic/MainActivity.java
@@ -38,10 +38,12 @@ import com.google.mediapipe.glutil.EglManager;
 public class MainActivity extends AppCompatActivity {
   private static final String TAG = "MainActivity";
 
-  // Flips the camera-preview frames vertically before sending them into FrameProcessor to be
-  // processed in a MediaPipe graph, and flips the processed frames back when they are displayed.
-  // This is needed because OpenGL represents images assuming the image origin is at the bottom-left
-  // corner, whereas MediaPipe in general assumes the image origin is at top-left.
+  // Flips the camera-preview frames vertically by default, before sending them into FrameProcessor
+  // to be processed in a MediaPipe graph, and flips the processed frames back when they are
+  // displayed. This may be needed because OpenGL represents images assuming the image origin is at
+  // the bottom-left corner, whereas MediaPipe in general assumes the image origin is at the
+  // top-left corner.
+  // NOTE: use "flipFramesVertically" in manifest metadata to override this behavior.
   private static final boolean FLIP_FRAMES_VERTICALLY = true;
 
   static {
@@ -101,7 +103,11 @@ public class MainActivity extends AppCompatActivity {
             applicationInfo.metaData.getString("binaryGraphName"),
             applicationInfo.metaData.getString("inputVideoStreamName"),
             applicationInfo.metaData.getString("outputVideoStreamName"));
-    processor.getVideoSurfaceOutput().setFlipY(FLIP_FRAMES_VERTICALLY);
+
+    processor
+        .getVideoSurfaceOutput()
+        .setFlipY(
+            applicationInfo.metaData.getBoolean("flipFramesVertically", FLIP_FRAMES_VERTICALLY));
 
     PermissionHelper.checkAndRequestCameraPermissions(this);
   }
@@ -110,7 +116,8 @@ public class MainActivity extends AppCompatActivity {
   protected void onResume() {
     super.onResume();
     converter = new ExternalTextureConverter(eglManager.getContext());
-    converter.setFlipY(FLIP_FRAMES_VERTICALLY);
+    converter.setFlipY(
+        applicationInfo.metaData.getBoolean("flipFramesVertically", FLIP_FRAMES_VERTICALLY));
     converter.setConsumer(processor);
     if (PermissionHelper.cameraPermissionsGranted(this)) {
       startCamera();
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectioncpu/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectioncpu/BUILD
index f24da44eb..ba12b8133 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectioncpu/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectioncpu/BUILD
@@ -50,6 +50,7 @@ android_binary(
         "binaryGraphName": "mobile_cpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectiongpu/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectiongpu/BUILD
index 0f1d694a5..56f6cd040 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectiongpu/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facedetectiongpu/BUILD
@@ -50,6 +50,7 @@ android_binary(
         "binaryGraphName": "mobile_gpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facemeshgpu/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facemeshgpu/BUILD
index 73ff82f9b..0146466dd 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facemeshgpu/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/facemeshgpu/BUILD
@@ -50,6 +50,7 @@ android_binary(
         "binaryGraphName": "face_mesh_mobile_gpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/hairsegmentationgpu/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/hairsegmentationgpu/BUILD
index b9387955a..901576bcf 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/hairsegmentationgpu/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/hairsegmentationgpu/BUILD
@@ -49,6 +49,7 @@ android_binary(
         "binaryGraphName": "mobile_gpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handdetectiongpu/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handdetectiongpu/BUILD
index 1d9012310..6f0b52369 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handdetectiongpu/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handdetectiongpu/BUILD
@@ -50,6 +50,7 @@ android_binary(
         "binaryGraphName": "hand_detection_mobile_gpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handtrackinggpu/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handtrackinggpu/BUILD
index d7ca29074..e9d6d5155 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handtrackinggpu/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/handtrackinggpu/BUILD
@@ -52,6 +52,7 @@ android_binary(
         "binaryGraphName": "hand_tracking_mobile_gpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/multihandtrackinggpu/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/multihandtrackinggpu/BUILD
index 6e01bee9f..be6152554 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/multihandtrackinggpu/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/multihandtrackinggpu/BUILD
@@ -52,6 +52,7 @@ android_binary(
         "binaryGraphName": "multi_hand_tracking_mobile_gpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectioncpu/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectioncpu/BUILD
index 5b273747c..0f14a48a2 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectioncpu/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectioncpu/BUILD
@@ -50,6 +50,7 @@ android_binary(
         "binaryGraphName": "mobile_cpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectiongpu/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectiongpu/BUILD
index 9f5fa722a..84d5364b9 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectiongpu/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objectdetectiongpu/BUILD
@@ -50,6 +50,7 @@ android_binary(
         "binaryGraphName": "mobile_gpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objecttrackinggpu/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objecttrackinggpu/BUILD
index 97f4c408c..75f9c075e 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objecttrackinggpu/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/objecttrackinggpu/BUILD
@@ -50,6 +50,7 @@ android_binary(
         "binaryGraphName": "mobile_gpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/templatematchingcpu/BUILD b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/templatematchingcpu/BUILD
index 4e0ad1208..4ca58d99b 100644
--- a/mediapipe/examples/android/src/java/com/google/mediapipe/apps/templatematchingcpu/BUILD
+++ b/mediapipe/examples/android/src/java/com/google/mediapipe/apps/templatematchingcpu/BUILD
@@ -51,6 +51,7 @@ android_binary(
         "binaryGraphName": "mobile_cpu.binarypb",
         "inputVideoStreamName": "input_video",
         "outputVideoStreamName": "output_video",
+        "flipFramesVertically": "True",
     },
     multidex = "native",
     deps = [
diff --git a/mediapipe/examples/coral/README.md b/mediapipe/examples/coral/README.md
index de01b6dc2..a65f449bb 100644
--- a/mediapipe/examples/coral/README.md
+++ b/mediapipe/examples/coral/README.md
@@ -116,6 +116,8 @@ Docker container for building MediaPipe applications that run on Edge TPU.
 
 * Object detection demo
 
+![Object Detection running on Coral](./images/object_detection_demo_coral.jpg)
+
         bazel build -c opt --crosstool_top=@crosstool//:toolchains --compiler=gcc --cpu=aarch64 --define MEDIAPIPE_DISABLE_GPU=1 --copt -DMEDIAPIPE_EDGE_TPU --copt=-flax-vector-conversions mediapipe/examples/coral:object_detection_tpu
 
  Copy object_detection_tpu binary to the MediaPipe checkout on the coral device
@@ -127,6 +129,8 @@ Docker container for building MediaPipe applications that run on Edge TPU.
 
 * Face detection demo
 
+![Face Detection running on Coral](./images/face_detection_demo_coral.gif)
+
         bazel build -c opt --crosstool_top=@crosstool//:toolchains --compiler=gcc --cpu=aarch64 --define MEDIAPIPE_DISABLE_GPU=1 --copt -DMEDIAPIPE_EDGE_TPU --copt=-flax-vector-conversions mediapipe/examples/coral:face_detection_tpu
 
  Copy face_detection_tpu binary to the MediaPipe checkout on the coral device
diff --git a/mediapipe/docs/images/face_detection_demo_coral.gif b/mediapipe/examples/coral/images/face_detection_demo_coral.gif
similarity index 100%
rename from mediapipe/docs/images/face_detection_demo_coral.gif
rename to mediapipe/examples/coral/images/face_detection_demo_coral.gif
diff --git a/mediapipe/docs/images/object_detection_demo_coral.jpg b/mediapipe/examples/coral/images/object_detection_demo_coral.jpg
similarity index 100%
rename from mediapipe/docs/images/object_detection_demo_coral.jpg
rename to mediapipe/examples/coral/images/object_detection_demo_coral.jpg
diff --git a/mediapipe/examples/desktop/autoflip/BUILD b/mediapipe/examples/desktop/autoflip/BUILD
index f7507b040..db4625401 100644
--- a/mediapipe/examples/desktop/autoflip/BUILD
+++ b/mediapipe/examples/desktop/autoflip/BUILD
@@ -30,7 +30,9 @@ mediapipe_cc_proto_library(
     name = "autoflip_messages_cc_proto",
     srcs = ["autoflip_messages.proto"],
     cc_deps = ["//mediapipe/framework:calculator_cc_proto"],
-    visibility = ["//mediapipe/examples:__subpackages__"],
+    visibility = [
+        "//mediapipe/examples:__subpackages__",
+    ],
     deps = [":autoflip_messages_proto"],
 )
 
diff --git a/mediapipe/examples/desktop/autoflip/autoflip_messages.proto b/mediapipe/examples/desktop/autoflip/autoflip_messages.proto
index e77a05f18..726237e6b 100644
--- a/mediapipe/examples/desktop/autoflip/autoflip_messages.proto
+++ b/mediapipe/examples/desktop/autoflip/autoflip_messages.proto
@@ -73,7 +73,7 @@ message RectF {
 
 // An image region of interest (eg a detected face or object), accompanied by an
 // importance score.
-// Next tag: 9
+// Next tag: 10
 message SalientRegion {
   reserved 3;
   // The bounding box for this region in the image.
@@ -98,7 +98,19 @@ message SalientRegion {
 
   // If true, object cannot move in the output window (e.g. text would look
   // strange moving around).
+  // TODO: this feature is not implemented, remove proto field.
   optional bool requires_static_location = 7 [default = false];
+
+  // When used with ContentZoomingCalculator, this flag can be set in the
+  // SignalFusingCalculator indicating that areas outside of these detections
+  // can be cropped from the frame.  When no salient regions have this flag set
+  // true, no zooming is performed.  When one or more salient regions have this
+  // flag set true, the max zoom value will be used that keeps all
+  // "only_required" detections within view.  The ContentZoomingCalculator
+  // currently supports zooming by finding the size of non-salient top/bottom
+  // borders regions and provides this information to the
+  // SceneCroppingCalculator for reframing.
+  optional bool only_required = 9 [default = false];
 }
 
 // Stores the message type, including standard types (face, object) and custom
@@ -180,4 +192,10 @@ message ExternalRenderFrame {
   optional Color padding_color = 3;
   // Timestamp in microseconds of this frame.
   optional uint64 timestamp_us = 4;
+  // Target width of the cropped video in pixels. |render_to_location| is
+  // relative to this dimension.
+  optional int32 target_width = 5;
+  // Target height of the cropped video in pixels. |render_to_location| is
+  // relative to this dimension.
+  optional int32 target_height = 6;
 }
diff --git a/mediapipe/examples/desktop/autoflip/calculators/BUILD b/mediapipe/examples/desktop/autoflip/calculators/BUILD
index e16b1baf9..3b1712924 100644
--- a/mediapipe/examples/desktop/autoflip/calculators/BUILD
+++ b/mediapipe/examples/desktop/autoflip/calculators/BUILD
@@ -16,7 +16,10 @@ load("//mediapipe/framework/port:build_config.bzl", "mediapipe_cc_proto_library"
 
 licenses(["notice"])  # Apache 2.0
 
-package(default_visibility = ["//mediapipe/examples:__subpackages__"])
+package(default_visibility = [
+    "//mediapipe/examples:__subpackages__",
+    "//mediapipe/viz:__subpackages__",
+])
 
 cc_library(
     name = "border_detection_calculator",
@@ -51,6 +54,44 @@ mediapipe_cc_proto_library(
     deps = [":border_detection_calculator_proto"],
 )
 
+cc_library(
+    name = "content_zooming_calculator",
+    srcs = ["content_zooming_calculator.cc"],
+    deps = [
+        ":content_zooming_calculator_cc_proto",
+        "//mediapipe/examples/desktop/autoflip:autoflip_messages_cc_proto",
+        "//mediapipe/examples/desktop/autoflip/quality:kinematic_path_solver",
+        "//mediapipe/framework:calculator_framework",
+        "//mediapipe/framework/formats:image_frame",
+        "//mediapipe/framework/formats:image_frame_opencv",
+        "//mediapipe/framework/port:ret_check",
+        "//mediapipe/framework/port:status",
+    ],
+    alwayslink = 1,
+)
+
+proto_library(
+    name = "content_zooming_calculator_proto",
+    srcs = ["content_zooming_calculator.proto"],
+    deps = [
+        "//mediapipe/examples/desktop/autoflip/quality:kinematic_path_solver_proto",
+        "//mediapipe/framework:calculator_proto",
+    ],
+)
+
+mediapipe_cc_proto_library(
+    name = "content_zooming_calculator_cc_proto",
+    srcs = ["content_zooming_calculator.proto"],
+    cc_deps = [
+        "//mediapipe/examples/desktop/autoflip/quality:kinematic_path_solver_cc_proto",
+        "//mediapipe/framework:calculator_cc_proto",
+    ],
+    visibility = ["//mediapipe/examples:__subpackages__"],
+    deps = [
+        ":content_zooming_calculator_proto",
+    ],
+)
+
 cc_test(
     name = "border_detection_calculator_test",
     srcs = [
@@ -75,6 +116,30 @@ cc_test(
     ],
 )
 
+cc_test(
+    name = "content_zooming_calculator_test",
+    srcs = [
+        "content_zooming_calculator_test.cc",
+    ],
+    linkstatic = 1,
+    deps = [
+        ":content_zooming_calculator",
+        ":content_zooming_calculator_cc_proto",
+        "//mediapipe/examples/desktop/autoflip:autoflip_messages_cc_proto",
+        "//mediapipe/framework:calculator_framework",
+        "//mediapipe/framework:calculator_runner",
+        "//mediapipe/framework/formats:image_frame",
+        "//mediapipe/framework/formats:image_frame_opencv",
+        "//mediapipe/framework/port:benchmark",
+        "//mediapipe/framework/port:gtest_main",
+        "//mediapipe/framework/port:opencv_core",
+        "//mediapipe/framework/port:parse_text_proto",
+        "//mediapipe/framework/port:ret_check",
+        "//mediapipe/framework/port:status",
+        "@com_google_absl//absl/strings",
+    ],
+)
+
 cc_library(
     name = "video_filtering_calculator",
     srcs = ["video_filtering_calculator.cc"],
diff --git a/mediapipe/examples/desktop/autoflip/calculators/content_zooming_calculator.cc b/mediapipe/examples/desktop/autoflip/calculators/content_zooming_calculator.cc
new file mode 100644
index 000000000..38fb72b06
--- /dev/null
+++ b/mediapipe/examples/desktop/autoflip/calculators/content_zooming_calculator.cc
@@ -0,0 +1,280 @@
+// Copyright 2019 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include <algorithm>
+#include <memory>
+
+#include "mediapipe/examples/desktop/autoflip/autoflip_messages.pb.h"
+#include "mediapipe/examples/desktop/autoflip/calculators/content_zooming_calculator.pb.h"
+#include "mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.h"
+#include "mediapipe/framework/calculator_framework.h"
+#include "mediapipe/framework/formats/image_frame.h"
+#include "mediapipe/framework/formats/image_frame_opencv.h"
+#include "mediapipe/framework/port/ret_check.h"
+#include "mediapipe/framework/port/status.h"
+#include "mediapipe/framework/port/status_builder.h"
+
+constexpr char kVideoFrame[] = "VIDEO";
+constexpr char kVideoSize[] = "VIDEO_SIZE";
+constexpr char kDetectionSet[] = "DETECTIONS";
+constexpr char kDetectedBorders[] = "BORDERS";
+// Field-of-view (degrees) of the camera's x-axis (width).
+// TODO: Parameterize FOV based on camera specs.
+constexpr float kWidthFieldOfView = 60;
+
+namespace mediapipe {
+namespace autoflip {
+
+// Content zooming calculator zooms in on content when a detection has
+// "only_required" set true.  It does this by computing the value of top/bottom
+// borders to remove from the output and sends these to the
+// SceneCroppingCalculator.  When more than one detection is received the zoom
+// box is calculated as the union of the detections.  Typical applications
+// include mobile makeover and autofliplive face reframing.  Currently only
+// supports y-dimension zooming.
+class ContentZoomingCalculator : public CalculatorBase {
+ public:
+  ContentZoomingCalculator()
+      : initialized_(false), last_only_required_detection_(0) {}
+  ~ContentZoomingCalculator() override {}
+  ContentZoomingCalculator(const ContentZoomingCalculator&) = delete;
+  ContentZoomingCalculator& operator=(const ContentZoomingCalculator&) = delete;
+
+  static ::mediapipe::Status GetContract(mediapipe::CalculatorContract* cc);
+  ::mediapipe::Status Open(mediapipe::CalculatorContext* cc) override;
+  ::mediapipe::Status Process(mediapipe::CalculatorContext* cc) override;
+
+ private:
+  // Converts bounds to tilt offset and height.
+  ::mediapipe::Status ConvertToTiltZoom(float xmin, float xmax, float ymin,
+                                        float ymax, int* tilt_offset,
+                                        int* height);
+  ContentZoomingCalculatorOptions options_;
+  // Detection frame width/height.
+  int frame_height_;
+  int frame_width_;
+  // Path solver used to smooth top/bottom border crop values.
+  std::unique_ptr<KinematicPathSolver> path_solver_height_;
+  std::unique_ptr<KinematicPathSolver> path_solver_offset_;
+  // Are parameters initialized.
+  bool initialized_;
+  // Stores the time of the last "only_required" input.
+  int64 last_only_required_detection_;
+  // Border values of last message with detection.
+  int last_measured_height_;
+  int last_measured_y_offset_;
+  // Min border values.
+  float min_height_value_;
+};
+REGISTER_CALCULATOR(ContentZoomingCalculator);
+
+::mediapipe::Status ContentZoomingCalculator::GetContract(
+    mediapipe::CalculatorContract* cc) {
+  RET_CHECK(
+      !(cc->Inputs().HasTag(kVideoFrame) && cc->Inputs().HasTag(kVideoSize)))
+      << "Provide only VIDEO or VIDEO_SIZE, not both.";
+  if (cc->Inputs().HasTag(kVideoFrame)) {
+    cc->Inputs().Tag(kVideoFrame).Set<ImageFrame>();
+  } else if (cc->Inputs().HasTag(kVideoSize)) {
+    cc->Inputs().Tag(kVideoSize).Set<std::pair<int, int>>();
+  } else {
+    return ::mediapipe::UnknownErrorBuilder(MEDIAPIPE_LOC)
+           << "Input VIDEO or VIDEO_SIZE must be provided.";
+  }
+  cc->Inputs().Tag(kDetectionSet).Set<DetectionSet>();
+  cc->Outputs().Tag(kDetectedBorders).Set<StaticFeatures>();
+  return ::mediapipe::OkStatus();
+}
+
+::mediapipe::Status ContentZoomingCalculator::Open(
+    mediapipe::CalculatorContext* cc) {
+  options_ = cc->Options<ContentZoomingCalculatorOptions>();
+  if (options_.has_kinematic_options()) {
+    return ::mediapipe::UnknownErrorBuilder(MEDIAPIPE_LOC)
+           << "Deprecated kinematic_options was set, please set "
+              "kinematic_options_zoom and kinematic_options_tilt.";
+  }
+  if (options_.has_min_motion_to_reframe()) {
+    return ::mediapipe::UnknownErrorBuilder(MEDIAPIPE_LOC)
+           << "Deprecated min_motion_to_reframe was set, please set "
+              "in kinematic_options_zoom and kinematic_options_tilt directly.";
+  }
+  return ::mediapipe::OkStatus();
+}
+
+::mediapipe::Status ContentZoomingCalculator::ConvertToTiltZoom(
+    float xmin, float xmax, float ymin, float ymax, int* tilt_offset,
+    int* height) {
+  // Find center of the y-axis offset (for tilt control).
+  float y_center = ymin + (ymax - ymin) / 2;
+  // Find size and apply scale factor to y-axis.
+  float fit_size = fmax((ymax - ymin) / options_.scale_factor(), xmax - xmin);
+  // Apply min zoom for cases where the target size is wider than input frame
+  // size.
+  fit_size = fmin(min_height_value_, fit_size);
+  // Prevent box from extending beyond the image.
+  if (y_center - fit_size / 2 < 0) {
+    y_center = fit_size / 2;
+  } else if (y_center + fit_size / 2 > 1) {
+    y_center = 1 - fit_size / 2;
+  }
+  // Scale to pixel coordinates.
+  *tilt_offset = frame_height_ * y_center;
+  *height = frame_height_ * fit_size;
+  return ::mediapipe::OkStatus();
+}
+
+namespace {
+::mediapipe::Status UpdateRanges(const SalientRegion& region, float* xmin,
+                                 float* xmax, float* ymin, float* ymax) {
+  if (!region.has_location_normalized()) {
+    return ::mediapipe::UnknownErrorBuilder(MEDIAPIPE_LOC)
+           << "SalientRegion did not have location normalized set.";
+  }
+  *xmin = fmin(*xmin, region.location_normalized().x());
+  *xmax = fmax(*xmax, region.location_normalized().x() +
+                          region.location_normalized().width());
+  *ymin = fmin(*ymin, region.location_normalized().y());
+  *ymax = fmax(*ymax, region.location_normalized().y() +
+                          region.location_normalized().height());
+
+  return ::mediapipe::OkStatus();
+}
+void MakeStaticFeatures(const int top_border, const int bottom_border,
+                        const int frame_width, const int frame_height,
+                        StaticFeatures* static_feature) {
+  auto border_top = static_feature->add_border();
+  border_top->set_relative_position(Border::TOP);
+  border_top->mutable_border_position()->set_x(0);
+  border_top->mutable_border_position()->set_y(0);
+  border_top->mutable_border_position()->set_width(frame_width);
+  border_top->mutable_border_position()->set_height(top_border);
+
+  auto border_bottom = static_feature->add_border();
+  border_bottom->set_relative_position(Border::BOTTOM);
+  border_bottom->mutable_border_position()->set_x(0);
+  border_bottom->mutable_border_position()->set_y(frame_height - bottom_border);
+  border_bottom->mutable_border_position()->set_width(frame_width);
+  border_bottom->mutable_border_position()->set_height(bottom_border);
+}
+}  // namespace
+
+::mediapipe::Status ContentZoomingCalculator::Process(
+    mediapipe::CalculatorContext* cc) {
+  if (cc->Inputs().HasTag(kVideoFrame)) {
+    cv::Mat frame = mediapipe::formats::MatView(
+        &cc->Inputs().Tag(kVideoFrame).Get<ImageFrame>());
+    frame_width_ = frame.cols;
+    frame_height_ = frame.rows;
+  } else if (cc->Inputs().HasTag(kVideoSize)) {
+    frame_width_ =
+        cc->Inputs().Tag(kVideoSize).Get<std::pair<int, int>>().first;
+    frame_height_ =
+        cc->Inputs().Tag(kVideoSize).Get<std::pair<int, int>>().second;
+  } else {
+    return ::mediapipe::UnknownErrorBuilder(MEDIAPIPE_LOC)
+           << "Input VIDEO or VIDEO_SIZE must be provided.";
+  }
+
+  if (!initialized_) {
+    path_solver_height_ = std::make_unique<KinematicPathSolver>(
+        options_.kinematic_options_zoom(), 0, frame_height_,
+        static_cast<float>(frame_width_) / kWidthFieldOfView);
+    path_solver_offset_ = std::make_unique<KinematicPathSolver>(
+        options_.kinematic_options_tilt(), 0, frame_height_,
+        static_cast<float>(frame_width_) / kWidthFieldOfView);
+    min_height_value_ = 1.0;
+    // If target size is set and wider than input aspect, make sure to always
+    // crop the min required amount.
+    if (options_.has_target_size()) {
+      RET_CHECK_GT(options_.target_size().width(), 0)
+          << "Provided target width not valid.";
+      RET_CHECK_GT(options_.target_size().height(), 0)
+          << "Provided target height not valid.";
+      float input_aspect = frame_width_ / static_cast<float>(frame_height_);
+      float target_aspect = options_.target_size().width() /
+                            static_cast<float>(options_.target_size().height());
+      min_height_value_ =
+          (input_aspect < target_aspect) ? input_aspect / target_aspect : 1.0;
+    }
+    last_measured_height_ = min_height_value_ * frame_height_;
+    last_measured_y_offset_ = frame_height_ / 2;  // Vertical frame center.
+    initialized_ = true;
+  }
+
+  auto detection_set = cc->Inputs().Tag(kDetectionSet).Get<DetectionSet>();
+  bool only_required_found = false;
+
+  // Compute the box that contains all "only_required" detections.
+  float xmin = 1, ymin = 1, xmax = 0, ymax = 0;
+  for (const auto& region : detection_set.detections()) {
+    if (!region.only_required()) {
+      continue;
+    }
+    only_required_found = true;
+    MP_RETURN_IF_ERROR(UpdateRanges(region, &xmin, &xmax, &ymin, &ymax));
+  }
+
+  // Convert bounds to tilt/zoom and in pixel coordinates.
+  int offset, height;
+  MP_RETURN_IF_ERROR(
+      ConvertToTiltZoom(xmin, xmax, ymin, ymax, &offset, &height));
+
+  if (only_required_found) {
+    // An only_required detection was found.
+    last_only_required_detection_ = cc->InputTimestamp().Microseconds();
+    last_measured_height_ = height;
+    last_measured_y_offset_ = offset;
+  } else if (cc->InputTimestamp().Microseconds() -
+                 last_only_required_detection_ >=
+             options_.us_before_zoomout()) {
+    // No only_required detections found in any salient region packet that
+    // arrived within the last us_before_zoomout microseconds; zoom out fully.
+    height = min_height_value_ * frame_height_;
+    offset = frame_height_ / 2;
+  } else {
+    // No only_required detection found, but reuse the last measurement because
+    // the us_before_zoomout window has not elapsed yet.
+    height = last_measured_height_;
+    offset = last_measured_y_offset_;
+  }
+
+  // Compute smoothed camera paths.
+  MP_RETURN_IF_ERROR(path_solver_height_->AddObservation(
+      height, cc->InputTimestamp().Microseconds()));
+  MP_RETURN_IF_ERROR(path_solver_offset_->AddObservation(
+      offset, cc->InputTimestamp().Microseconds()));
+  int path_size;
+  MP_RETURN_IF_ERROR(path_solver_height_->GetState(&path_size));
+  int path_offset;
+  MP_RETURN_IF_ERROR(path_solver_offset_->GetState(&path_offset));
+
+  // Convert to top/bottom borders to remove.
+  int path_top = path_offset - path_size / 2;
+  int path_bottom = frame_height_ - (path_offset + path_size / 2);
+
+  // Transmit result downstream.
+  std::unique_ptr<StaticFeatures> features =
+      absl::make_unique<StaticFeatures>();
+  MakeStaticFeatures(path_top, path_bottom, frame_width_, frame_height_,
+                     features.get());
+  cc->Outputs()
+      .Tag(kDetectedBorders)
+      .AddPacket(Adopt(features.release()).At(cc->InputTimestamp()));
+
+  return ::mediapipe::OkStatus();
+}
+
+}  // namespace autoflip
+}  // namespace mediapipe
diff --git a/mediapipe/examples/desktop/autoflip/calculators/content_zooming_calculator.proto b/mediapipe/examples/desktop/autoflip/calculators/content_zooming_calculator.proto
new file mode 100644
index 000000000..78d7c9e93
--- /dev/null
+++ b/mediapipe/examples/desktop/autoflip/calculators/content_zooming_calculator.proto
@@ -0,0 +1,51 @@
+// Copyright 2019 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+syntax = "proto2";
+
+package mediapipe.autoflip;
+
+import "mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.proto";
+import "mediapipe/framework/calculator.proto";
+
+message ContentZoomingCalculatorOptions {
+  extend mediapipe.CalculatorOptions {
+    optional ContentZoomingCalculatorOptions ext = 313091992;
+  }
+  // Amount the only required area should fill the image.  When set to 1,
+  // reframing is done to remove content to the very edge of the salient region
+  // bounding box.  When a smaller value is used, zooming will be done to fill
+  // this ratio of the frame.
+  optional float scale_factor = 1 [default = .9];
+  // Kinematic options for zooming.
+  optional KinematicOptions kinematic_options_zoom = 6;
+  // Kinematic options for tilt (y-axis reframing).
+  optional KinematicOptions kinematic_options_tilt = 7;
+  // Duration (in microseconds) before returning to fully zoomed out position
+  // when no "only_required" frames are received.
+  optional int64 us_before_zoomout = 9 [default = 1000000];
+  // Value of target output size, required to be set if different than input.
+  // Should match target_width and target_height in SceneCroppingCalculator.
+  message Size {
+    optional int64 width = 1;
+    optional int64 height = 2;
+  }
+  optional Size target_size = 8;
+
+  // Deprecated parameters
+  optional KinematicOptions kinematic_options = 2 [deprecated = true];
+  optional int64 min_motion_to_reframe = 4 [deprecated = true];
+  optional float min_vertical_zoom = 5 [default = 1, deprecated = true];
+  optional int64 frames_before_zoomout = 3 [default = 30, deprecated = true];
+}
diff --git a/mediapipe/examples/desktop/autoflip/calculators/content_zooming_calculator_test.cc b/mediapipe/examples/desktop/autoflip/calculators/content_zooming_calculator_test.cc
new file mode 100644
index 000000000..e7398d255
--- /dev/null
+++ b/mediapipe/examples/desktop/autoflip/calculators/content_zooming_calculator_test.cc
@@ -0,0 +1,242 @@
+// Copyright 2019 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include <memory>
+
+#include "mediapipe/examples/desktop/autoflip/autoflip_messages.pb.h"
+#include "mediapipe/examples/desktop/autoflip/calculators/content_zooming_calculator.pb.h"
+#include "mediapipe/framework/calculator_framework.h"
+#include "mediapipe/framework/calculator_runner.h"
+#include "mediapipe/framework/formats/image_frame.h"
+#include "mediapipe/framework/formats/image_frame_opencv.h"
+#include "mediapipe/framework/port/benchmark.h"
+#include "mediapipe/framework/port/gmock.h"
+#include "mediapipe/framework/port/gtest.h"
+#include "mediapipe/framework/port/opencv_core_inc.h"
+#include "mediapipe/framework/port/parse_text_proto.h"
+#include "mediapipe/framework/port/ret_check.h"
+#include "mediapipe/framework/port/status.h"
+#include "mediapipe/framework/port/status_matchers.h"
+
+namespace mediapipe {
+namespace autoflip {
+namespace {
+
+const char kConfigA[] = R"(
+    calculator: "ContentZoomingCalculator"
+    input_stream: "VIDEO:camera_frames"
+    input_stream: "DETECTIONS:detection_set"
+    output_stream: "BORDERS:borders"
+    )";
+
+const char kConfigB[] = R"(
+    calculator: "ContentZoomingCalculator"
+    input_stream: "VIDEO:camera_frames"
+    input_stream: "DETECTIONS:detection_set"
+    output_stream: "BORDERS:borders"
+    options: {
+      [mediapipe.autoflip.ContentZoomingCalculatorOptions.ext]: {
+        target_size {
+          width: 1000
+          height: 500
+        }
+      }
+    }
+    )";
+
+const char kConfigC[] = R"(
+    calculator: "ContentZoomingCalculator"
+    input_stream: "VIDEO_SIZE:size"
+    input_stream: "DETECTIONS:detection_set"
+    output_stream: "BORDERS:borders"
+    )";
+
+void CheckBorder(const StaticFeatures& static_features, int width, int height,
+                 int top_border, int bottom_border) {
+  ASSERT_EQ(2, static_features.border().size());
+  auto part = static_features.border(0);
+  EXPECT_EQ(part.border_position().x(), 0);
+  EXPECT_EQ(part.border_position().y(), 0);
+  EXPECT_EQ(part.border_position().width(), width);
+  EXPECT_EQ(part.border_position().height(), top_border);
+  EXPECT_EQ(Border::TOP, part.relative_position());
+
+  part = static_features.border(1);
+  EXPECT_EQ(part.border_position().x(), 0);
+  EXPECT_EQ(part.border_position().y(), height - bottom_border);
+  EXPECT_EQ(part.border_position().width(), width);
+  EXPECT_EQ(part.border_position().height(), bottom_border);
+  EXPECT_EQ(Border::BOTTOM, part.relative_position());
+}
+
+TEST(ContentZoomingCalculatorTest, ZoomTest) {
+  auto runner = ::absl::make_unique<CalculatorRunner>(
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(kConfigA));
+  auto detection_set = std::make_unique<DetectionSet>();
+  auto* detection = detection_set->add_detections();
+  detection->set_only_required(true);
+  auto* location = detection->mutable_location_normalized();
+  location->set_height(.1);
+  location->set_width(.1);
+  location->set_x(.4);
+  location->set_y(.5);
+
+  auto input_frame =
+      ::absl::make_unique<ImageFrame>(ImageFormat::SRGB, 1000, 1000);
+  runner->MutableInputs()->Tag("VIDEO").packets.push_back(
+      Adopt(input_frame.release()).At(Timestamp(0)));
+
+  runner->MutableInputs()
+      ->Tag("DETECTIONS")
+      .packets.push_back(Adopt(detection_set.release()).At(Timestamp(0)));
+
+  // Run the calculator.
+  MP_ASSERT_OK(runner->Run());
+
+  const std::vector<Packet>& output_packets =
+      runner->Outputs().Tag("BORDERS").packets;
+  ASSERT_EQ(1, output_packets.size());
+  const auto& static_features = output_packets[0].Get<StaticFeatures>();
+  CheckBorder(static_features, 1000, 1000, 495, 395);
+}
+
+TEST(ContentZoomingCalculatorTest, MinAspectBorderValues) {
+  auto runner = ::absl::make_unique<CalculatorRunner>(
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(kConfigB));
+  auto detection_set = std::make_unique<DetectionSet>();
+  auto* detection = detection_set->add_detections();
+  detection->set_only_required(true);
+  auto* location = detection->mutable_location_normalized();
+  location->set_height(1);
+  location->set_width(1);
+  location->set_x(0);
+  location->set_y(0);
+
+  auto input_frame =
+      ::absl::make_unique<ImageFrame>(ImageFormat::SRGB, 1000, 1000);
+  runner->MutableInputs()->Tag("VIDEO").packets.push_back(
+      Adopt(input_frame.release()).At(Timestamp(0)));
+
+  runner->MutableInputs()
+      ->Tag("DETECTIONS")
+      .packets.push_back(Adopt(detection_set.release()).At(Timestamp(0)));
+
+  // Run the calculator.
+  MP_ASSERT_OK(runner->Run());
+
+  const std::vector<Packet>& output_packets =
+      runner->Outputs().Tag("BORDERS").packets;
+  ASSERT_EQ(1, output_packets.size());
+  const auto& static_features = output_packets[0].Get<StaticFeatures>();
+  CheckBorder(static_features, 1000, 1000, 250, 250);
+}
+
+TEST(ContentZoomingCalculatorTest, TwoFacesWide) {
+  auto runner = ::absl::make_unique<CalculatorRunner>(
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(kConfigA));
+  auto detection_set = std::make_unique<DetectionSet>();
+  auto* detection = detection_set->add_detections();
+  detection->set_only_required(true);
+  auto* location = detection->mutable_location_normalized();
+  location->set_height(.2);
+  location->set_width(.2);
+  location->set_x(.2);
+  location->set_y(.4);
+
+  location = detection->mutable_location_normalized();
+  location->set_height(.2);
+  location->set_width(.2);
+  location->set_x(.6);
+  location->set_y(.4);
+
+  auto input_frame =
+      ::absl::make_unique<ImageFrame>(ImageFormat::SRGB, 1000, 1000);
+  runner->MutableInputs()->Tag("VIDEO").packets.push_back(
+      Adopt(input_frame.release()).At(Timestamp(0)));
+
+  runner->MutableInputs()
+      ->Tag("DETECTIONS")
+      .packets.push_back(Adopt(detection_set.release()).At(Timestamp(0)));
+
+  // Run the calculator.
+  MP_ASSERT_OK(runner->Run());
+
+  const std::vector<Packet>& output_packets =
+      runner->Outputs().Tag("BORDERS").packets;
+  ASSERT_EQ(1, output_packets.size());
+  const auto& static_features = output_packets[0].Get<StaticFeatures>();
+
+  CheckBorder(static_features, 1000, 1000, 389, 389);
+}
+
+TEST(ContentZoomingCalculatorTest, NoDetectionOnInit) {
+  auto runner = ::absl::make_unique<CalculatorRunner>(
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(kConfigA));
+  auto detection_set = std::make_unique<DetectionSet>();
+
+  auto input_frame =
+      ::absl::make_unique<ImageFrame>(ImageFormat::SRGB, 1000, 1000);
+  runner->MutableInputs()->Tag("VIDEO").packets.push_back(
+      Adopt(input_frame.release()).At(Timestamp(0)));
+
+  runner->MutableInputs()
+      ->Tag("DETECTIONS")
+      .packets.push_back(Adopt(detection_set.release()).At(Timestamp(0)));
+
+  // Run the calculator.
+  MP_ASSERT_OK(runner->Run());
+
+  const std::vector<Packet>& output_packets =
+      runner->Outputs().Tag("BORDERS").packets;
+  ASSERT_EQ(1, output_packets.size());
+  const auto& static_features = output_packets[0].Get<StaticFeatures>();
+
+  CheckBorder(static_features, 1000, 1000, 0, 0);
+}
+
+TEST(ContentZoomingCalculatorTest, ZoomTestPairSize) {
+  auto runner = ::absl::make_unique<CalculatorRunner>(
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(kConfigC));
+  auto detection_set = std::make_unique<DetectionSet>();
+  auto* detection = detection_set->add_detections();
+  detection->set_only_required(true);
+  auto* location = detection->mutable_location_normalized();
+  location->set_height(.1);
+  location->set_width(.1);
+  location->set_x(.4);
+  location->set_y(.5);
+
+  auto input_size = ::absl::make_unique<std::pair<int, int>>(1000, 1000);
+  runner->MutableInputs()
+      ->Tag("VIDEO_SIZE")
+      .packets.push_back(Adopt(input_size.release()).At(Timestamp(0)));
+
+  runner->MutableInputs()
+      ->Tag("DETECTIONS")
+      .packets.push_back(Adopt(detection_set.release()).At(Timestamp(0)));
+
+  // Run the calculator.
+  MP_ASSERT_OK(runner->Run());
+
+  const std::vector<Packet>& output_packets =
+      runner->Outputs().Tag("BORDERS").packets;
+  ASSERT_EQ(1, output_packets.size());
+  const auto& static_features = output_packets[0].Get<StaticFeatures>();
+  CheckBorder(static_features, 1000, 1000, 495, 395);
+}
+
+}  // namespace
+}  // namespace autoflip
+
+}  // namespace mediapipe
diff --git a/mediapipe/examples/desktop/autoflip/calculators/face_to_region_calculator.cc b/mediapipe/examples/desktop/autoflip/calculators/face_to_region_calculator.cc
index f3333c91a..86f03cf7a 100644
--- a/mediapipe/examples/desktop/autoflip/calculators/face_to_region_calculator.cc
+++ b/mediapipe/examples/desktop/autoflip/calculators/face_to_region_calculator.cc
@@ -80,7 +80,9 @@ FaceToRegionCalculator::FaceToRegionCalculator() {}
 
 ::mediapipe::Status FaceToRegionCalculator::GetContract(
     mediapipe::CalculatorContract* cc) {
-  cc->Inputs().Tag("VIDEO").Set<ImageFrame>();
+  if (cc->Inputs().HasTag("VIDEO")) {
+    cc->Inputs().Tag("VIDEO").Set<ImageFrame>();
+  }
   cc->Inputs().Tag("FACES").Set<std::vector<mediapipe::Detection>>();
   cc->Outputs().Tag("REGIONS").Set<DetectionSet>();
   return ::mediapipe::OkStatus();
@@ -89,6 +91,17 @@ FaceToRegionCalculator::FaceToRegionCalculator() {}
 ::mediapipe::Status FaceToRegionCalculator::Open(
     mediapipe::CalculatorContext* cc) {
   options_ = cc->Options<FaceToRegionCalculatorOptions>();
+  if (!cc->Inputs().HasTag("VIDEO")) {
+    RET_CHECK(!options_.use_visual_scorer())
+        << "VIDEO input must be provided when using visual_scorer.";
+    RET_CHECK(!options_.export_individual_face_landmarks())
+        << "VIDEO input must be provided when export_individual_face_landmarks "
+           "is set true.";
+    RET_CHECK(!options_.export_bbox_from_landmarks())
+        << "VIDEO input must be provided when export_bbox_from_landmarks "
+           "is set true.";
+  }
+
   scorer_ = absl::make_unique<VisualScorer>(options_.scorer_options());
   frame_width_ = -1;
   frame_height_ = -1;
@@ -135,14 +148,19 @@ void FaceToRegionCalculator::ExtendSalientRegionWithPoint(
 
 ::mediapipe::Status FaceToRegionCalculator::Process(
     mediapipe::CalculatorContext* cc) {
-  if (cc->Inputs().Tag("VIDEO").Value().IsEmpty()) {
-    return ::mediapipe::UnknownErrorBuilder(MEDIAPIPE_LOC) << "No VIDEO input.";
+  if (cc->Inputs().HasTag("VIDEO") &&
+      cc->Inputs().Tag("VIDEO").Value().IsEmpty()) {
+    return ::mediapipe::UnknownErrorBuilder(MEDIAPIPE_LOC)
+           << "No VIDEO input at time " << cc->InputTimestamp().Seconds();
   }
 
-  cv::Mat frame =
-      mediapipe::formats::MatView(&cc->Inputs().Tag("VIDEO").Get<ImageFrame>());
-  frame_width_ = frame.cols;
-  frame_height_ = frame.rows;
+  cv::Mat frame;
+  if (cc->Inputs().HasTag("VIDEO")) {
+    frame = mediapipe::formats::MatView(
+        &cc->Inputs().Tag("VIDEO").Get<ImageFrame>());
+    frame_width_ = frame.cols;
+    frame_height_ = frame.rows;
+  }
 
   auto region_set = ::absl::make_unique<DetectionSet>();
   if (!cc->Inputs().Tag("FACES").Value().IsEmpty()) {
diff --git a/mediapipe/examples/desktop/autoflip/calculators/face_to_region_calculator_test.cc b/mediapipe/examples/desktop/autoflip/calculators/face_to_region_calculator_test.cc
index 971795ca7..4777c6e1d 100644
--- a/mediapipe/examples/desktop/autoflip/calculators/face_to_region_calculator_test.cc
+++ b/mediapipe/examples/desktop/autoflip/calculators/face_to_region_calculator_test.cc
@@ -40,6 +40,12 @@ const char kConfig[] = R"(
     output_stream: "REGIONS:regions"
     )";
 
+const char kConfigNoVideo[] = R"(
+    calculator: "FaceToRegionCalculator"
+    input_stream: "FACES:faces"
+    output_stream: "REGIONS:regions"
+    )";
+
 const char kFace1[] = R"(location_data {
            format: RELATIVE_BOUNDING_BOX
            relative_bounding_box {
@@ -88,13 +94,15 @@ const char kFace3[] = R"(location_data {
            relative_keypoints { x: 0 y: 0 }
          })";
 
-void SetInputs(CalculatorRunner* runner,
-               const std::vector<std::string>& faces) {
+void SetInputs(const std::vector<std::string>& faces, const bool include_video,
+               CalculatorRunner* runner) {
   // Setup an input video frame.
-  auto input_frame =
-      ::absl::make_unique<ImageFrame>(ImageFormat::SRGB, 800, 600);
-  runner->MutableInputs()->Tag("VIDEO").packets.push_back(
-      Adopt(input_frame.release()).At(Timestamp::PostStream()));
+  if (include_video) {
+    auto input_frame =
+        ::absl::make_unique<ImageFrame>(ImageFormat::SRGB, 800, 600);
+    runner->MutableInputs()->Tag("VIDEO").packets.push_back(
+        Adopt(input_frame.release()).At(Timestamp::PostStream()));
+  }
   // Setup two faces as input.
   auto input_faces = ::absl::make_unique<std::vector<Detection>>();
   // A face with landmarks.
@@ -105,30 +113,31 @@ void SetInputs(CalculatorRunner* runner,
       Adopt(input_faces.release()).At(Timestamp::PostStream()));
 }
 
-CalculatorGraphConfig::Node MakeConfig(bool whole_face, bool landmarks,
-                                       bool bb_from_landmarks) {
-  auto config = ParseTextProtoOrDie<CalculatorGraphConfig::Node>(kConfig);
-
+CalculatorGraphConfig::Node MakeConfig(std::string base_config, bool whole_face,
+                                       bool landmarks, bool bb_from_landmarks,
+                                       bool visual_scoring) {
+  auto config = ParseTextProtoOrDie<CalculatorGraphConfig::Node>(base_config);
   config.mutable_options()
       ->MutableExtension(FaceToRegionCalculatorOptions::ext)
       ->set_export_whole_face(whole_face);
-
   config.mutable_options()
       ->MutableExtension(FaceToRegionCalculatorOptions::ext)
       ->set_export_individual_face_landmarks(landmarks);
-
   config.mutable_options()
       ->MutableExtension(FaceToRegionCalculatorOptions::ext)
       ->set_export_bbox_from_landmarks(bb_from_landmarks);
+  config.mutable_options()
+      ->MutableExtension(FaceToRegionCalculatorOptions::ext)
+      ->set_use_visual_scorer(visual_scoring);
 
   return config;
 }
 
 TEST(FaceToRegionCalculatorTest, FaceFullTypeSize) {
   // Setup test
-  auto runner =
-      ::absl::make_unique<CalculatorRunner>(MakeConfig(true, false, false));
-  SetInputs(runner.get(), {kFace1, kFace2});
+  auto runner = ::absl::make_unique<CalculatorRunner>(
+      MakeConfig(kConfig, true, false, false, true));
+  SetInputs({kFace1, kFace2}, true, runner.get());
 
   // Run the calculator.
   MP_ASSERT_OK(runner->Run());
@@ -159,9 +168,9 @@ TEST(FaceToRegionCalculatorTest, FaceFullTypeSize) {
 
 TEST(FaceToRegionCalculatorTest, FaceLandmarksTypeSize) {
   // Setup test
-  auto runner =
-      ::absl::make_unique<CalculatorRunner>(MakeConfig(false, true, false));
-  SetInputs(runner.get(), {kFace1});
+  auto runner = ::absl::make_unique<CalculatorRunner>(
+      MakeConfig(kConfig, false, true, false, true));
+  SetInputs({kFace1}, true, runner.get());
 
   // Run the calculator.
   MP_ASSERT_OK(runner->Run());
@@ -190,9 +199,9 @@ TEST(FaceToRegionCalculatorTest, FaceLandmarksTypeSize) {
 
 TEST(FaceToRegionCalculatorTest, FaceLandmarksBox) {
   // Setup test
-  auto runner =
-      ::absl::make_unique<CalculatorRunner>(MakeConfig(false, false, true));
-  SetInputs(runner.get(), {kFace1});
+  auto runner = ::absl::make_unique<CalculatorRunner>(
+      MakeConfig(kConfig, false, false, true, true));
+  SetInputs({kFace1}, true, runner.get());
 
   // Run the calculator.
   MP_ASSERT_OK(runner->Run());
@@ -225,9 +234,9 @@ TEST(FaceToRegionCalculatorTest, FaceLandmarksBox) {
 
 TEST(FaceToRegionCalculatorTest, FaceScore) {
   // Setup test
-  auto runner =
-      ::absl::make_unique<CalculatorRunner>(MakeConfig(true, false, false));
-  SetInputs(runner.get(), {kFace3});
+  auto runner = ::absl::make_unique<CalculatorRunner>(
+      MakeConfig(kConfig, true, false, false, true));
+  SetInputs({kFace3}, true, runner.get());
 
   // Run the calculator.
   MP_ASSERT_OK(runner->Run());
@@ -242,6 +251,69 @@ TEST(FaceToRegionCalculatorTest, FaceScore) {
   EXPECT_FLOAT_EQ(landmark_1.score(), 0.25);
 }
 
+TEST(FaceToRegionCalculatorTest, FaceNoVideoVisualScoreFail) {
+  // Node without a VIDEO stream, but with use_visual_scorer switched on.
+  const auto node = MakeConfig(kConfigNoVideo, true, false, false, true);
+  CalculatorRunner runner(node);
+  SetInputs({kFace3}, /*include_video=*/false, &runner);
+
+  // The run must report an error.
+  ASSERT_FALSE(runner.Run().ok());
+}
+
+TEST(FaceToRegionCalculatorTest, FaceNoVideoLandmarksFail) {
+  // Node without a VIDEO stream, but exporting individual face landmarks.
+  const auto node = MakeConfig(kConfigNoVideo, false, true, false, false);
+  CalculatorRunner runner(node);
+  SetInputs({kFace3}, /*include_video=*/false, &runner);
+
+  // The run must report an error.
+  ASSERT_FALSE(runner.Run().ok());
+}
+
+TEST(FaceToRegionCalculatorTest, FaceNoVideoBBLandmarksFail) {
+  // Node without a VIDEO stream, but exporting a bbox built from landmarks.
+  const auto node = MakeConfig(kConfigNoVideo, false, false, true, false);
+  CalculatorRunner runner(node);
+  SetInputs({kFace3}, /*include_video=*/false, &runner);
+
+  // The run must report an error.
+  ASSERT_FALSE(runner.Run().ok());
+}
+
+TEST(FaceToRegionCalculatorTest, FaceNoVideoPass) {
+  // Whole-face export only: none of the options that Open() rejects for a
+  // node without a VIDEO stream is enabled.
+  const auto node = MakeConfig(kConfigNoVideo, true, false, false, false);
+  CalculatorRunner runner(node);
+  SetInputs({kFace1, kFace2}, /*include_video=*/false, &runner);
+  MP_ASSERT_OK(runner.Run());
+
+  // Exactly one REGIONS packet, holding one detection per input face.
+  const auto& region_packets = runner.Outputs().Tag("REGIONS").packets;
+  ASSERT_EQ(1, region_packets.size());
+  const auto& region_set = region_packets[0].Get<DetectionSet>();
+  ASSERT_EQ(2, region_set.detections().size());
+
+  // First face.
+  const auto& first = region_set.detections(0);
+  EXPECT_EQ(first.signal_type().standard(), SignalType::FACE_FULL);
+  EXPECT_FLOAT_EQ(first.location_normalized().x(), 0);
+  EXPECT_FLOAT_EQ(first.location_normalized().y(), 0.003333);
+  EXPECT_FLOAT_EQ(first.location_normalized().width(), 0.12125);
+  EXPECT_FLOAT_EQ(first.location_normalized().height(), 0.33333);
+  EXPECT_FLOAT_EQ(first.score(), 1);
+
+  // Second face.
+  const auto& second = region_set.detections(1);
+  EXPECT_EQ(second.signal_type().standard(), SignalType::FACE_FULL);
+  EXPECT_FLOAT_EQ(second.location_normalized().x(), 0.0025);
+  EXPECT_FLOAT_EQ(second.location_normalized().y(), 0.005);
+  EXPECT_FLOAT_EQ(second.location_normalized().width(), 0.25);
+  EXPECT_FLOAT_EQ(second.location_normalized().height(), 0.5);
+  EXPECT_FLOAT_EQ(second.score(), 1);
+}
+
 }  // namespace
 }  // namespace autoflip
 }  // namespace mediapipe
diff --git a/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.cc b/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.cc
index 2b0a743db..a8ba3eeb9 100644
--- a/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.cc
+++ b/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.cc
@@ -24,6 +24,7 @@
 #include "mediapipe/framework/calculator_framework.h"
 #include "mediapipe/framework/formats/image_frame.h"
 #include "mediapipe/framework/formats/image_frame_opencv.h"
+#include "mediapipe/framework/port/canonical_errors.h"
 #include "mediapipe/framework/port/opencv_core_inc.h"
 #include "mediapipe/framework/port/opencv_imgproc_inc.h"
 #include "mediapipe/framework/port/parse_text_proto.h"
@@ -35,6 +36,7 @@ namespace mediapipe {
 namespace autoflip {
 
 constexpr char kInputVideoFrames[] = "VIDEO_FRAMES";
+constexpr char kInputVideoSize[] = "VIDEO_SIZE";
 constexpr char kInputKeyFrames[] = "KEY_FRAMES";
 constexpr char kInputDetections[] = "DETECTION_FEATURES";
 constexpr char kInputStaticFeatures[] = "STATIC_FEATURES";
@@ -49,8 +51,17 @@ constexpr char kAspectRatio[] = "EXTERNAL_ASPECT_RATIO";
 // SALIENT_POINT_FRAME_VIZ_FRAMES can only be enabled when CROPPED_FRAMES is
 // enabled.
 constexpr char kOutputCroppedFrames[] = "CROPPED_FRAMES";
+// Shows detections on key frames.  Any static borders will be removed from the
+// output frame.
 constexpr char kOutputKeyFrameCropViz[] = "KEY_FRAME_CROP_REGION_VIZ_FRAMES";
+// Shows x/y (raw unsmoothed) cropping and focus points.  Any static borders
+// will be removed from the output frame.
 constexpr char kOutputFocusPointFrameViz[] = "SALIENT_POINT_FRAME_VIZ_FRAMES";
+// Shows final smoothed cropping and a focused area of the camera.  Any static
+// borders will remain and be shown in grey.  Output frame will match input
+// frame size.
+constexpr char kOutputFramingAndDetections[] = "FRAMING_DETECTIONS_VIZ_FRAMES";
+// Final summary of cropping.
 constexpr char kOutputSummary[] = "CROPPING_SUMMARY";
 
 // External rendering outputs
@@ -65,7 +76,12 @@ constexpr char kExternalRenderingFullVid[] = "EXTERNAL_RENDERING_FULL_VID";
   if (cc->InputSidePackets().HasTag(kAspectRatio)) {
     cc->InputSidePackets().Tag(kAspectRatio).Set<std::string>();
   }
-  cc->Inputs().Tag(kInputVideoFrames).Set<ImageFrame>();
+  if (cc->Inputs().HasTag(kInputVideoFrames)) {
+    cc->Inputs().Tag(kInputVideoFrames).Set<ImageFrame>();
+  }
+  if (cc->Inputs().HasTag(kInputVideoSize)) {
+    cc->Inputs().Tag(kInputVideoSize).Set<std::pair<int, int>>();
+  }
   if (cc->Inputs().HasTag(kInputKeyFrames)) {
     cc->Inputs().Tag(kInputKeyFrames).Set<ImageFrame>();
   }
@@ -73,7 +89,9 @@ constexpr char kExternalRenderingFullVid[] = "EXTERNAL_RENDERING_FULL_VID";
   if (cc->Inputs().HasTag(kInputStaticFeatures)) {
     cc->Inputs().Tag(kInputStaticFeatures).Set<StaticFeatures>();
   }
-  cc->Inputs().Tag(kInputShotBoundaries).Set<bool>();
+  if (cc->Inputs().HasTag(kInputShotBoundaries)) {
+    cc->Inputs().Tag(kInputShotBoundaries).Set<bool>();
+  }
 
   if (cc->Outputs().HasTag(kOutputCroppedFrames)) {
     cc->Outputs().Tag(kOutputCroppedFrames).Set<ImageFrame>();
@@ -84,6 +102,12 @@ constexpr char kExternalRenderingFullVid[] = "EXTERNAL_RENDERING_FULL_VID";
            "CROPPED_FRAMES is specified.";
     cc->Outputs().Tag(kOutputKeyFrameCropViz).Set<ImageFrame>();
   }
+  if (cc->Outputs().HasTag(kOutputFramingAndDetections)) {
+    RET_CHECK(cc->Outputs().HasTag(kOutputCroppedFrames))
+        << "FRAMING_DETECTIONS_VIZ_FRAMES can only be used when "
+           "CROPPED_FRAMES is specified.";
+    cc->Outputs().Tag(kOutputFramingAndDetections).Set<ImageFrame>();
+  }
   if (cc->Outputs().HasTag(kOutputFocusPointFrameViz)) {
     RET_CHECK(cc->Outputs().HasTag(kOutputCroppedFrames))
         << "SALIENT_POINT_FRAME_VIZ_FRAMES can only be used when "
@@ -101,6 +125,13 @@ constexpr char kExternalRenderingFullVid[] = "EXTERNAL_RENDERING_FULL_VID";
         .Tag(kExternalRenderingFullVid)
         .Set<std::vector<ExternalRenderFrame>>();
   }
+  RET_CHECK(cc->Inputs().HasTag(kInputVideoFrames) ^
+            cc->Inputs().HasTag(kInputVideoSize))
+      << "VIDEO_FRAMES or VIDEO_SIZE must be set and not both.";
+  RET_CHECK(!(cc->Inputs().HasTag(kInputVideoSize) &&
+              cc->Outputs().HasTag(kOutputCroppedFrames)))
+      << "CROPPED_FRAMES (internal cropping) has been set as an output without "
+         "VIDEO_FRAMES (video data) input.";
   RET_CHECK(cc->Outputs().HasTag(kExternalRenderingPerFrame) ||
             cc->Outputs().HasTag(kExternalRenderingFullVid) ||
             cc->Outputs().HasTag(kOutputCroppedFrames))
@@ -128,7 +159,12 @@ constexpr char kExternalRenderingFullVid[] = "EXTERNAL_RENDERING_FULL_VID";
   RET_CHECK(overlay_opacity_ >= 0.0 && overlay_opacity_ <= 1.0)
       << "Overlay opacity " << overlay_opacity_ << " is not in [0, 1].";
 
-  scene_cropper_ = absl::make_unique<SceneCropper>();
+  // Set default camera model to polynomial_path_solver.
+  if (!options_.camera_motion_options().has_kinematic_options()) {
+    options_.mutable_camera_motion_options()
+        ->mutable_polynomial_path_solver()
+        ->set_prior_frame_buffer_size(options_.prior_frame_buffer_size());
+  }
   if (cc->Outputs().HasTag(kOutputSummary)) {
     summary_ = absl::make_unique<VideoCroppingSummary>();
   }
@@ -137,6 +173,8 @@ constexpr char kExternalRenderingFullVid[] = "EXTERNAL_RENDERING_FULL_VID";
         absl::make_unique<std::vector<ExternalRenderFrame>>();
   }
   should_perform_frame_cropping_ = cc->Outputs().HasTag(kOutputCroppedFrames);
+  scene_camera_motion_analyzer_ = absl::make_unique<SceneCameraMotionAnalyzer>(
+      options_.scene_camera_motion_analyzer_options());
   return ::mediapipe::OkStatus();
 }
 
@@ -182,44 +220,59 @@ void ConstructExternalRenderMessage(
   padding_color_message->set_b(padding_color[2]);
   external_render_message->set_timestamp_us(timestamp_us);
 }
+
+double GetRatio(int width, int height) {  // Ratio width / height as double.
+  return width / static_cast<double>(height);
+}
+
+// Rounds to the nearest int; a result with remainder 1 mod 2 is lowered by
+// one, but never below 2.  Other results are returned as rounded.
+int RoundToEven(float value) {
+  const int nearest = std::round(value);
+  const bool is_odd = nearest % 2 == 1;
+  return is_odd ? std::max(2, nearest - 1) : nearest;
+}
+
 }  // namespace
 
-::mediapipe::Status SceneCroppingCalculator::Process(
+::mediapipe::Status SceneCroppingCalculator::InitializeSceneCroppingCalculator(
     ::mediapipe::CalculatorContext* cc) {
-  // Sets frame dimension and format.
-  if (frame_width_ < 0 &&
-      !cc->Inputs().Tag(kInputVideoFrames).Value().IsEmpty()) {
+  if (cc->Inputs().HasTag(kInputVideoFrames)) {
     const auto& frame = cc->Inputs().Tag(kInputVideoFrames).Get<ImageFrame>();
     frame_width_ = frame.Width();
-    RET_CHECK_GT(frame_width_, 0) << "Input frame width is non-positive.";
     frame_height_ = frame.Height();
-    RET_CHECK_GT(frame_height_, 0) << "Input frame height is non-positive.";
     frame_format_ = frame.Format();
-    target_width_ = options_.target_width();
-    target_height_ = options_.target_height();
-    if (cc->InputSidePackets().HasTag(kInputExternalSettings)) {
-      auto conversion_options = ParseTextProtoOrDie<ConversionOptions>(
-          cc->InputSidePackets()
-              .Tag(kInputExternalSettings)
-              .Get<std::string>());
-      target_width_ = conversion_options.target_width();
-      target_height_ = conversion_options.target_height();
-    }
-    target_aspect_ratio_ = static_cast<double>(target_width_) / target_height_;
-    RET_CHECK_NE(options_.target_size_type(),
-                 SceneCroppingCalculatorOptions::UNKNOWN)
-        << "TargetSizeType not set properly.";
-    // Resets target size if keep original height or width.
-    if (options_.target_size_type() ==
-        SceneCroppingCalculatorOptions::KEEP_ORIGINAL_HEIGHT) {
-      target_height_ = frame_height_;
-      target_width_ = std::round(target_height_ * target_aspect_ratio_);
-    } else if (options_.target_size_type() ==
-               SceneCroppingCalculatorOptions::KEEP_ORIGINAL_WIDTH) {
-      target_width_ = frame_width_;
-      target_height_ = std::round(target_width_ / target_aspect_ratio_);
-    } else if (options_.target_size_type() ==
-               SceneCroppingCalculatorOptions::MAXIMIZE_TARGET_DIMENSION) {
+  } else if (cc->Inputs().HasTag(kInputVideoSize)) {
+    frame_width_ =
+        cc->Inputs().Tag(kInputVideoSize).Get<std::pair<int, int>>().first;
+    frame_height_ =
+        cc->Inputs().Tag(kInputVideoSize).Get<std::pair<int, int>>().second;
+  } else {
+    return ::mediapipe::UnknownErrorBuilder(MEDIAPIPE_LOC)
+           << "Input VIDEO or VIDEO_SIZE must be provided.";
+  }
+  RET_CHECK_GT(frame_height_, 0) << "Input frame height is non-positive.";
+  RET_CHECK_GT(frame_width_, 0) << "Input frame width is non-positive.";
+
+  // Calculate target width and height.
+  switch (options_.target_size_type()) {
+    case SceneCroppingCalculatorOptions::KEEP_ORIGINAL_HEIGHT:
+      RET_CHECK(options_.has_target_width() && options_.has_target_height())
+          << "Target width and height have to be specified.";
+      target_height_ = RoundToEven(frame_height_);
+      target_width_ =
+          RoundToEven(target_height_ * GetRatio(options_.target_width(),
+                                                options_.target_height()));
+      break;
+    case SceneCroppingCalculatorOptions::KEEP_ORIGINAL_WIDTH:
+      RET_CHECK(options_.has_target_width() && options_.has_target_height())
+          << "Target width and height have to be specified.";
+      target_width_ = RoundToEven(frame_width_);
+      target_height_ =
+          RoundToEven(target_width_ / GetRatio(options_.target_width(),
+                                               options_.target_height()));
+      break;
+    case SceneCroppingCalculatorOptions::MAXIMIZE_TARGET_DIMENSION: {
       RET_CHECK(cc->InputSidePackets().HasTag(kAspectRatio))
           << "MAXIMIZE_TARGET_DIMENSION is set without an "
              "external_aspect_ratio";
@@ -228,49 +281,81 @@ void ConstructExternalRenderMessage(
           cc->InputSidePackets().Tag(kAspectRatio).Get<std::string>(),
           &requested_aspect_ratio));
       const double original_aspect_ratio =
-          static_cast<double>(frame_width_) / frame_height_;
+          GetRatio(frame_width_, frame_height_);
       if (original_aspect_ratio > requested_aspect_ratio) {
-        target_height_ = frame_height_;
-        target_width_ = std::round(target_height_ * requested_aspect_ratio);
+        target_height_ = RoundToEven(frame_height_);
+        target_width_ = RoundToEven(target_height_ * requested_aspect_ratio);
       } else {
-        target_width_ = frame_width_;
-        target_height_ = std::round(target_width_ / requested_aspect_ratio);
+        target_width_ = RoundToEven(frame_width_);
+        target_height_ = RoundToEven(target_width_ / requested_aspect_ratio);
       }
+      break;
     }
-    // Makes sure that target size is even if keep original width or height.
-    if (options_.target_size_type() !=
-        SceneCroppingCalculatorOptions::USE_TARGET_DIMENSION) {
-      if (target_width_ % 2 == 1) {
-        target_width_ = std::max(2, target_width_ - 1);
-      }
-      if (target_height_ % 2 == 1) {
-        target_height_ = std::max(2, target_height_ - 1);
-      }
-      target_aspect_ratio_ =
-          static_cast<double>(target_width_) / target_height_;
-    }
-    // Set keyframe width/height for feature upscaling (overwritten by keyframe
-    // input if provided).
-    if (options_.has_video_features_width() &&
-        options_.has_video_features_height()) {
-      key_frame_width_ = options_.video_features_width();
-      key_frame_height_ = options_.video_features_height();
-    } else if (!cc->Inputs().HasTag(kInputKeyFrames)) {
-      key_frame_width_ = frame_width_;
-      key_frame_height_ = frame_height_;
-    }
-    // Check provided dimensions.
-    RET_CHECK_GT(target_width_, 0) << "Target width is non-positive.";
-    RET_CHECK_NE(target_width_ % 2, 1)
-        << "Target width cannot be odd, because encoder expects dimension "
-           "values to be even.";
-    RET_CHECK_GT(target_height_, 0) << "Target height is non-positive.";
-    RET_CHECK_NE(target_height_ % 2, 1)
-        << "Target height cannot be odd, because encoder expects dimension "
-           "values to be even.";
+    case SceneCroppingCalculatorOptions::USE_TARGET_DIMENSION:
+      RET_CHECK(options_.has_target_width() && options_.has_target_height())
+          << "Target width and height have to be specified.";
+      target_width_ = options_.target_width();
+      target_height_ = options_.target_height();
+      break;
+    case SceneCroppingCalculatorOptions::KEEP_ORIGINAL_DIMENSION:
+      target_width_ = frame_width_;
+      target_height_ = frame_height_;
+      break;
+    case SceneCroppingCalculatorOptions::UNKNOWN:
+      return mediapipe::InvalidArgumentError(
+          "target_size_type not set properly.");
+  }
+  target_aspect_ratio_ = GetRatio(target_width_, target_height_);
+
+  // Set keyframe width/height for feature upscaling.
+  RET_CHECK(!(cc->Inputs().HasTag(kInputKeyFrames) &&
+              (options_.has_video_features_width() ||
+               options_.has_video_features_height())))
+      << "Key frame size must be defined by either providing the input stream "
+         "KEY_FRAMES or setting video_features_width/video_features_height as "
+         "calculator options.  Both methods cannot be used together.";
+  if (options_.has_video_features_width() &&
+      options_.has_video_features_height()) {
+    key_frame_width_ = options_.video_features_width();
+    key_frame_height_ = options_.video_features_height();
+  } else if (!cc->Inputs().HasTag(kInputKeyFrames)) {
+    key_frame_width_ = frame_width_;
+    key_frame_height_ = frame_height_;
+  }
+  // Check provided dimensions.
+  RET_CHECK_GT(target_width_, 0) << "Target width is non-positive.";
+  // TODO: it seems this check is too strict and maybe limiting,
+  // considering the receiver of frames can be something other than encoder.
+  RET_CHECK_NE(target_width_ % 2, 1)
+      << "Target width cannot be odd, because encoder expects dimension "
+         "values to be even.";
+  RET_CHECK_GT(target_height_, 0) << "Target height is non-positive.";
+  RET_CHECK_NE(target_height_ % 2, 1)
+      << "Target height cannot be odd, because encoder expects dimension "
+         "values to be even.";
+
+  scene_cropper_ = absl::make_unique<SceneCropper>(
+      options_.camera_motion_options(), frame_width_, frame_height_);
+
+  return ::mediapipe::OkStatus();
+}
+
+// Whether the frame input in use (VIDEO_FRAMES, else VIDEO_SIZE) is non-empty.
+bool HasFrameSignal(::mediapipe::CalculatorContext* cc) {
+  const bool has_frames = cc->Inputs().HasTag(kInputVideoFrames);
+  const char* const tag = has_frames ? kInputVideoFrames : kInputVideoSize;
+  return !cc->Inputs().Tag(tag).Value().IsEmpty();
+}
+
+::mediapipe::Status SceneCroppingCalculator::Process(
+    ::mediapipe::CalculatorContext* cc) {
+  // Sets frame dimension and initializes scenecroppingcalculator on first video
+  // frame.
+  if (frame_width_ < 0) {
+    MP_RETURN_IF_ERROR(InitializeSceneCroppingCalculator(cc));
   }
 
-  // Sets key frame dimension.
+  // Sets key frame dimension on first keyframe.
   if (cc->Inputs().HasTag(kInputKeyFrames) &&
       !cc->Inputs().Tag(kInputKeyFrames).Value().IsEmpty() &&
       key_frame_width_ < 0) {
@@ -281,21 +366,18 @@ void ConstructExternalRenderMessage(
 
   // Processes a scene when shot boundary or buffer is full.
   bool is_end_of_scene = false;
-  if (!cc->Inputs().Tag(kInputShotBoundaries).Value().IsEmpty()) {
+  if (cc->Inputs().HasTag(kInputShotBoundaries) &&
+      !cc->Inputs().Tag(kInputShotBoundaries).Value().IsEmpty()) {
     is_end_of_scene = cc->Inputs().Tag(kInputShotBoundaries).Get<bool>();
   }
-  const bool force_buffer_flush =
-      scene_frame_timestamps_.size() >= options_.max_scene_size();
-  if (!scene_frame_timestamps_.empty() &&
-      (is_end_of_scene || force_buffer_flush)) {
+
+  if (!scene_frame_timestamps_.empty() && (is_end_of_scene)) {
+    continue_last_scene_ = false;
     MP_RETURN_IF_ERROR(ProcessScene(is_end_of_scene, cc));
   }
 
   // Saves frame and timestamp and whether it is a key frame.
-  if (!cc->Inputs().Tag(kInputVideoFrames).Value().IsEmpty()) {
-    LOG_EVERY_N(ERROR, 10)
-        << "------------------------ (Breathing) Time(s): "
-        << cc->Inputs().Tag(kInputVideoFrames).Value().Timestamp().Seconds();
+  if (HasFrameSignal(cc)) {
     // Only buffer frames if |should_perform_frame_cropping_| is true.
     if (should_perform_frame_cropping_) {
       const auto& frame = cc->Inputs().Tag(kInputVideoFrames).Get<ImageFrame>();
@@ -328,6 +410,13 @@ void ConstructExternalRenderMessage(
     static_features_timestamps_.push_back(cc->InputTimestamp().Value());
   }
 
+  const bool force_buffer_flush =
+      scene_frame_timestamps_.size() >= options_.max_scene_size();
+  if (!scene_frame_timestamps_.empty() && force_buffer_flush) {
+    MP_RETURN_IF_ERROR(ProcessScene(is_end_of_scene, cc));
+    continue_last_scene_ = true;
+  }
+
   return ::mediapipe::OkStatus();
 }
 
@@ -352,7 +441,7 @@ void ConstructExternalRenderMessage(
 // TODO: split this function into two, one for calculating the border
 // sizes, the other for the actual removal of borders from the frames.
 ::mediapipe::Status SceneCroppingCalculator::RemoveStaticBorders(
-    int* top_border_size, int* bottom_border_size) {
+    CalculatorContext* cc, int* top_border_size, int* bottom_border_size) {
   *top_border_size = 0;
   *bottom_border_size = 0;
   MP_RETURN_IF_ERROR(ComputeSceneStaticBordersSize(
@@ -363,6 +452,13 @@ void ConstructExternalRenderMessage(
   effective_frame_height_ =
       frame_height_ - top_border_distance_ - bottom_border_distance;
 
+  // Store shallow copy of the original frames for debug display if required
+  // before static areas are removed.
+  if (cc->Outputs().HasTag(kOutputFramingAndDetections)) {
+    raw_scene_frames_or_empty_ = {scene_frames_or_empty_.begin(),
+                                  scene_frames_or_empty_.end()};
+  }
+
   if (top_border_distance_ > 0 || bottom_border_distance > 0) {
     VLOG(1) << "Remove top border " << top_border_distance_ << " bottom border "
             << bottom_border_distance;
@@ -442,8 +538,8 @@ void SceneCroppingCalculator::FilterKeyFrameInfo() {
 
   // Removes any static borders.
   int top_static_border_size, bottom_static_border_size;
-  MP_RETURN_IF_ERROR(
-      RemoveStaticBorders(&top_static_border_size, &bottom_static_border_size));
+  MP_RETURN_IF_ERROR(RemoveStaticBorders(cc, &top_static_border_size,
+                                         &bottom_static_border_size));
 
   // Decides if solid background color padding is possible and sets up color
   // interpolation functions in CIELAB. Uses linear interpolation by default.
@@ -453,7 +549,8 @@ void SceneCroppingCalculator::FilterKeyFrameInfo() {
       &has_solid_background_, &background_color_l_function_,
       &background_color_a_function_, &background_color_b_function_));
 
-  // Computes key frame crop regions.
+  // Computes key frame crop regions and moves information from raw
+  // key_frame_infos_ to key_frame_crop_results.
   MP_RETURN_IF_ERROR(InitializeFrameCropRegionComputer());
   const int num_key_frames = key_frame_infos_.size();
   std::vector<KeyFrameCropResult> key_frame_crop_results(num_key_frames);
@@ -462,20 +559,15 @@ void SceneCroppingCalculator::FilterKeyFrameInfo() {
         key_frame_infos_[i], &key_frame_crop_results[i]));
   }
 
-  // Analyzes scene camera motion and generates FocusPointFrames.
-  auto analyzer_options = options_.scene_camera_motion_analyzer_options();
-  analyzer_options.set_allow_sweeping(analyzer_options.allow_sweeping() &&
-                                      !has_solid_background_);
-  scene_camera_motion_analyzer_ =
-      absl::make_unique<SceneCameraMotionAnalyzer>(analyzer_options);
   SceneKeyFrameCropSummary scene_summary;
   std::vector<FocusPointFrame> focus_point_frames;
   SceneCameraMotion scene_camera_motion;
   MP_RETURN_IF_ERROR(
       scene_camera_motion_analyzer_->AnalyzeSceneAndPopulateFocusPointFrames(
-          key_frame_infos_, key_frame_crop_options_, key_frame_crop_results,
-          frame_width_, effective_frame_height_, scene_frame_timestamps_,
-          &scene_summary, &focus_point_frames, &scene_camera_motion));
+          key_frame_crop_options_, key_frame_crop_results, frame_width_,
+          effective_frame_height_, scene_frame_timestamps_,
+          has_solid_background_, &scene_summary, &focus_point_frames,
+          &scene_camera_motion));
 
   // Crops scene frames.
   std::vector<cv::Mat> cropped_frames;
@@ -485,26 +577,28 @@ void SceneCroppingCalculator::FilterKeyFrameInfo() {
       should_perform_frame_cropping_ ? &cropped_frames : nullptr;
 
   MP_RETURN_IF_ERROR(scene_cropper_->CropFrames(
-      scene_summary, scene_frame_timestamps_.size(), scene_frames_or_empty_,
-      focus_point_frames, prior_focus_point_frames_, top_static_border_size,
-      bottom_static_border_size, &crop_from_locations, cropped_frames_ptr));
+      scene_summary, scene_frame_timestamps_, is_key_frames_,
+      scene_frames_or_empty_, focus_point_frames, prior_focus_point_frames_,
+      top_static_border_size, bottom_static_border_size, continue_last_scene_,
+      &crop_from_locations, cropped_frames_ptr));
 
   // Formats and outputs cropped frames.
   bool apply_padding = false;
   float vertical_fill_percent;
   std::vector<cv::Rect> render_to_locations;
   std::vector<cv::Scalar> padding_colors;
-  if (should_perform_frame_cropping_) {
-    MP_RETURN_IF_ERROR(FormatAndOutputCroppedFrames(
-        cropped_frames, &render_to_locations, &apply_padding, &padding_colors,
-        &vertical_fill_percent, cc));
-  }
+  MP_RETURN_IF_ERROR(FormatAndOutputCroppedFrames(
+      scene_summary.crop_window_width(), scene_summary.crop_window_height(),
+      scene_frame_timestamps_.size(), &render_to_locations, &apply_padding,
+      &padding_colors, &vertical_fill_percent, cropped_frames_ptr, cc));
   // Caches prior FocusPointFrames if this was not the end of a scene.
   prior_focus_point_frames_.clear();
   if (!is_end_of_scene) {
     const int start =
         std::max(0, static_cast<int>(scene_frame_timestamps_.size()) -
-                        options_.prior_frame_buffer_size());
+                        options_.camera_motion_options()
+                            .polynomial_path_solver()
+                            .prior_frame_buffer_size());
     for (int i = start; i < num_key_frames; ++i) {
       prior_focus_point_frames_.push_back(focus_point_frames[i]);
     }
@@ -512,6 +606,7 @@ void SceneCroppingCalculator::FilterKeyFrameInfo() {
 
   // Optionally outputs visualization frames.
   MP_RETURN_IF_ERROR(OutputVizFrames(key_frame_crop_results, focus_point_frames,
+                                     crop_from_locations,
                                      scene_summary.crop_window_width(),
                                      scene_summary.crop_window_height(), cc));
 
@@ -563,18 +658,13 @@ void SceneCroppingCalculator::FilterKeyFrameInfo() {
 }
 
 ::mediapipe::Status SceneCroppingCalculator::FormatAndOutputCroppedFrames(
-    const std::vector<cv::Mat>& cropped_frames,
+    const int crop_width, const int crop_height, const int num_frames,
     std::vector<cv::Rect>* render_to_locations, bool* apply_padding,
     std::vector<cv::Scalar>* padding_colors, float* vertical_fill_percent,
-    CalculatorContext* cc) {
+    const std::vector<cv::Mat>* cropped_frames_ptr, CalculatorContext* cc) {
   RET_CHECK(apply_padding) << "Has padding boolean is null.";
-  if (cropped_frames.empty()) {
-    return ::mediapipe::OkStatus();
-  }
 
   // Computes scaling factor and decides if padding is needed.
-  const int crop_width = cropped_frames.front().cols;
-  const int crop_height = cropped_frames.front().rows;
   VLOG(1) << "crop_width = " << crop_width << " crop_height = " << crop_height;
   const double scaling =
       std::max(static_cast<double>(target_width_) / crop_width,
@@ -602,7 +692,6 @@ void SceneCroppingCalculator::FilterKeyFrameInfo() {
   // Compute the "render to" location.  This is where the rect taken from the
   // input video gets pasted on the output frame.  For use with external
   // rendering solutions.
-  const int num_frames = cropped_frames.size();
   for (int i = 0; i < num_frames; i++) {
     if (*apply_padding) {
       render_to_locations->push_back(padder_->ComputeOutputLocation());
@@ -612,26 +701,11 @@ void SceneCroppingCalculator::FilterKeyFrameInfo() {
     }
   }
 
-  // Resizes cropped frames, pads frames, and output frames.
-  cv::Scalar* background_color = nullptr;
-  cv::Scalar interpolated_color;
+  // Compute padding colors.
   for (int i = 0; i < num_frames; ++i) {
     // Set default padding color to white.
     cv::Scalar padding_color_to_add = cv::Scalar(255, 255, 255);
     const int64 time_ms = scene_frame_timestamps_[i];
-    const Timestamp timestamp(time_ms);
-    auto scaled_frame = absl::make_unique<ImageFrame>(
-        frame_format_, scaled_width, scaled_height);
-    auto destination = formats::MatView(scaled_frame.get());
-    if (scaled_width == crop_width && scaled_height == crop_height) {
-      cropped_frames[i].copyTo(destination);
-    } else {
-      // cubic is better quality for upscaling and area is good for downscaling
-      const int interpolation_method =
-          scaling > 1 ? cv::INTER_CUBIC : cv::INTER_AREA;
-      cv::resize(cropped_frames[i], destination, destination.size(), 0, 0,
-                 interpolation_method);
-    }
     if (*apply_padding) {
       if (has_solid_background_) {
         double lab[3];
@@ -648,11 +722,39 @@ void SceneCroppingCalculator::FilterKeyFrameInfo() {
         k[0] = k[0] < 0.0 ? 0.0 : k[0] > 255.0 ? 255.0 : k[0];
         k[1] = k[1] < 0.0 ? 0.0 : k[1] > 255.0 ? 255.0 : k[1];
         k[2] = k[2] < 0.0 ? 0.0 : k[2] > 255.0 ? 255.0 : k[2];
-        interpolated_color =
+        cv::Scalar interpolated_color =
             cv::Scalar(std::round(k[0]), std::round(k[1]), std::round(k[2]));
-        background_color = &interpolated_color;
         padding_color_to_add = interpolated_color;
       }
+    }
+    padding_colors->push_back(padding_color_to_add);
+  }
+  if (!cropped_frames_ptr) {
+    return ::mediapipe::OkStatus();
+  }
+
+  // Resizes cropped frames, pads frames, and outputs frames.
+  for (int i = 0; i < num_frames; ++i) {
+    const int64 time_ms = scene_frame_timestamps_[i];
+    const Timestamp timestamp(time_ms);
+    auto scaled_frame = absl::make_unique<ImageFrame>(
+        frame_format_, scaled_width, scaled_height);
+    auto destination = formats::MatView(scaled_frame.get());
+    if (scaled_width == crop_width && scaled_height == crop_height) {
+      cropped_frames_ptr->at(i).copyTo(destination);
+    } else {
+      // cubic is better quality for upscaling and area is good for
+      // downscaling
+      const int interpolation_method =
+          scaling > 1 ? cv::INTER_CUBIC : cv::INTER_AREA;
+      cv::resize(cropped_frames_ptr->at(i), destination, destination.size(), 0,
+                 0, interpolation_method);
+    }
+    if (*apply_padding) {
+      cv::Scalar* background_color = nullptr;
+      if (has_solid_background_) {
+        background_color = &padding_colors->at(i);
+      }
       auto padded_frame = absl::make_unique<ImageFrame>();
       MP_RETURN_IF_ERROR(padder_->Process(
           *scaled_frame, background_contrast_,
@@ -670,7 +772,6 @@ void SceneCroppingCalculator::FilterKeyFrameInfo() {
           .Tag(kOutputCroppedFrames)
           .Add(scaled_frame.release(), timestamp);
     }
-    padding_colors->push_back(padding_color_to_add);
   }
   return ::mediapipe::OkStatus();
 }
@@ -678,6 +779,7 @@ void SceneCroppingCalculator::FilterKeyFrameInfo() {
 mediapipe::Status SceneCroppingCalculator::OutputVizFrames(
     const std::vector<KeyFrameCropResult>& key_frame_crop_results,
     const std::vector<FocusPointFrame>& focus_point_frames,
+    const std::vector<cv::Rect>& crop_from_locations,
     const int crop_window_width, const int crop_window_height,
     CalculatorContext* cc) const {
   if (cc->Outputs().HasTag(kOutputKeyFrameCropViz)) {
@@ -703,6 +805,17 @@ mediapipe::Status SceneCroppingCalculator::OutputVizFrames(
           .Add(viz_frames[i].release(), Timestamp(scene_frame_timestamps_[i]));
     }
   }
+  if (cc->Outputs().HasTag(kOutputFramingAndDetections)) {
+    std::vector<std::unique_ptr<ImageFrame>> viz_frames;
+    MP_RETURN_IF_ERROR(DrawDetectionAndFramingWindow(
+        raw_scene_frames_or_empty_, crop_from_locations, frame_format_,
+        options_.viz_overlay_opacity(), &viz_frames));
+    for (int i = 0; i < raw_scene_frames_or_empty_.size(); ++i) {
+      cc->Outputs()
+          .Tag(kOutputFramingAndDetections)
+          .Add(viz_frames[i].release(), Timestamp(scene_frame_timestamps_[i]));
+    }
+  }
   return ::mediapipe::OkStatus();
 }
 
diff --git a/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.h b/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.h
index 926b434bc..1c00e6210 100644
--- a/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.h
+++ b/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.h
@@ -145,9 +145,13 @@ class SceneCroppingCalculator : public CalculatorBase {
   // Removes any static borders from the scene frames before cropping. The
   // arguments |top_border_size| and |bottom_border_size| report the size of the
   // removed borders.
-  ::mediapipe::Status RemoveStaticBorders(int* top_border_size,
+  ::mediapipe::Status RemoveStaticBorders(CalculatorContext* cc,
+                                          int* top_border_size,
                                           int* bottom_border_size);
 
+  // Sets up autoflip after first frame is received and input size is known.
+  ::mediapipe::Status InitializeSceneCroppingCalculator(
+      ::mediapipe::CalculatorContext* cc);
   // Initializes a FrameCropRegionComputer given input and target frame sizes.
   ::mediapipe::Status InitializeFrameCropRegionComputer();
 
@@ -164,20 +168,26 @@ class SceneCroppingCalculator : public CalculatorBase {
   ::mediapipe::Status ProcessScene(const bool is_end_of_scene,
                                    CalculatorContext* cc);
 
-  // Formats and outputs the cropped frames. Scales them to be at least as big
-  // as the target size. If the aspect ratio is different, applies padding. Uses
-  // solid background from static features if possible, otherwise uses blurred
-  // background. Sets apply_padding to true if the scene is padded.
+  // Formats and outputs the cropped frames passed in through
+  // |cropped_frames_ptr|. Scales them to be at least as big as the target
+  // size. If the aspect ratio is different, applies padding. Uses solid
+  // background from static features if possible, otherwise uses blurred
+  // background. Sets |apply_padding| to true if the scene is padded. Set
+  // |cropped_frames_ptr| to nullptr to bypass the actual output of the
+  // cropped frames. This is useful when the calculator is only used for
+  // computing the cropping metadata rather than doing the actual cropping
+  // operation.
   ::mediapipe::Status FormatAndOutputCroppedFrames(
-      const std::vector<cv::Mat>& cropped_frames,
+      const int crop_width, const int crop_height, const int num_frames,
       std::vector<cv::Rect>* render_to_locations, bool* apply_padding,
       std::vector<cv::Scalar>* padding_colors, float* vertical_fill_percent,
-      CalculatorContext* cc);
+      const std::vector<cv::Mat>* cropped_frames_ptr, CalculatorContext* cc);
 
   // Draws and outputs visualization frames if those streams are present.
   ::mediapipe::Status OutputVizFrames(
       const std::vector<KeyFrameCropResult>& key_frame_crop_results,
       const std::vector<FocusPointFrame>& focus_point_frames,
+      const std::vector<cv::Rect>& crop_from_locations,
       const int crop_window_width, const int crop_window_height,
       CalculatorContext* cc) const;
 
@@ -201,16 +211,21 @@ class SceneCroppingCalculator : public CalculatorBase {
   // Calculator options.
   SceneCroppingCalculatorOptions options_;
 
-  // Buffered KeyFrameInfos for the current scene (size = number of key frames).
+  // Buffered KeyFrameInfos for the current scene (size = number of key
+  // frames).
   std::vector<KeyFrameInfo> key_frame_infos_;
 
   // Buffered frames, timestamps, and indicators for key frames in the current
   // scene (size = number of input video frames).
-  // Note: scene_frames_or_empty_ may be empty if the actual cropping operation
-  // of frames is turned off, e.g. when |should_perform_frame_cropping_| is
-  // false, so rely on scene_frame_timestamps_.size() to query the number of
-  // accumulated timestamps rather than scene_frames_or_empty_.size().
+  // Note: scene_frames_or_empty_ may be empty if the actual cropping
+  // operation of frames is turned off, e.g. when
+  // |should_perform_frame_cropping_| is false, so rely on
+  // scene_frame_timestamps_.size() to query the number of accumulated
+  // timestamps rather than scene_frames_or_empty_.size().
+  // TODO: all of the following vectors are expected to be the same
+  // size. Add to struct and store together in one vector.
   std::vector<cv::Mat> scene_frames_or_empty_;
+  std::vector<cv::Mat> raw_scene_frames_or_empty_;
   std::vector<int64> scene_frame_timestamps_;
   std::vector<bool> is_key_frames_;
 
@@ -221,6 +236,9 @@ class SceneCroppingCalculator : public CalculatorBase {
   // Stored FocusPointFrames from prior scene when there was no actual scene
   // change (due to forced flush when buffer is full).
   std::vector<FocusPointFrame> prior_focus_point_frames_;
+  // Indicates if this scene is a continuation of the last scene (due to
+  // forced flush when buffer is full).
+  bool continue_last_scene_ = false;
 
   // KeyFrameCropOptions used by the FrameCropRegionComputer.
   KeyFrameCropOptions key_frame_crop_options_;
@@ -242,8 +260,8 @@ class SceneCroppingCalculator : public CalculatorBase {
   std::vector<StaticFeatures> static_features_;
   std::vector<int64> static_features_timestamps_;
   bool has_solid_background_ = false;
-  // CIELAB yields more natural color transitions than RGB and HSV: RGB tends to
-  // produce darker in-between colors and HSV can introduce new hues. See
+  // CIELAB yields more natural color transitions than RGB and HSV: RGB tends
+  // to produce darker in-between colors and HSV can introduce new hues. See
   // https://howaboutanorange.com/blog/2011/08/10/color_interpolation/ for
   // visual comparisons of color transition in different spaces.
   PiecewiseLinearFunction background_color_l_function_;  // CIELAB - l
@@ -264,11 +282,11 @@ class SceneCroppingCalculator : public CalculatorBase {
   std::unique_ptr<std::vector<ExternalRenderFrame>> external_render_list_;
 
   // Determines whether to perform real cropping on input frames. This flag is
-  // useful when the user only needs to compute cropping windows, in which case
-  // setting this flag to false can avoid buffering as well as cropping frames.
-  // This can significantly reduce memory usage and speed up processing. Some
-  // debugging visualization inevitably will be disabled because of this flag
-  // too.
+  // useful when the user only needs to compute cropping windows, in which
+  // case setting this flag to false can avoid buffering as well as cropping
+  // frames. This can significantly reduce memory usage and speed up
+  // processing. Some debugging visualization inevitably will be disabled
+  // because of this flag too.
   bool should_perform_frame_cropping_ = false;
 };
 }  // namespace autoflip
diff --git a/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.proto b/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.proto
index 31309d162..f9ba9cb87 100644
--- a/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.proto
+++ b/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator.proto
@@ -44,6 +44,8 @@ message SceneCroppingCalculatorOptions {
     // Used on conjuntion with external_aspect_ratio, create the largest sized
     // output without upscaling the video.
     MAXIMIZE_TARGET_DIMENSION = 4;
+    // Uses original dimensions to calculate aspect ratio.
+    KEEP_ORIGINAL_DIMENSION = 5;
   }
   optional TargetSizeType target_size_type = 3 [default = USE_TARGET_DIMENSION];
 
@@ -53,7 +55,10 @@ message SceneCroppingCalculatorOptions {
 
   // Number of frames from prior buffer to be used to smooth out camera
   // trajectory when it was a forced flush.
-  optional int32 prior_frame_buffer_size = 5 [default = 30];
+  optional int32 prior_frame_buffer_size = 5 [default = 30, deprecated = true];
+  // Set camera motion type along with parameters.  Must select between the two
+  // provided options.
+  optional CameraMotionOptions camera_motion_options = 14;
 
   // Options for computing key frame crop regions using the
   // FrameCropRegionComputer.
diff --git a/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator_test.cc b/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator_test.cc
index 7c9f5009f..6cc9217e3 100644
--- a/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator_test.cc
+++ b/mediapipe/examples/desktop/autoflip/calculators/scene_cropping_calculator_test.cc
@@ -94,6 +94,7 @@ constexpr char kDebugConfig[] = R"(
   output_stream: "CROPPED_FRAMES:cropped_frames"
   output_stream: "KEY_FRAME_CROP_REGION_VIZ_FRAMES:key_frame_crop_viz_frames"
   output_stream: "SALIENT_POINT_FRAME_VIZ_FRAMES:salient_point_viz_frames"
+  output_stream: "FRAMING_DETECTIONS_VIZ_FRAMES:framing_viz_frames"
   output_stream: "CROPPING_SUMMARY:cropping_summaries"
   output_stream: "EXTERNAL_RENDERING_PER_FRAME:external_rendering_per_frame"
   output_stream: "EXTERNAL_RENDERING_FULL_VID:external_rendering_full_vid"
@@ -104,6 +105,39 @@ constexpr char kDebugConfig[] = R"(
     }
   })";
 
+constexpr char kExternalRenderConfig[] = R"(
+  calculator: "SceneCroppingCalculator"
+  input_stream: "VIDEO_FRAMES:camera_frames_org"
+  input_stream: "KEY_FRAMES:down_sampled_frames"
+  input_stream: "DETECTION_FEATURES:salient_regions"
+  input_stream: "STATIC_FEATURES:border_features"
+  input_stream: "SHOT_BOUNDARIES:shot_boundary_frames"
+  output_stream: "EXTERNAL_RENDERING_PER_FRAME:external_rendering_per_frame"
+  output_stream: "EXTERNAL_RENDERING_FULL_VID:external_rendering_full_vid"
+  options: {
+    [mediapipe.autoflip.SceneCroppingCalculatorOptions.ext]: {
+      target_width: $0
+      target_height: $1
+    }
+  })";
+
+constexpr char kExternalRenderConfigNoVideo[] = R"(
+  calculator: "SceneCroppingCalculator"
+  input_stream: "VIDEO_SIZE:camera_size"
+  input_stream: "DETECTION_FEATURES:salient_regions"
+  input_stream: "STATIC_FEATURES:border_features"
+  input_stream: "SHOT_BOUNDARIES:shot_boundary_frames"
+  output_stream: "EXTERNAL_RENDERING_PER_FRAME:external_rendering_per_frame"
+  output_stream: "EXTERNAL_RENDERING_FULL_VID:external_rendering_full_vid"
+  options: {
+    [mediapipe.autoflip.SceneCroppingCalculatorOptions.ext]: {
+      target_width: $0
+      target_height: $1
+      video_features_width: $2
+      video_features_height: $3
+    }
+  })";
+
 constexpr int kInputFrameWidth = 1280;
 constexpr int kInputFrameHeight = 720;
 
@@ -172,6 +206,22 @@ std::unique_ptr<DetectionSet> MakeDetections(const int num_detections,
   return detections;
 }
 
+// Makes a detection set holding one fixed (non-random) detection with score 1.
+// Its region's top-left corner is offset by -5 in x and y from the center of
+// a frame with the given width and height.
+std::unique_ptr<DetectionSet> MakeCenterDetection(const int width,
+                                                  const int height) {
+  auto detections = absl::make_unique<DetectionSet>();
+  auto* region = detections->add_detections();
+  auto* location = region->mutable_location();
+  location->set_x(width / 2 - 5);
+  location->set_width(width / 2 + 10);
+  location->set_y(height / 2 - 5);
+  location->set_height(height);
+  region->set_score(1);
+  return detections;
+}
+
 // Makes an image frame of solid color given color, width, and height.
 std::unique_ptr<ImageFrame> MakeImageFrameFromColor(const cv::Scalar& color,
                                                     const int width,
@@ -188,7 +238,7 @@ std::unique_ptr<ImageFrame> MakeImageFrameFromColor(const cv::Scalar& color,
 // and kMaxNumDetections. Optionally add a key image frame of random solid color
 // and given size.
 void AddKeyFrameFeatures(const int64 time_ms, const int key_frame_width,
-                         const int key_frame_height,
+                         const int key_frame_height, bool randomize,
                          CalculatorRunner::StreamContentsSet* inputs) {
   Timestamp timestamp(time_ms);
   if (inputs->HasTag("KEY_FRAMES")) {
@@ -197,13 +247,18 @@ void AddKeyFrameFeatures(const int64 time_ms, const int key_frame_width,
     inputs->Tag("KEY_FRAMES")
         .packets.push_back(Adopt(key_frame.release()).At(timestamp));
   }
-
-  const int num_detections = std::uniform_int_distribution<int>(
-      kMinNumDetections, kMaxNumDetections)(GetGen());
-  auto detections =
-      MakeDetections(num_detections, key_frame_width, key_frame_height);
-  inputs->Tag("DETECTION_FEATURES")
-      .packets.push_back(Adopt(detections.release()).At(timestamp));
+  if (randomize) {
+    const int num_detections = std::uniform_int_distribution<int>(
+        kMinNumDetections, kMaxNumDetections)(GetGen());
+    auto detections =
+        MakeDetections(num_detections, key_frame_width, key_frame_height);
+    inputs->Tag("DETECTION_FEATURES")
+        .packets.push_back(Adopt(detections.release()).At(timestamp));
+  } else {
+    auto detections = MakeCenterDetection(key_frame_width, key_frame_height);
+    inputs->Tag("DETECTION_FEATURES")
+        .packets.push_back(Adopt(detections.release()).At(timestamp));
+  }
 }
 
 // Adds a scene given number of frames to the input stream. Spaces frame at the
@@ -212,19 +267,31 @@ void AddKeyFrameFeatures(const int64 time_ms, const int key_frame_width,
 void AddScene(const int start_frame_index, const int num_scene_frames,
               const int frame_width, const int frame_height,
               const int key_frame_width, const int key_frame_height,
+              const int DownSampleRate,
               CalculatorRunner::StreamContentsSet* inputs) {
   int64 time_ms = start_frame_index * kTimestampDiff;
   for (int i = 0; i < num_scene_frames; ++i) {
     Timestamp timestamp(time_ms);
-    auto frame =
-        MakeImageFrameFromColor(GetRandomColor(), frame_width, frame_height);
-    inputs->Tag("VIDEO_FRAMES")
-        .packets.push_back(Adopt(frame.release()).At(timestamp));
+    if (inputs->HasTag("VIDEO_FRAMES")) {
+      auto frame =
+          MakeImageFrameFromColor(GetRandomColor(), frame_width, frame_height);
+      inputs->Tag("VIDEO_FRAMES")
+          .packets.push_back(Adopt(frame.release()).At(timestamp));
+    } else {
+      auto input_size =
+          ::absl::make_unique<std::pair<int, int>>(frame_width, frame_height);
+      inputs->Tag("VIDEO_SIZE")
+          .packets.push_back(Adopt(input_size.release()).At(timestamp));
+    }
     auto static_features = absl::make_unique<StaticFeatures>();
     inputs->Tag("STATIC_FEATURES")
         .packets.push_back(Adopt(static_features.release()).At(timestamp));
-    if (i % kDownSampleRate == 0) {  // is a key frame
-      AddKeyFrameFeatures(time_ms, key_frame_width, key_frame_height, inputs);
+    if (DownSampleRate == 1) {
+      AddKeyFrameFeatures(time_ms, key_frame_width, key_frame_height, false,
+                          inputs);
+    } else if (i % DownSampleRate == 0) {  // is a key frame
+      AddKeyFrameFeatures(time_ms, key_frame_width, key_frame_height, true,
+                          inputs);
     }
     if (i == num_scene_frames - 1) {  // adds shot boundary
       inputs->Tag("SHOT_BOUNDARIES")
@@ -294,7 +361,7 @@ TEST(SceneCroppingCalculatorTest, HandlesNoKeyFrames) {
           absl::Substitute(kNoKeyFrameConfig, kTargetWidth, kTargetHeight));
   auto runner = absl::make_unique<CalculatorRunner>(config);
   AddScene(0, kSceneSize, kInputFrameWidth, kInputFrameHeight, kKeyFrameWidth,
-           kKeyFrameHeight, runner->MutableInputs());
+           kKeyFrameHeight, kDownSampleRate, runner->MutableInputs());
   MP_EXPECT_OK(runner->Run());
   CheckCroppedFrames(*runner, kSceneSize, kTargetWidth, kTargetHeight);
 }
@@ -308,7 +375,8 @@ TEST(SceneCroppingCalculatorTest, HandlesLongScene) {
           kPriorFrameBufferSize));
   auto runner = absl::make_unique<CalculatorRunner>(config);
   AddScene(0, 2 * kMaxSceneSize, kInputFrameWidth, kInputFrameHeight,
-           kKeyFrameWidth, kKeyFrameHeight, runner->MutableInputs());
+           kKeyFrameWidth, kKeyFrameHeight, kDownSampleRate,
+           runner->MutableInputs());
   MP_EXPECT_OK(runner->Run());
   CheckCroppedFrames(*runner, 2 * kMaxSceneSize, kTargetWidth, kTargetHeight);
 }
@@ -321,7 +389,7 @@ TEST(SceneCroppingCalculatorTest, OutputsDebugStreams) {
   auto runner = absl::make_unique<CalculatorRunner>(config);
   const int num_frames = kSceneSize;
   AddScene(0, num_frames, kInputFrameWidth, kInputFrameHeight, kKeyFrameWidth,
-           kKeyFrameHeight, runner->MutableInputs());
+           kKeyFrameHeight, kDownSampleRate, runner->MutableInputs());
 
   MP_EXPECT_OK(runner->Run());
   const auto& outputs = runner->Outputs();
@@ -330,6 +398,7 @@ TEST(SceneCroppingCalculatorTest, OutputsDebugStreams) {
   EXPECT_TRUE(outputs.HasTag("CROPPING_SUMMARY"));
   EXPECT_TRUE(outputs.HasTag("EXTERNAL_RENDERING_PER_FRAME"));
   EXPECT_TRUE(outputs.HasTag("EXTERNAL_RENDERING_FULL_VID"));
+  EXPECT_TRUE(outputs.HasTag("FRAMING_DETECTIONS_VIZ_FRAMES"));
   const auto& crop_region_viz_frames_outputs =
       outputs.Tag("KEY_FRAME_CROP_REGION_VIZ_FRAMES").packets;
   const auto& salient_point_viz_frames_outputs =
@@ -339,8 +408,11 @@ TEST(SceneCroppingCalculatorTest, OutputsDebugStreams) {
       outputs.Tag("EXTERNAL_RENDERING_PER_FRAME").packets;
   const auto& ext_render_full_vid =
       outputs.Tag("EXTERNAL_RENDERING_FULL_VID").packets;
+  const auto& framing_viz_frames_output =
+      outputs.Tag("FRAMING_DETECTIONS_VIZ_FRAMES").packets;
   EXPECT_EQ(crop_region_viz_frames_outputs.size(), num_frames);
   EXPECT_EQ(salient_point_viz_frames_outputs.size(), num_frames);
+  EXPECT_EQ(framing_viz_frames_output.size(), num_frames);
   EXPECT_EQ(summary_output.size(), 1);
   EXPECT_EQ(ext_render_per_frame.size(), num_frames);
   EXPECT_EQ(ext_render_full_vid.size(), 1);
@@ -387,7 +459,8 @@ TEST(SceneCroppingCalculatorTest, HandlesLandscapeTarget) {
   auto runner = absl::make_unique<CalculatorRunner>(config);
   for (int i = 0; i < kNumScenes; ++i) {
     AddScene(i * kSceneSize, kSceneSize, input_width, input_height,
-             kKeyFrameWidth, kKeyFrameHeight, runner->MutableInputs());
+             kKeyFrameWidth, kKeyFrameHeight, kDownSampleRate,
+             runner->MutableInputs());
   }
   const int num_frames = kSceneSize * kNumScenes;
   MP_EXPECT_OK(runner->Run());
@@ -404,13 +477,34 @@ TEST(SceneCroppingCalculatorTest, CropsToTargetSize) {
   auto runner = absl::make_unique<CalculatorRunner>(config);
   for (int i = 0; i < kNumScenes; ++i) {
     AddScene(i * kSceneSize, kSceneSize, kInputFrameWidth, kInputFrameHeight,
-             kKeyFrameWidth, kKeyFrameHeight, runner->MutableInputs());
+             kKeyFrameWidth, kKeyFrameHeight, kDownSampleRate,
+             runner->MutableInputs());
   }
   const int num_frames = kSceneSize * kNumScenes;
   MP_EXPECT_OK(runner->Run());
   CheckCroppedFrames(*runner, num_frames, kTargetWidth, kTargetHeight);
 }
 
+// Checks that the calculator crops scene frames to input size when the target
+// size type is KEEP_ORIGINAL_DIMENSION.
+TEST(SceneCroppingCalculatorTest, CropsToOriginalDimension) {
+  // target_width and target_height are ignored
+  const CalculatorGraphConfig::Node config =
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(absl::Substitute(
+          kConfig, /*target_width*/ 2, /*target_height*/ 2,
+          SceneCroppingCalculatorOptions::KEEP_ORIGINAL_DIMENSION,
+          kMaxSceneSize, kPriorFrameBufferSize));
+  auto runner = absl::make_unique<CalculatorRunner>(config);
+  for (int i = 0; i < kNumScenes; ++i) {
+    AddScene(i * kSceneSize, kSceneSize, kInputFrameWidth, kInputFrameHeight,
+             kKeyFrameWidth, kKeyFrameHeight, kDownSampleRate,
+             runner->MutableInputs());
+  }
+  const int num_frames = kSceneSize * kNumScenes;
+  MP_EXPECT_OK(runner->Run());
+  CheckCroppedFrames(*runner, num_frames, kInputFrameWidth, kInputFrameHeight);
+}
+
 // Checks that the calculator keeps original height if the target size type is
 // set to KEEP_ORIGINAL_HEIGHT.
 TEST(SceneCroppingCalculatorTest, KeepsOriginalHeight) {
@@ -427,7 +521,8 @@ TEST(SceneCroppingCalculatorTest, KeepsOriginalHeight) {
           kPriorFrameBufferSize));
   auto runner = absl::make_unique<CalculatorRunner>(config);
   AddScene(0, kMaxSceneSize, kInputFrameWidth, kInputFrameHeight,
-           kKeyFrameWidth, kKeyFrameHeight, runner->MutableInputs());
+           kKeyFrameWidth, kKeyFrameHeight, kDownSampleRate,
+           runner->MutableInputs());
   MP_EXPECT_OK(runner->Run());
   CheckCroppedFrames(*runner, kMaxSceneSize, target_width, target_height);
 }
@@ -448,7 +543,8 @@ TEST(SceneCroppingCalculatorTest, KeepsOriginalWidth) {
           kPriorFrameBufferSize));
   auto runner = absl::make_unique<CalculatorRunner>(config);
   AddScene(0, kMaxSceneSize, kInputFrameWidth, kInputFrameHeight,
-           kKeyFrameWidth, kKeyFrameHeight, runner->MutableInputs());
+           kKeyFrameWidth, kKeyFrameHeight, kDownSampleRate,
+           runner->MutableInputs());
   MP_EXPECT_OK(runner->Run());
   CheckCroppedFrames(*runner, kMaxSceneSize, target_width, target_height);
 }
@@ -461,7 +557,8 @@ TEST(SceneCroppingCalculatorTest, RejectsOddTargetSize) {
           kMaxSceneSize, kPriorFrameBufferSize));
   auto runner = absl::make_unique<CalculatorRunner>(config);
   AddScene(0, kMaxSceneSize, kInputFrameWidth, kInputFrameHeight,
-           kKeyFrameWidth, kKeyFrameHeight, runner->MutableInputs());
+           kKeyFrameWidth, kKeyFrameHeight, kDownSampleRate,
+           runner->MutableInputs());
   const auto status = runner->Run();
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(), HasSubstr("Target width cannot be odd"));
@@ -498,7 +595,7 @@ TEST(SceneCroppingCalculatorTest, ProducesEvenFrameSize) {
                 kMaxSceneSize, kPriorFrameBufferSize));
         auto runner = absl::make_unique<CalculatorRunner>(config);
         AddScene(0, 1, frame_width, frame_height, kKeyFrameWidth,
-                 kKeyFrameHeight, runner->MutableInputs());
+                 kKeyFrameHeight, kDownSampleRate, runner->MutableInputs());
         MP_EXPECT_OK(runner->Run());
         const auto& output_frame = runner->Outputs()
                                        .Tag("CROPPED_FRAMES")
@@ -665,6 +762,146 @@ TEST(SceneCroppingCalculatorTest, RemovesStaticBorders) {
     }
   }
 }
+
+// Checks external render message with default poly path solver.
+TEST(SceneCroppingCalculatorTest, OutputsCropMessagePolyPath) {
+  const CalculatorGraphConfig::Node config =
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(
+          absl::Substitute(kExternalRenderConfig, kTargetWidth, kTargetHeight));
+  auto runner = absl::make_unique<CalculatorRunner>(config);
+  const int num_frames = kSceneSize;
+  AddScene(0, num_frames, kInputFrameWidth, kInputFrameHeight, kKeyFrameWidth,
+           kKeyFrameHeight, 1, runner->MutableInputs());
+
+  MP_EXPECT_OK(runner->Run());
+  const auto& outputs = runner->Outputs();
+  const auto& ext_render_per_frame =
+      outputs.Tag("EXTERNAL_RENDERING_PER_FRAME").packets;
+  EXPECT_EQ(ext_render_per_frame.size(), num_frames);
+
+  for (int i = 0; i < num_frames - 1; ++i) {
+    const auto& ext_render_message =
+        ext_render_per_frame[i].Get<ExternalRenderFrame>();
+    EXPECT_EQ(ext_render_message.timestamp_us(), i * 20000);
+    EXPECT_EQ(ext_render_message.crop_from_location().x(), 725);
+    EXPECT_EQ(ext_render_message.crop_from_location().y(), 0);
+    EXPECT_EQ(ext_render_message.crop_from_location().width(), 461);
+    EXPECT_EQ(ext_render_message.crop_from_location().height(), 720);
+    EXPECT_EQ(ext_render_message.render_to_location().x(), 0);
+    EXPECT_EQ(ext_render_message.render_to_location().y(), 0);
+    EXPECT_EQ(ext_render_message.render_to_location().width(), 720);
+    EXPECT_EQ(ext_render_message.render_to_location().height(), 1124);
+  }
+}
+
+// Checks external render message with kinematic path solver.
+TEST(SceneCroppingCalculatorTest, OutputsCropMessageKinematicPath) {
+  CalculatorGraphConfig::Node config =
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(
+          absl::Substitute(kDebugConfig, kTargetWidth, kTargetHeight));
+  auto* options = config.mutable_options()->MutableExtension(
+      SceneCroppingCalculatorOptions::ext);
+  auto* kinematic_options =
+      options->mutable_camera_motion_options()->mutable_kinematic_options();
+  kinematic_options->set_max_velocity(200);
+
+  auto runner = absl::make_unique<CalculatorRunner>(config);
+  const int num_frames = kSceneSize;
+  AddScene(0, num_frames, kInputFrameWidth, kInputFrameHeight, kKeyFrameWidth,
+           kKeyFrameHeight, 1, runner->MutableInputs());
+
+  MP_EXPECT_OK(runner->Run());
+  const auto& outputs = runner->Outputs();
+  const auto& ext_render_per_frame =
+      outputs.Tag("EXTERNAL_RENDERING_PER_FRAME").packets;
+  EXPECT_EQ(ext_render_per_frame.size(), num_frames);
+
+  for (int i = 0; i < num_frames - 1; ++i) {
+    const auto& ext_render_message =
+        ext_render_per_frame[i].Get<ExternalRenderFrame>();
+    EXPECT_EQ(ext_render_message.timestamp_us(), i * 20000);
+    EXPECT_EQ(ext_render_message.crop_from_location().x(), 725);
+    EXPECT_EQ(ext_render_message.crop_from_location().y(), 0);
+    EXPECT_EQ(ext_render_message.crop_from_location().width(), 461);
+    EXPECT_EQ(ext_render_message.crop_from_location().height(), 720);
+    EXPECT_EQ(ext_render_message.render_to_location().x(), 0);
+    EXPECT_EQ(ext_render_message.render_to_location().y(), 0);
+    EXPECT_EQ(ext_render_message.render_to_location().width(), 720);
+    EXPECT_EQ(ext_render_message.render_to_location().height(), 1124);
+  }
+}
+
+// Checks external render message with default poly path solver without video
+// input.
+TEST(SceneCroppingCalculatorTest, OutputsCropMessagePolyPathNoVideo) {
+  const CalculatorGraphConfig::Node config =
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(
+          absl::Substitute(kExternalRenderConfigNoVideo, kTargetWidth,
+                           kTargetHeight, kKeyFrameWidth, kKeyFrameHeight));
+  auto runner = absl::make_unique<CalculatorRunner>(config);
+  const int num_frames = kSceneSize;
+  AddScene(0, num_frames, kInputFrameWidth, kInputFrameHeight, kKeyFrameWidth,
+           kKeyFrameHeight, 1, runner->MutableInputs());
+
+  MP_EXPECT_OK(runner->Run());
+  const auto& outputs = runner->Outputs();
+  const auto& ext_render_per_frame =
+      outputs.Tag("EXTERNAL_RENDERING_PER_FRAME").packets;
+  EXPECT_EQ(ext_render_per_frame.size(), num_frames);
+
+  for (int i = 0; i < num_frames - 1; ++i) {
+    const auto& ext_render_message =
+        ext_render_per_frame[i].Get<ExternalRenderFrame>();
+    EXPECT_EQ(ext_render_message.timestamp_us(), i * 20000);
+    EXPECT_EQ(ext_render_message.crop_from_location().x(), 725);
+    EXPECT_EQ(ext_render_message.crop_from_location().y(), 0);
+    EXPECT_EQ(ext_render_message.crop_from_location().width(), 461);
+    EXPECT_EQ(ext_render_message.crop_from_location().height(), 720);
+    EXPECT_EQ(ext_render_message.render_to_location().x(), 0);
+    EXPECT_EQ(ext_render_message.render_to_location().y(), 0);
+    EXPECT_EQ(ext_render_message.render_to_location().width(), 720);
+    EXPECT_EQ(ext_render_message.render_to_location().height(), 1124);
+  }
+}
+
+// Checks external render message with kinematic path solver without video
+// input.
+TEST(SceneCroppingCalculatorTest, OutputsCropMessageKinematicPathNoVideo) {
+  CalculatorGraphConfig::Node config =
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(
+          absl::Substitute(kExternalRenderConfigNoVideo, kTargetWidth,
+                           kTargetHeight, kKeyFrameWidth, kKeyFrameHeight));
+  auto* options = config.mutable_options()->MutableExtension(
+      SceneCroppingCalculatorOptions::ext);
+  auto* kinematic_options =
+      options->mutable_camera_motion_options()->mutable_kinematic_options();
+  kinematic_options->set_max_velocity(2.0);
+
+  auto runner = absl::make_unique<CalculatorRunner>(config);
+  const int num_frames = kSceneSize;
+  AddScene(0, num_frames, kInputFrameWidth, kInputFrameHeight, kKeyFrameWidth,
+           kKeyFrameHeight, 1, runner->MutableInputs());
+
+  MP_EXPECT_OK(runner->Run());
+  const auto& outputs = runner->Outputs();
+  const auto& ext_render_per_frame =
+      outputs.Tag("EXTERNAL_RENDERING_PER_FRAME").packets;
+  EXPECT_EQ(ext_render_per_frame.size(), num_frames);
+
+  for (int i = 0; i < num_frames - 1; ++i) {
+    const auto& ext_render_message =
+        ext_render_per_frame[i].Get<ExternalRenderFrame>();
+    EXPECT_EQ(ext_render_message.timestamp_us(), i * 20000);
+    EXPECT_EQ(ext_render_message.crop_from_location().x(), 725);
+    EXPECT_EQ(ext_render_message.crop_from_location().y(), 0);
+    EXPECT_EQ(ext_render_message.crop_from_location().width(), 461);
+    EXPECT_EQ(ext_render_message.crop_from_location().height(), 720);
+    EXPECT_EQ(ext_render_message.render_to_location().x(), 0);
+    EXPECT_EQ(ext_render_message.render_to_location().y(), 0);
+    EXPECT_EQ(ext_render_message.render_to_location().width(), 720);
+    EXPECT_EQ(ext_render_message.render_to_location().height(), 1124);
+  }
+}
 }  // namespace
 }  // namespace autoflip
 }  // namespace mediapipe
diff --git a/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator.cc b/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator.cc
index 55cd796b8..703932938 100644
--- a/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator.cc
+++ b/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator.cc
@@ -30,6 +30,10 @@ using mediapipe::autoflip::DetectionSet;
 using mediapipe::autoflip::SalientRegion;
 using mediapipe::autoflip::SignalType;
 
+constexpr char kIsShotBoundaryTag[] = "IS_SHOT_BOUNDARY";
+constexpr char kSignalInputsTag[] = "SIGNAL";
+constexpr char kOutputTag[] = "OUTPUT";
+
 namespace mediapipe {
 namespace autoflip {
 
@@ -43,16 +47,16 @@ struct Frame {
   mediapipe::Timestamp time;
 };
 
-// This calculator takes one scene change signal and an arbitrary number of
-// detection signals and outputs a single list of detections.  The scores for
-// the detections can be re-normalized using the options proto.  Additionally,
-// if a detection has a consistent tracking id during a scene the score for that
-// detection is averaged over the whole scene.
+// This calculator takes one scene change signal (optional, see below) and an
+// arbitrary number of detection signals and outputs a single list of
+// detections.  The scores for the detections can be re-normalized using the
+// options proto.  Additionally, if a detection has a consistent tracking id
+// during a scene the score for that detection is averaged over the whole scene.
 //
-// Example:
+// Example (ordered interface):
 //  node {
 //    calculator: "SignalFusingCalculator"
-//    input_stream: "scene_change"
+//    input_stream: "scene_change" (required for ordered interface)
 //    input_stream: "detection_faces"
 //    input_stream: "detection_custom_text"
 //    output_stream: "salient_region"
@@ -71,9 +75,33 @@ struct Frame {
 //    }
 //    }
 //  }
+//
+// Example (tag interface):
+//  node {
+//    calculator: "SignalFusingCalculator"
+//    input_stream: "IS_SHOT_BOUNDARY:scene_change" (optional)
+//    input_stream: "SIGNAL:0:detection_faces"
+//    input_stream: "SIGNAL:1:detection_custom_text"
+//    output_stream: "OUTPUT:salient_region"
+//    options:{
+//    [mediapipe.autoflip.SignalFusingCalculatorOptions.ext]:{
+//      signal_settings{
+//        type: {standard: FACE}
+//        min_score: 0.5
+//        max_score: 0.6
+//      }
+//      signal_settings{
+//        type: {custom: "custom_text"}
+//        min_score: 0.9
+//        max_score: 1.0
+//      }
+//    }
+//    }
+//  }
 class SignalFusingCalculator : public mediapipe::CalculatorBase {
  public:
-  SignalFusingCalculator() {}
+  SignalFusingCalculator()
+      : tag_input_interface_(false), process_by_scene_(true) {}
   SignalFusingCalculator(const SignalFusingCalculator&) = delete;
   SignalFusingCalculator& operator=(const SignalFusingCalculator&) = delete;
 
@@ -84,9 +112,12 @@ class SignalFusingCalculator : public mediapipe::CalculatorBase {
 
  private:
   mediapipe::Status ProcessScene(mediapipe::CalculatorContext* cc);
+  std::vector<Packet> GetSignalPackets(mediapipe::CalculatorContext* cc);
   SignalFusingCalculatorOptions options_;
   std::map<std::string, SignalSettings> settings_by_type_;
   std::vector<Frame> scene_frames_;
+  bool tag_input_interface_;
+  bool process_by_scene_;
 };
 REGISTER_CALCULATOR(SignalFusingCalculator);
 
@@ -104,7 +135,23 @@ std::string CreateKey(const InputSignal& detection) {
   std::string id = id_source + ":" + id_signal;
   return id;
 }
+void SetupTagInput(mediapipe::CalculatorContract* cc) {
+  if (cc->Inputs().HasTag(kIsShotBoundaryTag)) {
+    cc->Inputs().Tag(kIsShotBoundaryTag).Set<bool>();
+  }
+  for (int i = 0; i < cc->Inputs().NumEntries(kSignalInputsTag); i++) {
+    cc->Inputs().Get(kSignalInputsTag, i).Set<autoflip::DetectionSet>();
+  }
+  cc->Outputs().Tag(kOutputTag).Set<autoflip::DetectionSet>();
+}
 
+void SetupOrderedInput(mediapipe::CalculatorContract* cc) {
+  cc->Inputs().Index(0).Set<bool>();
+  for (int i = 1; i < cc->Inputs().NumEntries(); ++i) {
+    cc->Inputs().Index(i).Set<autoflip::DetectionSet>();
+  }
+  cc->Outputs().Index(0).Set<autoflip::DetectionSet>();
+}
 }  // namespace
 
 mediapipe::Status SignalFusingCalculator::Open(
@@ -113,6 +160,12 @@ mediapipe::Status SignalFusingCalculator::Open(
   for (const auto& setting : options_.signal_settings()) {
     settings_by_type_[CreateSettingsKey(setting.type())] = setting;
   }
+  if (cc->Inputs().HasTag(kSignalInputsTag)) {
+    tag_input_interface_ = true;
+    if (!cc->Inputs().HasTag(kIsShotBoundaryTag)) {
+      process_by_scene_ = false;
+    }
+  }
   return ::mediapipe::OkStatus();
 }
 
@@ -144,14 +197,12 @@ mediapipe::Status SignalFusingCalculator::ProcessScene(
       }
     }
   }
-
   // Average scores.
   for (auto iterator = multiframe_score.begin();
        iterator != multiframe_score.end(); iterator++) {
     multiframe_score[iterator->first] =
         iterator->second / detection_count[iterator->first];
   }
-
   // Process detections.
   for (const Frame& frame : scene_frames_) {
     std::unique_ptr<DetectionSet> processed_detections(new DetectionSet());
@@ -173,33 +224,63 @@ mediapipe::Status SignalFusingCalculator::ProcessScene(
         min_value = settings_it->second.min_score();
         max_value = settings_it->second.max_score();
         detection.signal.set_is_required(settings_it->second.is_required());
+        detection.signal.set_only_required(settings_it->second.only_required());
       }
 
       float final_score = score * (max_value - min_value) + min_value;
       detection.signal.set_score(final_score);
       *processed_detections->add_detections() = detection.signal;
     }
-    cc->Outputs().Index(0).Add(processed_detections.release(), frame.time);
+    if (tag_input_interface_) {
+      cc->Outputs()
+          .Tag(kOutputTag)
+          .Add(processed_detections.release(), frame.time);
+    } else {
+      cc->Outputs().Index(0).Add(processed_detections.release(), frame.time);
+    }
   }
 
   return ::mediapipe::OkStatus();
 }
 
+std::vector<Packet> SignalFusingCalculator::GetSignalPackets(
+    mediapipe::CalculatorContext* cc) {
+  std::vector<Packet> signal_packets;
+  if (tag_input_interface_) {
+    for (int i = 0; i < cc->Inputs().NumEntries(kSignalInputsTag); i++) {
+      const Packet& packet = cc->Inputs().Get(kSignalInputsTag, i).Value();
+      signal_packets.push_back(packet);
+    }
+  } else {
+    for (int i = 1; i < cc->Inputs().NumEntries(); i++) {
+      const Packet& packet = cc->Inputs().Index(i).Value();
+      signal_packets.push_back(packet);
+    }
+  }
+  return signal_packets;
+}
+
 mediapipe::Status SignalFusingCalculator::Process(
     mediapipe::CalculatorContext* cc) {
   bool is_boundary = false;
-  if (!cc->Inputs().Index(0).Value().IsEmpty()) {
-    is_boundary = cc->Inputs().Index(0).Get<bool>();
+  if (process_by_scene_) {
+    const auto& shot_tag = (tag_input_interface_)
+                               ? cc->Inputs().Tag(kIsShotBoundaryTag)
+                               : cc->Inputs().Index(0);
+    if (!shot_tag.Value().IsEmpty()) {
+      is_boundary = shot_tag.Get<bool>();
+    }
   }
 
-  if (is_boundary || scene_frames_.size() > options_.max_scene_size()) {
+  if (is_boundary) {
     MP_RETURN_IF_ERROR(ProcessScene(cc));
     scene_frames_.clear();
   }
 
   Frame frame;
-  for (int i = 1; i < cc->Inputs().NumEntries(); ++i) {
-    const Packet& packet = cc->Inputs().Index(i).Value();
+  const auto& signal_packets = GetSignalPackets(cc);
+  for (int i = 0; i < signal_packets.size(); i++) {
+    const Packet& packet = signal_packets[i];
     if (packet.IsEmpty()) {
       continue;
     }
@@ -214,16 +295,23 @@ mediapipe::Status SignalFusingCalculator::Process(
   frame.time = cc->InputTimestamp();
   scene_frames_.push_back(frame);
 
+  // Flush the buffer on this same input if it exceeds max_scene_size or if no
+  // shot boundary stream is connected.
+  if (scene_frames_.size() > options_.max_scene_size() || !process_by_scene_) {
+    MP_RETURN_IF_ERROR(ProcessScene(cc));
+    scene_frames_.clear();
+  }
+
   return ::mediapipe::OkStatus();
 }
 
 ::mediapipe::Status SignalFusingCalculator::GetContract(
     mediapipe::CalculatorContract* cc) {
-  cc->Inputs().Index(0).Set<bool>();
-  for (int i = 1; i < cc->Inputs().NumEntries(); ++i) {
-    cc->Inputs().Index(i).Set<autoflip::DetectionSet>();
+  if (cc->Inputs().NumEntries(kSignalInputsTag) > 0) {
+    SetupTagInput(cc);
+  } else {
+    SetupOrderedInput(cc);
   }
-  cc->Outputs().Index(0).Set<autoflip::DetectionSet>();
   return ::mediapipe::OkStatus();
 }
 
diff --git a/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator.proto b/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator.proto
index b7f735401..3f14935ba 100644
--- a/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator.proto
+++ b/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator.proto
@@ -31,7 +31,7 @@ message SignalFusingCalculatorOptions {
   optional int32 max_scene_size = 2 [default = 600];
 }
 
-// Next tag: 5
+// Next tag: 6
 message SignalSettings {
   // The type of signal these settings pertain to.
   optional SignalType type = 1;
@@ -51,4 +51,14 @@ message SignalSettings {
   // Is this signal required within the output cropped video?  If it is it will
   // be included or the video will be marked as failed to convert.
   optional bool is_required = 4 [default = false];
+
+  // When used with ContentZoomingCalculator, this flag can be set indicating
+  // that areas outside of these salient regions can be cropped from the frame.
+  // When no salient regions have this flag set true, no zooming is performed.
+  // When one or more salient regions have this flag set true, the max zoom
+  // value will be used that keeps all “only_required” detections within view.
+  // The ContentZoomingCalculator currently supports zooming by finding the size
+  // of non-salient top/bottom borders regions and provides this information to
+  // the SceneCroppingCalculator for reframing.
+  optional bool only_required = 5 [default = false];
 }
diff --git a/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator_test.cc b/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator_test.cc
index b0fa65ab4..7e6fa6b2b 100644
--- a/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator_test.cc
+++ b/mediapipe/examples/desktop/autoflip/calculators/signal_fusing_calculator_test.cc
@@ -80,6 +80,27 @@ const char kConfigB[] = R"(
     }
     })";
 
+const char kConfigC[] = R"(
+    calculator: "SignalFusingCalculator"
+    input_stream: "IS_SHOT_BOUNDARY:scene_change"
+    input_stream: "SIGNAL:0:detection_set_a"
+    input_stream: "SIGNAL:1:detection_set_b"
+    output_stream: "OUTPUT:salient_region"
+    options:{
+    [mediapipe.autoflip.SignalFusingCalculatorOptions.ext]:{
+      signal_settings{
+        type: {standard: FACE_FULL}
+        min_score: 0.5
+        max_score: 0.6
+      }
+      signal_settings{
+        type: {standard: TEXT}
+        min_score: 0.9
+        max_score: 1.0
+      }
+    }
+    })";
+
 TEST(SignalFusingCalculatorTest, TwoInputNoTracking) {
   auto runner = absl::make_unique<CalculatorRunner>(
       ParseTextProtoOrDie<CalculatorGraphConfig::Node>(kConfigA));
@@ -133,6 +154,113 @@ TEST(SignalFusingCalculatorTest, TwoInputNoTracking) {
   EXPECT_FLOAT_EQ(detection_set.detections(3).score(), .99);
 }
 
+TEST(SignalFusingCalculatorTest, TwoInputShotLabeledTags) {
+  auto runner = absl::make_unique<CalculatorRunner>(
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(kConfigC));
+
+  auto input_shot = absl::make_unique<bool>(false);
+  runner->MutableInputs()
+      ->Tag("IS_SHOT_BOUNDARY")
+      .packets.push_back(Adopt(input_shot.release()).At(Timestamp(0)));
+
+  auto input_face =
+      absl::make_unique<DetectionSet>(ParseTextProtoOrDie<DetectionSet>(
+          R"(
+            detections {
+              score: 0.5
+              signal_type: { standard: FACE_FULL }
+            }
+            detections {
+              score: 0.3
+              signal_type: { standard: FACE_FULL }
+            }
+          )"));
+
+  runner->MutableInputs()
+      ->Get("SIGNAL", 0)
+      .packets.push_back(Adopt(input_face.release()).At(Timestamp(0)));
+
+  auto input_ocr =
+      absl::make_unique<DetectionSet>(ParseTextProtoOrDie<DetectionSet>(
+          R"(
+            detections {
+              score: 0.3
+              signal_type: { standard: TEXT }
+            }
+            detections {
+              score: 0.9
+              signal_type: { standard: TEXT }
+            }
+          )"));
+
+  runner->MutableInputs()
+      ->Get("SIGNAL", 1)
+      .packets.push_back(Adopt(input_ocr.release()).At(Timestamp(0)));
+
+  MP_ASSERT_OK(runner->Run());
+
+  const std::vector<Packet>& output_packets =
+      runner->Outputs().Tag("OUTPUT").packets;
+  const auto& detection_set = output_packets[0].Get<DetectionSet>();
+
+  ASSERT_EQ(detection_set.detections().size(), 4);
+  EXPECT_FLOAT_EQ(detection_set.detections(0).score(), .55);
+  EXPECT_FLOAT_EQ(detection_set.detections(1).score(), .53);
+  EXPECT_FLOAT_EQ(detection_set.detections(2).score(), .93);
+  EXPECT_FLOAT_EQ(detection_set.detections(3).score(), .99);
+}
+
+TEST(SignalFusingCalculatorTest, TwoInputNoShotLabeledTags) {
+  auto runner = absl::make_unique<CalculatorRunner>(
+      ParseTextProtoOrDie<CalculatorGraphConfig::Node>(kConfigC));
+
+  auto input_face =
+      absl::make_unique<DetectionSet>(ParseTextProtoOrDie<DetectionSet>(
+          R"(
+            detections {
+              score: 0.5
+              signal_type: { standard: FACE_FULL }
+            }
+            detections {
+              score: 0.3
+              signal_type: { standard: FACE_FULL }
+            }
+          )"));
+
+  runner->MutableInputs()
+      ->Get("SIGNAL", 0)
+      .packets.push_back(Adopt(input_face.release()).At(Timestamp(0)));
+
+  auto input_ocr =
+      absl::make_unique<DetectionSet>(ParseTextProtoOrDie<DetectionSet>(
+          R"(
+            detections {
+              score: 0.3
+              signal_type: { standard: TEXT }
+            }
+            detections {
+              score: 0.9
+              signal_type: { standard: TEXT }
+            }
+          )"));
+
+  runner->MutableInputs()
+      ->Get("SIGNAL", 1)
+      .packets.push_back(Adopt(input_ocr.release()).At(Timestamp(0)));
+
+  MP_ASSERT_OK(runner->Run());
+
+  const std::vector<Packet>& output_packets =
+      runner->Outputs().Tag("OUTPUT").packets;
+  const auto& detection_set = output_packets[0].Get<DetectionSet>();
+
+  ASSERT_EQ(detection_set.detections().size(), 4);
+  EXPECT_FLOAT_EQ(detection_set.detections(0).score(), .55);
+  EXPECT_FLOAT_EQ(detection_set.detections(1).score(), .53);
+  EXPECT_FLOAT_EQ(detection_set.detections(2).score(), .93);
+  EXPECT_FLOAT_EQ(detection_set.detections(3).score(), .99);
+}
+
 TEST(SignalFusingCalculatorTest, ThreeInputTracking) {
   auto runner = absl::make_unique<CalculatorRunner>(
       ParseTextProtoOrDie<CalculatorGraphConfig::Node>(kConfigB));
diff --git a/mediapipe/examples/desktop/autoflip/quality/BUILD b/mediapipe/examples/desktop/autoflip/quality/BUILD
index d1f3aee81..4d79b92de 100644
--- a/mediapipe/examples/desktop/autoflip/quality/BUILD
+++ b/mediapipe/examples/desktop/autoflip/quality/BUILD
@@ -23,17 +23,33 @@ proto_library(
     srcs = ["cropping.proto"],
     deps = [
         "//mediapipe/examples/desktop/autoflip:autoflip_messages_proto",
+        "//mediapipe/examples/desktop/autoflip/quality:kinematic_path_solver_proto",
     ],
 )
 
 mediapipe_cc_proto_library(
     name = "cropping_cc_proto",
     srcs = ["cropping.proto"],
-    cc_deps = ["//mediapipe/examples/desktop/autoflip:autoflip_messages_cc_proto"],
+    cc_deps = [
+        ":kinematic_path_solver_cc_proto",
+        "//mediapipe/examples/desktop/autoflip:autoflip_messages_cc_proto",
+    ],
     visibility = ["//mediapipe/examples:__subpackages__"],
     deps = [":cropping_proto"],
 )
 
+proto_library(
+    name = "kinematic_path_solver_proto",
+    srcs = ["kinematic_path_solver.proto"],
+)
+
+mediapipe_cc_proto_library(
+    name = "kinematic_path_solver_cc_proto",
+    srcs = ["kinematic_path_solver.proto"],
+    visibility = ["//mediapipe/examples:__subpackages__"],
+    deps = [":kinematic_path_solver_proto"],
+)
+
 proto_library(
     name = "focus_point_proto",
     srcs = ["focus_point.proto"],
@@ -142,6 +158,29 @@ cc_library(
     ],
 )
 
+cc_library(
+    name = "kinematic_path_solver",
+    srcs = ["kinematic_path_solver.cc"],
+    hdrs = ["kinematic_path_solver.h"],
+    deps = [
+        ":kinematic_path_solver_cc_proto",
+        "//mediapipe/framework/port:integral_types",
+        "//mediapipe/framework/port:ret_check",
+        "//mediapipe/framework/port:status",
+    ],
+)
+
+cc_test(
+    name = "kinematic_path_solver_test",
+    srcs = ["kinematic_path_solver_test.cc"],
+    deps = [
+        ":kinematic_path_solver",
+        "//mediapipe/framework/port:gtest_main",
+        "//mediapipe/framework/port:integral_types",
+        "//mediapipe/framework/port:status",
+    ],
+)
+
 cc_library(
     name = "scene_cropper",
     srcs = ["scene_cropper.cc"],
@@ -149,6 +188,7 @@ cc_library(
     deps = [
         ":cropping_cc_proto",
         ":focus_point_cc_proto",
+        ":kinematic_path_solver",
         ":polynomial_regression_path_solver",
         ":utils",
         "//mediapipe/framework/port:opencv_core",
diff --git a/mediapipe/examples/desktop/autoflip/quality/cropping.proto b/mediapipe/examples/desktop/autoflip/quality/cropping.proto
index 3293d7502..f8a62b247 100644
--- a/mediapipe/examples/desktop/autoflip/quality/cropping.proto
+++ b/mediapipe/examples/desktop/autoflip/quality/cropping.proto
@@ -17,6 +17,7 @@ syntax = "proto2";
 package mediapipe.autoflip;
 
 import "mediapipe/examples/desktop/autoflip/autoflip_messages.proto";
+import "mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.proto";
 
 // All relevant information for key frames, including timestamp and detected
 // features. This object should be generated by calling PackKeyFrameInfo() in
@@ -77,6 +78,8 @@ message KeyFrameCropResult {
   optional Rect region = 6;
   // Score of the computed crop region based on the detected features.
   optional float region_score = 7;
+  // Frame timestamp (in microseconds; NOTE(review): the `_ms` suffix suggests milliseconds - confirm the unit).
+  optional int64 timestamp_ms = 8;
 }
 
 // Compact processed scene key frame info containing timestamp, center position,
@@ -172,6 +175,7 @@ message SceneCameraMotion {
 // User-specified options for analyzing scene camera motion from a collection of
 // key frame crop regions.
 message SceneCameraMotionAnalyzerOptions {
+  reserved 9;
   // If there is small motion within the scene keep the camera steady at the
   // center.
   optional float motion_stabilization_threshold_percent = 1 [default = .30];
@@ -196,6 +200,11 @@ message SceneCameraMotionAnalyzerOptions {
   optional float minimum_success_rate_for_sweeping = 7 [default = 0.4];
   // If true, sweep entire frame. Otherwise, sweep the crop window.
   optional bool sweep_entire_frame = 8 [default = true];
+  // When no salient region is received, the default behavior is to return the
+  // camera to center-focused location.  When this flag is set to a value >0,
+  // the camera will remain at its last position for this amount of time before
+  // recentering (if the last scene camera motion type was steady).
+  optional int64 duration_before_centering_us = 10;
 }
 
 // Video cropping summary information for debugging/statistics.
@@ -215,3 +224,18 @@ message VideoCroppingSummary {
   // Cropping summaries for all the scenes in the video.
   repeated SceneCroppingSummary scene_summaries = 1;
 }
+
+message CameraMotionOptions {
+  message PolynomialRegressionPathSolver {
+    // Number of frames from prior buffer to be used to smooth out camera
+    // trajectory when it was a forced flush.
+    optional int32 prior_frame_buffer_size = 1 [default = 30];
+  }
+  oneof camera_model_oneof {
+    // Fits a poly line to keypoints to find a smooth camera path.
+    PolynomialRegressionPathSolver polynomial_path_solver = 1;
+    // Maintains a kinematic state of the camera, updated with keypoints, to
+    // find a smooth camera path.  Currently optimized for real-time operation.
+    KinematicOptions kinematic_options = 2;
+  }
+}
diff --git a/mediapipe/examples/desktop/autoflip/quality/frame_crop_region_computer.cc b/mediapipe/examples/desktop/autoflip/quality/frame_crop_region_computer.cc
index 3e391fc87..0b57cd0da 100644
--- a/mediapipe/examples/desktop/autoflip/quality/frame_crop_region_computer.cc
+++ b/mediapipe/examples/desktop/autoflip/quality/frame_crop_region_computer.cc
@@ -171,6 +171,9 @@ void FrameCropRegionComputer::UpdateCropRegionScore(
     const KeyFrameInfo& frame_info, KeyFrameCropResult* crop_result) const {
   RET_CHECK(crop_result != nullptr) << "KeyFrameCropResult is null.";
 
+  // Set timestamp of KeyFrameCropResult
+  crop_result->set_timestamp_ms(frame_info.timestamp_ms());
+
   // Sorts required and non-required regions.
   std::vector<SalientRegion> required_regions, non_required_regions;
   const auto sort_status = SortDetections(
@@ -180,7 +183,6 @@ void FrameCropRegionComputer::UpdateCropRegionScore(
   int target_width = options_.target_width();
   int target_height = options_.target_height();
   auto* region = crop_result->mutable_region();
-  RET_CHECK(region != nullptr) << "Crop region is null.";
 
   bool crop_region_is_empty = true;
   float crop_region_score = 0.0;
diff --git a/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.cc b/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.cc
new file mode 100644
index 000000000..340c4b253
--- /dev/null
+++ b/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.cc
@@ -0,0 +1,76 @@
+#include "mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.h"
+
+namespace mediapipe {
+namespace autoflip {
+
+::mediapipe::Status KinematicPathSolver::AddObservation(int position,
+                                                        const uint64 time_us) {
+  if (!initialized_) {
+    current_position_px_ = position;
+    current_time_ = time_us;
+    initialized_ = true;
+    current_velocity_deg_per_s_ = 0;
+    return ::mediapipe::OkStatus();
+  }
+
+  RET_CHECK(current_time_ < time_us)
+      << "Observation added before a prior observations.";
+
+  double delta_degs = (position - current_position_px_) / pixels_per_degree_;
+
+  // If the motion is smaller than the min, don't use the update.
+  if (abs(delta_degs) < options_.min_motion_to_reframe()) {
+    position = current_position_px_;
+    delta_degs = 0;
+  }
+
+  // Time and position updates.
+  double delta_t = (time_us - current_time_) / 1000000.0;
+
+  // Observed velocity and then weighted update of this velocity.
+  double observed_velocity = delta_degs / delta_t;
+  double updated_velocity =
+      current_velocity_deg_per_s_ * (1 - options_.update_rate()) +
+      observed_velocity * options_.update_rate();
+  // Limited current velocity.
+  current_velocity_deg_per_s_ =
+      updated_velocity > 0 ? fmin(updated_velocity, options_.max_velocity())
+                           : fmax(updated_velocity, -options_.max_velocity());
+
+  // Update prediction based on time input.
+  return UpdatePrediction(time_us);
+}
+
+::mediapipe::Status KinematicPathSolver::UpdatePrediction(const int64 time_us) {
+  RET_CHECK(current_time_ < time_us)
+      << "Prediction time added before a prior observation or prediction.";
+  // Time since last state/prediction update.
+  double delta_t = (time_us - current_time_) / 1000000.0;
+
+  // Position update limited by min/max.
+
+  const double update_position_px =
+      current_position_px_ +
+      current_velocity_deg_per_s_ * delta_t * pixels_per_degree_;
+  if (update_position_px < min_location_) {
+    current_position_px_ = min_location_;
+    current_velocity_deg_per_s_ = 0;
+  } else if (update_position_px > max_location_) {
+    current_position_px_ = max_location_;
+    current_velocity_deg_per_s_ = 0;
+  } else {
+    current_position_px_ = update_position_px;
+  }
+  current_time_ = time_us;
+
+  return ::mediapipe::OkStatus();
+}
+
+::mediapipe::Status KinematicPathSolver::GetState(int* position) {
+  RET_CHECK(initialized_) << "GetState called before first observation added.";
+  *position = round(current_position_px_);
+  return ::mediapipe::OkStatus();
+}
+
+}  // namespace autoflip
+}  // namespace mediapipe
diff --git a/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.h b/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.h
new file mode 100644
index 000000000..2dcd9e520
--- /dev/null
+++ b/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.h
@@ -0,0 +1,67 @@
+// Copyright 2019 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef MEDIAPIPE_EXAMPLES_DESKTOP_AUTOFLIP_QUALITY_UNIFORM_ACCELERATION_PATH_SOLVER_H_
+#define MEDIAPIPE_EXAMPLES_DESKTOP_AUTOFLIP_QUALITY_UNIFORM_ACCELERATION_PATH_SOLVER_H_
+
+#include "mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.pb.h"
+#include "mediapipe/framework/port/integral_types.h"
+#include "mediapipe/framework/port/ret_check.h"
+#include "mediapipe/framework/port/status.h"
+
+namespace mediapipe {
+namespace autoflip {
+
+// Kinematic path solver class is a stateful 1d position estimator based loosely
+// on a differential kalman filter that is specifically designed to control a
+// camera.  It utilizes a Kalman filters predict/update interface for estimating
+// the best camera focus position and updating that estimate when a measurement
+// is available.  Tuning controls include: update_rate: how much to update the
+// existing state with a new state. max_velocity: max speed of the state per
+// second. min_motion_to_reframe: only updating the state if a measurement
+// exceeds this threshold.
+class KinematicPathSolver {
+ public:
+  KinematicPathSolver(const KinematicOptions& options, const int min_location,
+                      const int max_location, float pixels_per_degree)
+      : options_(options),
+        min_location_(min_location),
+        max_location_(max_location),
+        initialized_(false),
+        pixels_per_degree_(pixels_per_degree) {}
+  // Add an observation (detection) at a position (px) and time (us).
+  ::mediapipe::Status AddObservation(int position, const uint64 time_us);
+  // Advance the state to time_us using the current velocity (no measurement).
+  ::mediapipe::Status UpdatePrediction(const int64 time_us);
+  // Get the current position (rounded px); fails before the first observation.
+  ::mediapipe::Status GetState(int* position);
+
+ private:
+  // Tuning options.
+  KinematicOptions options_;
+  // Min and max value the state can be.
+  const int min_location_;
+  const int max_location_;
+  bool initialized_;
+  float pixels_per_degree_;
+  // Current state values; zeroed so no call ever reads an indeterminate value.
+  double current_position_px_ = 0;
+  double current_velocity_deg_per_s_ = 0;
+  uint64 current_time_ = 0;
+};
+
+}  // namespace autoflip
+}  // namespace mediapipe
+
+#endif  // MEDIAPIPE_EXAMPLES_DESKTOP_AUTOFLIP_QUALITY_UNIFORM_ACCELERATION_PATH_SOLVER_H_
diff --git a/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.proto b/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.proto
new file mode 100644
index 000000000..eda04c4b1
--- /dev/null
+++ b/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.proto
@@ -0,0 +1,13 @@
+syntax = "proto2";
+
+package mediapipe.autoflip;
+
+message KinematicOptions {
+  // Blend weight for the velocity update: new velocity = current velocity *
+  // (1 - update_rate) + observed velocity * update_rate.
+  optional double update_rate = 1 [default = 0.5];
+  // Max speed (degrees per second) of the camera; velocity is clamped to it.
+  optional double max_velocity = 2 [default = 18];
+  // Min motion (in degrees) an observation must show before the camera reacts.
+  optional float min_motion_to_reframe = 3 [default = 1.8];
+}
diff --git a/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver_test.cc b/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver_test.cc
new file mode 100644
index 000000000..5d5717589
--- /dev/null
+++ b/mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver_test.cc
@@ -0,0 +1,140 @@
+// Copyright 2019 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.h"
+
+#include "mediapipe/framework/port/gmock.h"
+#include "mediapipe/framework/port/gtest.h"
+#include "mediapipe/framework/port/integral_types.h"
+#include "mediapipe/framework/port/status.h"
+#include "mediapipe/framework/port/status_matchers.h"
+
+constexpr int64 kMicroSecInSec = 1000000;  // Microseconds per second.
+constexpr float kWidthFieldOfView = 60;  // Horizontal field of view, degrees.
+
+namespace mediapipe {
+namespace autoflip {
+namespace {
+
+TEST(KinematicPathSolverTest, FailNotInitializedState) {
+  KinematicOptions options;
+  KinematicPathSolver solver(options, 0, 1000, 1000.0 / kWidthFieldOfView);
+  int state;
+  EXPECT_FALSE(solver.GetState(&state).ok());  // No observation added yet.
+}
+
+TEST(KinematicPathSolverTest, FailNotInitializedPrediction) {
+  KinematicOptions options;
+  KinematicPathSolver solver(options, 0, 1000, 1000.0 / kWidthFieldOfView);
+  int64 timestamp = 0;
+  EXPECT_FALSE(solver.UpdatePrediction(timestamp).ok());  // No observation yet.
+}
+
+TEST(KinematicPathSolverTest, PassNotEnoughMotionLargeImg) {
+  KinematicOptions options;
+  // Set min motion to 2deg
+  options.set_min_motion_to_reframe(2.0);
+  options.set_update_rate(1);
+  options.set_max_velocity(1000);
+  // Set pixels / degree to 16.6 (1000px / 60deg)
+  KinematicPathSolver solver(options, 0, 1000, 1000.0 / kWidthFieldOfView);
+  int state;
+  MP_ASSERT_OK(solver.AddObservation(500, kMicroSecInSec * 0));
+  // Move target by 20px / 16.6 = 1.2deg, below the 2deg min motion
+  MP_ASSERT_OK(solver.AddObservation(520, kMicroSecInSec * 1));
+  MP_ASSERT_OK(solver.GetState(&state));
+  // Expect cam to not move.
+  EXPECT_EQ(state, 500);
+}
+
+TEST(KinematicPathSolverTest, PassNotEnoughMotionSmallImg) {
+  KinematicOptions options;
+  // Set min motion to 2deg
+  options.set_min_motion_to_reframe(2.0);
+  options.set_update_rate(1);
+  options.set_max_velocity(500);
+  // Set pixels / degree to 8.3 (500px / 60deg)
+  KinematicPathSolver solver(options, 0, 500, 500.0 / kWidthFieldOfView);
+  int state;
+  MP_ASSERT_OK(solver.AddObservation(400, kMicroSecInSec * 0));
+  // Move target by 10px / 8.3 = 1.2deg, below the 2deg min motion
+  MP_ASSERT_OK(solver.AddObservation(410, kMicroSecInSec * 1));
+  MP_ASSERT_OK(solver.GetState(&state));
+  // Expect cam to not move.
+  EXPECT_EQ(state, 400);
+}
+
+TEST(KinematicPathSolverTest, PassEnoughMotionLargeImg) {
+  KinematicOptions options;
+  // Set min motion to 1deg
+  options.set_min_motion_to_reframe(1.0);
+  options.set_update_rate(1);
+  options.set_max_velocity(1000);
+  // Set pixels / degree to 16.6 (1000px / 60deg)
+  KinematicPathSolver solver(options, 0, 1000, 1000.0 / kWidthFieldOfView);
+  int state;
+  MP_ASSERT_OK(solver.AddObservation(500, kMicroSecInSec * 0));
+  // Move target by 20px / 16.6 = 1.2deg, above the 1deg min motion
+  MP_ASSERT_OK(solver.AddObservation(520, kMicroSecInSec * 1));
+  MP_ASSERT_OK(solver.GetState(&state));
+  // Expect cam to move.
+  EXPECT_EQ(state, 520);
+}
+
+TEST(KinematicPathSolverTest, PassEnoughMotionSmallImg) {
+  KinematicOptions options;
+  // Set min motion to 1deg
+  options.set_min_motion_to_reframe(1.0);
+  options.set_update_rate(1);
+  options.set_max_velocity(18);
+  // Set pixels / degree to 8.3 (500px / 60deg)
+  KinematicPathSolver solver(options, 0, 500, 500.0 / kWidthFieldOfView);
+  int state;
+  MP_ASSERT_OK(solver.AddObservation(400, kMicroSecInSec * 0));
+  // Move target by 10px / 8.3 = 1.2deg, above the 1deg min motion
+  MP_ASSERT_OK(solver.AddObservation(410, kMicroSecInSec * 1));
+  MP_ASSERT_OK(solver.GetState(&state));
+  // Expect cam to move.
+  EXPECT_EQ(state, 410);
+}
+
+TEST(KinematicPathSolverTest, PassUpdateRate) {
+  KinematicOptions options;
+  options.set_min_motion_to_reframe(1.0);
+  options.set_update_rate(0.25);
+  options.set_max_velocity(18);
+  KinematicPathSolver solver(options, 0, 1000, 1000.0 / kWidthFieldOfView);
+  int state;
+  MP_ASSERT_OK(solver.AddObservation(500, kMicroSecInSec * 0));
+  MP_ASSERT_OK(solver.AddObservation(520, kMicroSecInSec * 1));
+  MP_ASSERT_OK(solver.GetState(&state));
+  EXPECT_EQ(state, 505);  // Only update_rate (0.25) of the 20px is applied.
+}
+
+TEST(KinematicPathSolverTest, PassMaxVelocity) {
+  KinematicOptions options;
+  options.set_min_motion_to_reframe(1.0);
+  options.set_update_rate(1.0);
+  options.set_max_velocity(6);
+  KinematicPathSolver solver(options, 0, 1000, 1000.0 / kWidthFieldOfView);
+  int state;
+  MP_ASSERT_OK(solver.AddObservation(500, kMicroSecInSec * 0));
+  MP_ASSERT_OK(solver.AddObservation(1000, kMicroSecInSec * 1));
+  MP_ASSERT_OK(solver.GetState(&state));
+  EXPECT_EQ(state, 600);  // Capped at 6 deg/s * 16.6 px/deg = 100px in 1s.
+}
+
+}  // namespace
+}  // namespace autoflip
+}  // namespace mediapipe
diff --git a/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer.cc b/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer.cc
index ff519785a..34f1a4ee6 100644
--- a/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer.cc
+++ b/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer.cc
@@ -32,17 +32,19 @@ namespace autoflip {
 
 ::mediapipe::Status
 SceneCameraMotionAnalyzer::AnalyzeSceneAndPopulateFocusPointFrames(
-    const std::vector<KeyFrameInfo>& key_frame_infos,
     const KeyFrameCropOptions& key_frame_crop_options,
     const std::vector<KeyFrameCropResult>& key_frame_crop_results,
     const int scene_frame_width, const int scene_frame_height,
     const std::vector<int64>& scene_frame_timestamps,
+    const bool has_solid_color_background,
     SceneKeyFrameCropSummary* scene_summary,
     std::vector<FocusPointFrame>* focus_point_frames,
-    SceneCameraMotion* scene_camera_motion) const {
+    SceneCameraMotion* scene_camera_motion) {
+  has_solid_color_background_ = has_solid_color_background;
+  total_scene_frames_ = scene_frame_timestamps.size();
   MP_RETURN_IF_ERROR(AggregateKeyFrameResults(
-      key_frame_infos, key_frame_crop_options, key_frame_crop_results,
-      scene_frame_width, scene_frame_height, scene_summary));
+      key_frame_crop_options, key_frame_crop_results, scene_frame_width,
+      scene_frame_height, scene_summary));
 
   const int64 scene_span_ms =
       scene_frame_timestamps.empty()
@@ -51,7 +53,12 @@ SceneCameraMotionAnalyzer::AnalyzeSceneAndPopulateFocusPointFrames(
   const double scene_span_sec = TimestampDiff(scene_span_ms).Seconds();
   SceneCameraMotion camera_motion;
   MP_RETURN_IF_ERROR(DecideCameraMotionType(
-      key_frame_crop_options, scene_span_sec, scene_summary, &camera_motion));
+      key_frame_crop_options, scene_span_sec, scene_frame_timestamps.back(),
+      scene_summary, &camera_motion));
+  if (scene_summary->has_salient_region()) {
+    last_scene_with_salient_region_ = camera_motion;
+    time_since_last_salient_region_us_ = scene_frame_timestamps.back();
+  }
   if (scene_camera_motion != nullptr) {
     *scene_camera_motion = camera_motion;
   }
@@ -97,7 +104,8 @@ SceneCameraMotionAnalyzer::AnalyzeSceneAndPopulateFocusPointFrames(
 
 ::mediapipe::Status SceneCameraMotionAnalyzer::DecideCameraMotionType(
     const KeyFrameCropOptions& key_frame_crop_options,
-    const double scene_span_sec, SceneKeyFrameCropSummary* scene_summary,
+    const double scene_span_sec, const int64 end_time_us,
+    SceneKeyFrameCropSummary* scene_summary,
     SceneCameraMotion* scene_camera_motion) const {
   RET_CHECK_GE(scene_span_sec, 0.0) << "Scene time span is negative.";
   RET_CHECK_NE(scene_summary, nullptr) << "Scene summary is null.";
@@ -109,8 +117,18 @@ SceneCameraMotionAnalyzer::AnalyzeSceneAndPopulateFocusPointFrames(
   // regions, then default to look at the center.
   if (!scene_summary->has_salient_region()) {
     VLOG(1) << "No focus regions - camera is set to be steady on center.";
+    float no_salient_position_x = scene_frame_center_x;
+    float no_salient_position_y = scene_frame_center_y;
+    if (end_time_us - time_since_last_salient_region_us_ <
+            options_.duration_before_centering_us() &&
+        last_scene_with_salient_region_.has_steady_motion()) {
+      no_salient_position_x = last_scene_with_salient_region_.steady_motion()
+                                  .steady_look_at_center_x();
+      no_salient_position_y = last_scene_with_salient_region_.steady_motion()
+                                  .steady_look_at_center_y();
+    }
     MP_RETURN_IF_ERROR(ToUseSteadyMotion(
-        scene_frame_center_x, scene_frame_center_y,
+        no_salient_position_x, no_salient_position_y,
         scene_summary->crop_window_width(), scene_summary->crop_window_height(),
         scene_summary, scene_camera_motion));
     return ::mediapipe::OkStatus();
@@ -118,7 +136,7 @@ SceneCameraMotionAnalyzer::AnalyzeSceneAndPopulateFocusPointFrames(
 
   // Sweep across the scene when 1) success rate is too low, AND 2) the current
   // scene is long enough.
-  if (options_.allow_sweeping() &&
+  if (options_.allow_sweeping() && !has_solid_color_background_ &&
       scene_summary->frame_success_rate() <
           options_.minimum_success_rate_for_sweeping() &&
       scene_span_sec >= options_.minimum_scene_span_sec_for_sweeping()) {
@@ -150,10 +168,11 @@ SceneCameraMotionAnalyzer::AnalyzeSceneAndPopulateFocusPointFrames(
   }
 
   // If scene motion is small, then look at a steady point in the scene.
-  if (scene_summary->horizontal_motion_amount() <
-          options_.motion_stabilization_threshold_percent() &&
-      scene_summary->vertical_motion_amount() <
-          options_.motion_stabilization_threshold_percent()) {
+  if ((scene_summary->horizontal_motion_amount() <
+           options_.motion_stabilization_threshold_percent() &&
+       scene_summary->vertical_motion_amount() <
+           options_.motion_stabilization_threshold_percent()) ||
+      total_scene_frames_ == 1) {
     return DecideSteadyLookAtRegion(key_frame_crop_options, scene_summary,
                                     scene_camera_motion);
   }
diff --git a/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer.h b/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer.h
index 6ffcb2c84..4aca2108c 100644
--- a/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer.h
+++ b/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer.h
@@ -53,7 +53,9 @@ class SceneCameraMotionAnalyzer {
 
   explicit SceneCameraMotionAnalyzer(const SceneCameraMotionAnalyzerOptions&
                                          scene_camera_motion_analyzer_options)
-      : options_(scene_camera_motion_analyzer_options) {}
+      : options_(scene_camera_motion_analyzer_options),
+        time_since_last_salient_region_us_(0),
+        has_solid_color_background_(false) {}
 
   ~SceneCameraMotionAnalyzer() {}
 
@@ -61,21 +63,22 @@ class SceneCameraMotionAnalyzer {
   // SceneKeyFrameCropSummary, and populates FocusPointFrames given scene
   // frame timestamps. Optionally returns SceneCameraMotion.
   ::mediapipe::Status AnalyzeSceneAndPopulateFocusPointFrames(
-      const std::vector<KeyFrameInfo>& key_frame_infos,
       const KeyFrameCropOptions& key_frame_crop_options,
       const std::vector<KeyFrameCropResult>& key_frame_crop_results,
       const int scene_frame_width, const int scene_frame_height,
       const std::vector<int64>& scene_frame_timestamps,
+      const bool has_solid_color_background,
       SceneKeyFrameCropSummary* scene_summary,
       std::vector<FocusPointFrame>* focus_point_frames,
-      SceneCameraMotion* scene_camera_motion = nullptr) const;
+      SceneCameraMotion* scene_camera_motion = nullptr);
 
  protected:
   // Decides SceneCameraMotion based on SceneKeyFrameCropSummary. Updates the
   // crop window in SceneKeyFrameCropSummary in the case of steady motion.
   ::mediapipe::Status DecideCameraMotionType(
       const KeyFrameCropOptions& key_frame_crop_options,
-      const double scene_span_sec, SceneKeyFrameCropSummary* scene_summary,
+      const double scene_span_sec, const int64 end_time_us,
+      SceneKeyFrameCropSummary* scene_summary,
       SceneCameraMotion* scene_camera_motion) const;
 
   // Populates the FocusPointFrames for each scene frame based on
@@ -134,6 +137,16 @@ class SceneCameraMotionAnalyzer {
 
   // Scene camera motion analyzer options.
   SceneCameraMotionAnalyzerOptions options_;
+
+  // Last position
+  SceneCameraMotion last_scene_with_salient_region_;
+  int64 time_since_last_salient_region_us_;
+
+  // Scene has solid color background.
+  bool has_solid_color_background_;
+
+  // Total number of frames for this scene.
+  int total_scene_frames_;
 };
 
 }  // namespace autoflip
diff --git a/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer_test.cc b/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer_test.cc
index e8df355b7..f24a2f22d 100644
--- a/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer_test.cc
+++ b/mediapipe/examples/desktop/autoflip/quality/scene_camera_motion_analyzer_test.cc
@@ -63,16 +63,6 @@ Rect MakeRect(const int x, const int y, const int width, const int height) {
   return rect;
 }
 
-// Returns default values for KeyFrameInfos. Populates timestamps using the
-// default spacing kKeyFrameTimestampDiff starting from 0.
-std::vector<KeyFrameInfo> GetDefaultKeyFrameInfos() {
-  std::vector<KeyFrameInfo> key_frame_infos(kNumKeyFrames);
-  for (int i = 0; i < kNumKeyFrames; ++i) {
-    key_frame_infos[i].set_timestamp_ms(kKeyFrameTimestampDiff * i);
-  }
-  return key_frame_infos;
-}
-
 // Returns default values for scene frame timestamps. Populates timestamps using
 // the default spacing kSceneFrameTimestampDiff starting from 0.
 std::vector<int64> GetDefaultSceneFrameTimestamps() {
@@ -108,6 +98,7 @@ std::vector<KeyFrameCropResult> GetDefaultKeyFrameCropResults() {
     *(key_frame_crop_results[i].mutable_required_region()) =
         MakeRect(10, 10, 20, 20);
     key_frame_crop_results[i].set_region_score(1.0);
+    key_frame_crop_results[i].set_timestamp_ms(kKeyFrameTimestampDiff * i);
   }
   return key_frame_crop_results;
 }
@@ -183,10 +174,10 @@ TEST(SceneCameraMotionAnalyzerTest, DecideCameraMotionTypeChecksOutputNotNull) {
   SceneKeyFrameCropSummary scene_summary;
   SceneCameraMotion camera_motion;
   auto status = analyzer.DecideCameraMotionType(crop_options, kSceneTimeSpanSec,
-                                                nullptr, &camera_motion);
+                                                0, nullptr, &camera_motion);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(), HasSubstr("Scene summary is null."));
-  status = analyzer.DecideCameraMotionType(crop_options, kSceneTimeSpanSec,
+  status = analyzer.DecideCameraMotionType(crop_options, kSceneTimeSpanSec, 0,
                                            &scene_summary, nullptr);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(), HasSubstr("Scene camera motion is null."));
@@ -204,8 +195,8 @@ TEST(SceneCameraMotionAnalyzerTest,
   scene_summary.set_has_salient_region(false);
   SceneCameraMotion camera_motion;
 
-  MP_EXPECT_OK(analyzer.DecideCameraMotionType(crop_options, kSceneTimeSpanSec,
-                                               &scene_summary, &camera_motion));
+  MP_EXPECT_OK(analyzer.DecideCameraMotionType(
+      crop_options, kSceneTimeSpanSec, 0, &scene_summary, &camera_motion));
   EXPECT_TRUE(camera_motion.has_steady_motion());
   const auto& steady_motion = camera_motion.steady_motion();
   EXPECT_FLOAT_EQ(steady_motion.steady_look_at_center_x(),
@@ -229,7 +220,7 @@ TEST(SceneCameraMotionAnalyzerTest, DecideCameraMotionTypeSweepingLeftToRight) {
   SceneCameraMotion camera_motion;
 
   MP_EXPECT_OK(analyzer.DecideCameraMotionType(GetDefaultKeyFrameCropOptions(),
-                                               time_span, &scene_summary,
+                                               time_span, 0, &scene_summary,
                                                &camera_motion));
 
   EXPECT_TRUE(camera_motion.has_sweeping_motion());
@@ -258,7 +249,7 @@ TEST(SceneCameraMotionAnalyzerTest, DecideCameraMotionTypeSweepingTopToBottom) {
   SceneCameraMotion camera_motion;
 
   MP_EXPECT_OK(analyzer.DecideCameraMotionType(GetDefaultKeyFrameCropOptions(),
-                                               time_span, &scene_summary,
+                                               time_span, 0, &scene_summary,
                                                &camera_motion));
 
   EXPECT_TRUE(camera_motion.has_sweeping_motion());
@@ -287,7 +278,7 @@ TEST(SceneCameraMotionAnalyzerTest, DecideCameraMotionTypeSweepingCenterRange) {
   SceneCameraMotion camera_motion;
 
   MP_EXPECT_OK(analyzer.DecideCameraMotionType(GetDefaultKeyFrameCropOptions(),
-                                               time_span, &scene_summary,
+                                               time_span, 0, &scene_summary,
                                                &camera_motion));
 
   EXPECT_TRUE(camera_motion.has_sweeping_motion());
@@ -316,7 +307,7 @@ TEST(SceneCameraMotionAnalyzerTest,
   SceneCameraMotion camera_motion;
 
   MP_EXPECT_OK(analyzer.DecideCameraMotionType(GetDefaultKeyFrameCropOptions(),
-                                               kSceneTimeSpanSec,
+                                               kSceneTimeSpanSec, 0,
                                                &scene_summary, &camera_motion));
   EXPECT_TRUE(camera_motion.has_steady_motion());
   EXPECT_EQ(camera_motion.steady_motion().steady_look_at_center_x(),
@@ -341,7 +332,7 @@ TEST(SceneCameraMotionAnalyzerTest,
   SceneCameraMotion camera_motion;
 
   MP_EXPECT_OK(analyzer.DecideCameraMotionType(GetDefaultKeyFrameCropOptions(),
-                                               kSceneTimeSpanSec,
+                                               kSceneTimeSpanSec, 0,
                                                &scene_summary, &camera_motion));
   EXPECT_TRUE(camera_motion.has_steady_motion());
   EXPECT_EQ(camera_motion.steady_motion().steady_look_at_center_x(),
@@ -366,7 +357,7 @@ TEST(SceneCameraMotionAnalyzerTest,
   SceneCameraMotion camera_motion;
 
   MP_EXPECT_OK(analyzer.DecideCameraMotionType(GetDefaultKeyFrameCropOptions(),
-                                               kSceneTimeSpanSec,
+                                               kSceneTimeSpanSec, 0,
                                                &scene_summary, &camera_motion));
   EXPECT_TRUE(camera_motion.has_steady_motion());
   EXPECT_EQ(camera_motion.steady_motion().steady_look_at_center_x(),
@@ -391,8 +382,8 @@ TEST(SceneCameraMotionAnalyzerTest,
   scene_summary.set_key_frame_center_max_x(frame_center_x);
   SceneCameraMotion camera_motion;
 
-  MP_EXPECT_OK(analyzer.DecideCameraMotionType(crop_options, kSceneTimeSpanSec,
-                                               &scene_summary, &camera_motion));
+  MP_EXPECT_OK(analyzer.DecideCameraMotionType(
+      crop_options, kSceneTimeSpanSec, 0, &scene_summary, &camera_motion));
   EXPECT_TRUE(camera_motion.has_steady_motion());
   EXPECT_FLOAT_EQ(camera_motion.steady_motion().steady_look_at_center_x(),
                   frame_center_x);
@@ -409,7 +400,7 @@ TEST(SceneCameraMotionAnalyzerTest, DecideCameraMotionTypeTracking) {
   SceneCameraMotion camera_motion;
 
   MP_EXPECT_OK(analyzer.DecideCameraMotionType(GetDefaultKeyFrameCropOptions(),
-                                               kSceneTimeSpanSec,
+                                               kSceneTimeSpanSec, 0,
                                                &scene_summary, &camera_motion));
   EXPECT_TRUE(camera_motion.has_tracking_motion());
 }
@@ -785,9 +776,9 @@ TEST(SceneCameraMotionAnalyzerTest, AnalyzeSceneAndPopulateFocusPointFrames) {
   std::vector<FocusPointFrame> focus_point_frames;
 
   MP_EXPECT_OK(analyzer.AnalyzeSceneAndPopulateFocusPointFrames(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      GetDefaultKeyFrameCropResults(), kSceneFrameWidth, kSceneFrameHeight,
-      GetDefaultSceneFrameTimestamps(), &scene_summary, &focus_point_frames));
+      GetDefaultKeyFrameCropOptions(), GetDefaultKeyFrameCropResults(),
+      kSceneFrameWidth, kSceneFrameHeight, GetDefaultSceneFrameTimestamps(),
+      false, &scene_summary, &focus_point_frames));
   EXPECT_EQ(scene_summary.num_key_frames(), kNumKeyFrames);
   EXPECT_EQ(focus_point_frames.size(), kNumSceneFrames);
 }
@@ -803,10 +794,9 @@ TEST(SceneCameraMotionAnalyzerTest,
   SceneCameraMotion scene_camera_motion;
 
   MP_EXPECT_OK(analyzer.AnalyzeSceneAndPopulateFocusPointFrames(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      GetDefaultKeyFrameCropResults(), kSceneFrameWidth, kSceneFrameHeight,
-      GetDefaultSceneFrameTimestamps(), &scene_summary, &focus_point_frames,
-      &scene_camera_motion));
+      GetDefaultKeyFrameCropOptions(), GetDefaultKeyFrameCropResults(),
+      kSceneFrameWidth, kSceneFrameHeight, GetDefaultSceneFrameTimestamps(),
+      false, &scene_summary, &focus_point_frames, &scene_camera_motion));
   EXPECT_TRUE(scene_camera_motion.has_steady_motion());
 }
 
diff --git a/mediapipe/examples/desktop/autoflip/quality/scene_cropper.cc b/mediapipe/examples/desktop/autoflip/quality/scene_cropper.cc
index d70b7d677..acb66ced6 100644
--- a/mediapipe/examples/desktop/autoflip/quality/scene_cropper.cc
+++ b/mediapipe/examples/desktop/autoflip/quality/scene_cropper.cc
@@ -14,6 +14,8 @@
 
 #include "mediapipe/examples/desktop/autoflip/quality/scene_cropper.h"
 
+#include <memory>
+
 #include "absl/memory/memory.h"
 #include "mediapipe/examples/desktop/autoflip/quality/polynomial_regression_path_solver.h"
 #include "mediapipe/examples/desktop/autoflip/quality/utils.h"
@@ -21,17 +23,74 @@
 #include "mediapipe/framework/port/ret_check.h"
 #include "mediapipe/framework/port/status.h"
 
+// TODO: Parameterize FOV based on camera specs.
+constexpr float kWidthFieldOfView = 60;
+
 namespace mediapipe {
 namespace autoflip {
 
+::mediapipe::Status SceneCropper::ProcessKinematicPathSolver(
+    const SceneKeyFrameCropSummary& scene_summary,
+    const std::vector<int64>& scene_timestamps,
+    const std::vector<bool>& is_key_frames,
+    const std::vector<FocusPointFrame>& focus_point_frames,
+    const bool continue_last_scene, std::vector<cv::Mat>* all_xforms) {
+  // Appends one x-translation crop transform per scene frame to all_xforms.
+  // TODO: Fix upstream calculators to not crop beyond portrait target value.
+  /*
+  RET_CHECK(scene_summary.scene_frame_height() ==
+            scene_summary.crop_window_height())
+      << "Kinematic path solver does not yet support horizontal cropping.";
+      */
+  RET_CHECK(scene_timestamps.size() == focus_point_frames.size())
+      << "Kinematic path solver does not yet support downsampled detections.";
+  RET_CHECK(is_key_frames.size() == scene_timestamps.size())
+      << "Kinematic path solver requires one key frame flag per scene frame.";
+  if (!path_solver_initalized_ || !continue_last_scene) {
+    int min_location = scene_summary.crop_window_width() / 2;
+    int max_location = scene_summary.scene_frame_width() -
+                       scene_summary.crop_window_width() / 2;
+    kinematic_path_solver_ = std::make_unique<KinematicPathSolver>(
+        camera_motion_options_.kinematic_options(), min_location, max_location,
+        static_cast<float>(frame_width_) / kWidthFieldOfView);
+    path_solver_initalized_ = true;
+  }
+  int keyframe_counter = 0;  // Next focus_point_frames entry to consume.
+  for (size_t i = 0; i < is_key_frames.size(); ++i) {
+    if (is_key_frames[i]) {
+      RET_CHECK_EQ(focus_point_frames[keyframe_counter].point().size(), 2)
+          << "Expected focus_points to equal 2";
+      int observed_x = std::round(
+          focus_point_frames[keyframe_counter].point(0).norm_point_x() *
+          scene_summary.scene_frame_width());
+      MP_RETURN_IF_ERROR(kinematic_path_solver_->AddObservation(
+          observed_x, scene_timestamps[i]));
+      keyframe_counter++;
+    } else {
+      MP_RETURN_IF_ERROR(
+          kinematic_path_solver_->UpdatePrediction(scene_timestamps[i]));
+    }
+    int x_path;  // Crop window center x (px) for this frame.
+    MP_RETURN_IF_ERROR(kinematic_path_solver_->GetState(&x_path));
+    cv::Mat transform = cv::Mat::eye(2, 3, CV_32FC1);
+    transform.at<float>(0, 2) =
+        -(x_path - scene_summary.crop_window_width() / 2);
+    all_xforms->push_back(transform);
+  }
+  return ::mediapipe::OkStatus();
+}
+
 ::mediapipe::Status SceneCropper::CropFrames(
-    const SceneKeyFrameCropSummary& scene_summary, const int num_scene_frames,
+    const SceneKeyFrameCropSummary& scene_summary,
+    const std::vector<int64>& scene_timestamps,
+    const std::vector<bool>& is_key_frames,
     const std::vector<cv::Mat>& scene_frames_or_empty,
     const std::vector<FocusPointFrame>& focus_point_frames,
     const std::vector<FocusPointFrame>& prior_focus_point_frames,
     int top_static_border_size, int bottom_static_border_size,
-    std::vector<cv::Rect>* crop_from_location,
-    std::vector<cv::Mat>* cropped_frames) const {
+    const bool continue_last_scene, std::vector<cv::Rect>* crop_from_location,
+    std::vector<cv::Mat>* cropped_frames) {
+  const int num_scene_frames = scene_timestamps.size();
   RET_CHECK_GT(num_scene_frames, 0) << "No scene frames.";
   RET_CHECK_EQ(focus_point_frames.size(), num_scene_frames)
       << "Wrong size of FocusPointFrames.";
@@ -46,26 +105,50 @@ namespace autoflip {
   RET_CHECK_LE(crop_height, frame_height)
       << "Crop height exceeds frame height.";
 
+  RET_CHECK(camera_motion_options_.has_polynomial_path_solver() ||
+            camera_motion_options_.has_kinematic_options())
+      << "No camera motion model selected.";
+
   // Computes transforms.
-  std::vector<cv::Mat> all_xforms;
 
-  PolynomialRegressionPathSolver solver;
-  RET_CHECK_OK(solver.ComputeCameraPath(
-      focus_point_frames, prior_focus_point_frames, frame_width, frame_height,
-      crop_width, crop_height, &all_xforms));
+  std::vector<cv::Mat> scene_frame_xforms;
+  int num_prior = 0;
+  if (camera_motion_options_.has_polynomial_path_solver()) {
+    num_prior = prior_focus_point_frames.size();
+    std::vector<cv::Mat> all_xforms;
+    PolynomialRegressionPathSolver solver;
+    RET_CHECK_OK(solver.ComputeCameraPath(
+        focus_point_frames, prior_focus_point_frames, frame_width, frame_height,
+        crop_width, crop_height, &all_xforms));
 
-  const int num_prior = prior_focus_point_frames.size();
-  std::vector<cv::Mat> scene_frame_xforms(all_xforms.begin() + num_prior,
-                                          all_xforms.end());
+    scene_frame_xforms =
+        std::vector<cv::Mat>(all_xforms.begin() + num_prior, all_xforms.end());
 
-  // Convert the matrix from center-aligned to upper-left aligned.
-  for (cv::Mat& xform : scene_frame_xforms) {
-    cv::Mat affine_opencv = cv::Mat::eye(2, 3, CV_32FC1);
-    affine_opencv.at<float>(0, 2) =
-        -(xform.at<float>(0, 2) + frame_width / 2 - crop_width / 2);
-    affine_opencv.at<float>(1, 2) =
-        -(xform.at<float>(1, 2) + frame_height / 2 - crop_height / 2);
-    xform = affine_opencv;
+    // Convert the matrix from center-aligned to upper-left aligned.
+    for (cv::Mat& xform : scene_frame_xforms) {
+      cv::Mat affine_opencv = cv::Mat::eye(2, 3, CV_32FC1);
+      affine_opencv.at<float>(0, 2) =
+          -(xform.at<float>(0, 2) + frame_width / 2 - crop_width / 2);
+      affine_opencv.at<float>(1, 2) =
+          -(xform.at<float>(1, 2) + frame_height / 2 - crop_height / 2);
+      xform = affine_opencv;
+    }
+  } else if (camera_motion_options_.has_kinematic_options()) {
+    num_prior = 0;
+    MP_RETURN_IF_ERROR(ProcessKinematicPathSolver(
+        scene_summary, scene_timestamps, is_key_frames, focus_point_frames,
+        continue_last_scene, &scene_frame_xforms));
+  }
+
+  // Store the "crop from" location on the input frame for use with an external
+  // renderer.
+  for (int i = 0; i < num_scene_frames; i++) {
+    const int left = -(scene_frame_xforms[i].at<float>(0, 2));
+    const int right = left + crop_width;
+    const int top = top_static_border_size;
+    const int bottom = frame_height_ - bottom_static_border_size;
+    crop_from_location->push_back(
+        cv::Rect(left, top, right - left, bottom - top));
   }
 
   // If no cropped_frames is passed in, return directly.
@@ -81,20 +164,6 @@ namespace autoflip {
     (*cropped_frames)[i] = cv::Mat::zeros(crop_height, crop_width,
                                           scene_frames_or_empty[i].type());
   }
-
-  // Store the "crop from" location on the input frame for use with an external
-  // renderer.
-  for (int i = 0; i < num_scene_frames; i++) {
-    const int left = scene_frame_xforms[i].at<float>(0, 2);
-    const int right = left + crop_width;
-    const int top = top_static_border_size;
-    const int bottom =
-        top_static_border_size +
-        (crop_height - top_static_border_size - bottom_static_border_size);
-    crop_from_location->push_back(
-        cv::Rect(left, top, right - left, bottom - top));
-  }
-
   return AffineRetarget(cv::Size(crop_width, crop_height),
                         scene_frames_or_empty, scene_frame_xforms,
                         cropped_frames);
diff --git a/mediapipe/examples/desktop/autoflip/quality/scene_cropper.h b/mediapipe/examples/desktop/autoflip/quality/scene_cropper.h
index 0235eb1b2..c99ae59e7 100644
--- a/mediapipe/examples/desktop/autoflip/quality/scene_cropper.h
+++ b/mediapipe/examples/desktop/autoflip/quality/scene_cropper.h
@@ -20,6 +20,7 @@
 
 #include "mediapipe/examples/desktop/autoflip/quality/cropping.pb.h"
 #include "mediapipe/examples/desktop/autoflip/quality/focus_point.pb.h"
+#include "mediapipe/examples/desktop/autoflip/quality/kinematic_path_solver.h"
 #include "mediapipe/framework/port/opencv_core_inc.h"
 #include "mediapipe/framework/port/ret_check.h"
 #include "mediapipe/framework/port/status.h"
@@ -45,7 +46,12 @@ namespace autoflip {
 //       prior_focus_point_frames, &cropped_frames));
 class SceneCropper {
  public:
-  SceneCropper() {}
+  SceneCropper(const CameraMotionOptions& camera_motion_options,
+               const int frame_width, const int frame_height)
+      : path_solver_initalized_(false),
+        camera_motion_options_(camera_motion_options),
+        frame_width_(frame_width),
+        frame_height_(frame_height) {}
   ~SceneCropper() {}
 
   // Computes transformation matrix given SceneKeyFrameCropSummary,
@@ -55,13 +61,29 @@ class SceneCropper {
   // |scene_frames_or_empty| isn't empty.
   // TODO: split this function into two separate functions.
   ::mediapipe::Status CropFrames(
-      const SceneKeyFrameCropSummary& scene_summary, const int num_scene_frames,
+      const SceneKeyFrameCropSummary& scene_summary,
+      const std::vector<int64>& scene_timestamps,
+      const std::vector<bool>& is_key_frames,
       const std::vector<cv::Mat>& scene_frames_or_empty,
       const std::vector<FocusPointFrame>& focus_point_frames,
       const std::vector<FocusPointFrame>& prior_focus_point_frames,
       int top_static_border_size, int bottom_static_border_size,
-      std::vector<cv::Rect>* all_scene_frame_xforms,
-      std::vector<cv::Mat>* cropped_frames) const;
+      const bool continue_last_scene, std::vector<cv::Rect>* crop_from_location,
+      std::vector<cv::Mat>* cropped_frames);
+
+  ::mediapipe::Status ProcessKinematicPathSolver(
+      const SceneKeyFrameCropSummary& scene_summary,
+      const std::vector<int64>& scene_timestamps,
+      const std::vector<bool>& is_key_frames,
+      const std::vector<FocusPointFrame>& focus_point_frames,
+      const bool continue_last_scene, std::vector<cv::Mat>* all_xforms);
+
+ private:
+  bool path_solver_initalized_;
+  std::unique_ptr<KinematicPathSolver> kinematic_path_solver_;
+  CameraMotionOptions camera_motion_options_;
+  int frame_width_;
+  int frame_height_;
 };
 
 }  // namespace autoflip
diff --git a/mediapipe/examples/desktop/autoflip/quality/scene_cropper_test.cc b/mediapipe/examples/desktop/autoflip/quality/scene_cropper_test.cc
index 6c7dc3e41..e0e4f9d15 100644
--- a/mediapipe/examples/desktop/autoflip/quality/scene_cropper_test.cc
+++ b/mediapipe/examples/desktop/autoflip/quality/scene_cropper_test.cc
@@ -71,30 +71,53 @@ std::vector<FocusPointFrame> GetDefaultFocusPointFrames() {
   return GetFocusPointFrames(kNumSceneFrames);
 }
 
+// Returns |num_frames| timestamps: 0, 100000, 200000, ... (step of 100000).
+std::vector<int64> GetTimestamps(const int num_frames) {
+  std::vector<int64> result;
+  for (int frame = 0; frame < num_frames; ++frame)
+    result.push_back(frame * 100000);
+  return result;
+}
+
+// Returns |num_frames| flags, every one of them false. A non-positive
+// |num_frames| yields an empty vector.
+std::vector<bool> GetIsKeyframe(const int num_frames) {
+  std::vector<bool> flags;
+  if (num_frames > 0) flags.assign(num_frames, false);
+  return flags;
+}
+
 // Checks that CropFrames checks that scene frames size is positive.
 TEST(SceneCropperTest, CropFramesChecksSceneFramesSize) {
-  SceneCropper scene_cropper;
+  CameraMotionOptions options;
+  options.mutable_polynomial_path_solver()->set_prior_frame_buffer_size(30);
+  SceneCropper scene_cropper(options, kSceneWidth, kSceneHeight);
   std::vector<cv::Mat> scene_frames(0);
   std::vector<cv::Mat> cropped_frames;
   std::vector<cv::Rect> crop_from_locations;
   const auto status = scene_cropper.CropFrames(
-      GetDefaultSceneKeyFrameCropSummary(), scene_frames.size(), scene_frames,
-      GetDefaultFocusPointFrames(), GetFocusPointFrames(0), 0, 0,
+      GetDefaultSceneKeyFrameCropSummary(), GetTimestamps(scene_frames.size()),
+      GetIsKeyframe(scene_frames.size()), scene_frames,
+      GetDefaultFocusPointFrames(), GetFocusPointFrames(0), 0, 0, false,
       &crop_from_locations, &cropped_frames);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(), HasSubstr("No scene frames."));
 }
 
 // Checks that CropFrames checks that FocusPointFrames has the right size.
+
 TEST(SceneCropperTest, CropFramesChecksFocusPointFramesSize) {
-  SceneCropper scene_cropper;
+  CameraMotionOptions options;
+  options.mutable_polynomial_path_solver()->set_prior_frame_buffer_size(30);
+  SceneCropper scene_cropper(options, kSceneWidth, kSceneHeight);
   std::vector<cv::Mat> cropped_frames;
   std::vector<cv::Rect> crop_from_locations;
   const auto& scene_frames = GetDefaultSceneFrames();
   const auto status = scene_cropper.CropFrames(
-      GetDefaultSceneKeyFrameCropSummary(), scene_frames.size(), scene_frames,
+      GetDefaultSceneKeyFrameCropSummary(), GetTimestamps(kNumSceneFrames),
+      GetIsKeyframe(kNumSceneFrames), scene_frames,
       GetFocusPointFrames(kNumSceneFrames - 1), GetFocusPointFrames(0), 0, 0,
-      &crop_from_locations, &cropped_frames);
+      false, &crop_from_locations, &cropped_frames);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(), HasSubstr("Wrong size of FocusPointFrames"));
 }
@@ -103,13 +126,16 @@ TEST(SceneCropperTest, CropFramesChecksFocusPointFramesSize) {
 TEST(SceneCropperTest, CropFramesChecksCropSizePositive) {
   auto scene_summary = GetDefaultSceneKeyFrameCropSummary();
   scene_summary.set_crop_window_width(-1);
-  SceneCropper scene_cropper;
+  CameraMotionOptions options;
+  options.mutable_polynomial_path_solver()->set_prior_frame_buffer_size(30);
+  SceneCropper scene_cropper(options, kSceneWidth, kSceneHeight);
   std::vector<cv::Mat> cropped_frames;
   std::vector<cv::Rect> crop_from_locations;
   const auto& scene_frames = GetDefaultSceneFrames();
   const auto status = scene_cropper.CropFrames(
-      scene_summary, scene_frames.size(), scene_frames,
-      GetDefaultFocusPointFrames(), GetFocusPointFrames(0), 0, 0,
+      scene_summary, GetTimestamps(kNumSceneFrames),
+      GetIsKeyframe(kNumSceneFrames), scene_frames,
+      GetDefaultFocusPointFrames(), GetFocusPointFrames(0), 0, 0, false,
       &crop_from_locations, &cropped_frames);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(), HasSubstr("Crop width is non-positive."));
@@ -119,13 +145,16 @@ TEST(SceneCropperTest, CropFramesChecksCropSizePositive) {
 TEST(SceneCropperTest, InitializesRetargeterChecksCropSizeNotExceedFrameSize) {
   auto scene_summary = GetDefaultSceneKeyFrameCropSummary();
   scene_summary.set_crop_window_height(kSceneHeight + 1);
-  SceneCropper scene_cropper;
+  CameraMotionOptions options;
+  options.mutable_polynomial_path_solver()->set_prior_frame_buffer_size(30);
+  SceneCropper scene_cropper(options, kSceneWidth, kSceneHeight);
   std::vector<cv::Mat> cropped_frames;
   std::vector<cv::Rect> crop_from_locations;
   const auto& scene_frames = GetDefaultSceneFrames();
   const auto status = scene_cropper.CropFrames(
-      scene_summary, scene_frames.size(), scene_frames,
-      GetDefaultFocusPointFrames(), GetFocusPointFrames(0), 0, 0,
+      scene_summary, GetTimestamps(kNumSceneFrames),
+      GetIsKeyframe(kNumSceneFrames), scene_frames,
+      GetDefaultFocusPointFrames(), GetFocusPointFrames(0), 0, 0, false,
       &crop_from_locations, &cropped_frames);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(),
@@ -134,13 +163,16 @@ TEST(SceneCropperTest, InitializesRetargeterChecksCropSizeNotExceedFrameSize) {
 
 // Checks that CropFrames works when there are not any prior FocusPointFrames.
 TEST(SceneCropperTest, CropFramesWorksWithoutPriorFocusPointFrames) {
-  SceneCropper scene_cropper;
+  CameraMotionOptions options;
+  options.mutable_polynomial_path_solver()->set_prior_frame_buffer_size(30);
+  SceneCropper scene_cropper(options, kSceneWidth, kSceneHeight);
   std::vector<cv::Mat> cropped_frames;
   std::vector<cv::Rect> crop_from_locations;
   const auto& scene_frames = GetDefaultSceneFrames();
   MP_ASSERT_OK(scene_cropper.CropFrames(
-      GetDefaultSceneKeyFrameCropSummary(), scene_frames.size(), scene_frames,
-      GetDefaultFocusPointFrames(), GetFocusPointFrames(0), 0, 0,
+      GetDefaultSceneKeyFrameCropSummary(), GetTimestamps(kNumSceneFrames),
+      GetIsKeyframe(kNumSceneFrames), scene_frames,
+      GetDefaultFocusPointFrames(), GetFocusPointFrames(0), 0, 0, false,
       &crop_from_locations, &cropped_frames));
   ASSERT_EQ(cropped_frames.size(), kNumSceneFrames);
   for (int i = 0; i < kNumSceneFrames; ++i) {
@@ -151,13 +183,16 @@ TEST(SceneCropperTest, CropFramesWorksWithoutPriorFocusPointFrames) {
 
 // Checks that CropFrames works when there are prior FocusPointFrames.
 TEST(SceneCropperTest, CropFramesWorksWithPriorFocusPointFrames) {
-  SceneCropper scene_cropper;
+  CameraMotionOptions options;
+  options.mutable_polynomial_path_solver()->set_prior_frame_buffer_size(30);
+  SceneCropper scene_cropper(options, kSceneWidth, kSceneHeight);
   std::vector<cv::Mat> cropped_frames;
   std::vector<cv::Rect> crop_from_locations;
   const auto& scene_frames = GetDefaultSceneFrames();
   MP_EXPECT_OK(scene_cropper.CropFrames(
-      GetDefaultSceneKeyFrameCropSummary(), scene_frames.size(), scene_frames,
-      GetDefaultFocusPointFrames(), GetFocusPointFrames(3), 0, 0,
+      GetDefaultSceneKeyFrameCropSummary(), GetTimestamps(scene_frames.size()),
+      GetIsKeyframe(scene_frames.size()), scene_frames,
+      GetDefaultFocusPointFrames(), GetFocusPointFrames(3), 0, 0, false,
       &crop_from_locations, &cropped_frames));
   EXPECT_EQ(cropped_frames.size(), kNumSceneFrames);
   for (int i = 0; i < kNumSceneFrames; ++i) {
diff --git a/mediapipe/examples/desktop/autoflip/quality/scene_cropping_viz.cc b/mediapipe/examples/desktop/autoflip/quality/scene_cropping_viz.cc
index 974ebad77..e2be36c08 100644
--- a/mediapipe/examples/desktop/autoflip/quality/scene_cropping_viz.cc
+++ b/mediapipe/examples/desktop/autoflip/quality/scene_cropping_viz.cc
@@ -133,6 +133,42 @@ const cv::Scalar kWhite = cv::Scalar(255.0, 255.0, 255.0);  // others
   return ::mediapipe::OkStatus();
 }
 
+namespace {
+// Limits |rect| to a max_width x max_height frame. The origin is clamped into
+// the frame (the size is not reduced by that shift); the size is then cut to
+// what fits and floored at 0, so the result is always usable as a Mat ROI.
+cv::Rect LimitBounds(const cv::Rect& rect, const int max_width,
+                     const int max_height) {
+  const int x = rect.x < 0 ? 0 : (rect.x > max_width ? max_width : rect.x);
+  const int y = rect.y < 0 ? 0 : (rect.y > max_height ? max_height : rect.y);
+  const int w = rect.width < max_width - x ? rect.width : max_width - x;
+  const int h = rect.height < max_height - y ? rect.height : max_height - y;
+  return cv::Rect(x, y, w < 0 ? 0 : w, h < 0 ? 0 : h);
+}
+}  // namespace
+
+// Blends each frame with black by |overlay_opacity|, except its crop window.
+::mediapipe::Status DrawDetectionAndFramingWindow(
+    const std::vector<cv::Mat>& org_scene_frames,
+    const std::vector<cv::Rect>& crop_from_locations,
+    const ImageFormat::Format image_format, const float overlay_opacity,
+    std::vector<std::unique_ptr<ImageFrame>>* viz_frames) {
+  int index = 0;
+  for (const cv::Mat& input : org_scene_frames) {
+    const cv::Rect window =
+        LimitBounds(crop_from_locations[index++], input.cols, input.rows);
+    auto output = absl::make_unique<ImageFrame>(image_format, input.cols,
+                                                input.rows);
+    cv::Mat canvas = formats::MatView(output.get());
+    input.copyTo(canvas);
+    cv::addWeighted(cv::Mat::zeros(canvas.size(), canvas.type()),
+                    overlay_opacity, canvas, 1 - overlay_opacity, 0, canvas);
+    input(window).copyTo(canvas(window));
+    viz_frames->push_back(std::move(output));
+  }
+  return ::mediapipe::OkStatus();
+}
+
 ::mediapipe::Status DrawFocusPointAndCropWindow(
     const std::vector<cv::Mat>& scene_frames,
     const std::vector<FocusPointFrame>& focus_point_frames,
diff --git a/mediapipe/examples/desktop/autoflip/quality/scene_cropping_viz.h b/mediapipe/examples/desktop/autoflip/quality/scene_cropping_viz.h
index 464b4e4c9..e951f2df7 100644
--- a/mediapipe/examples/desktop/autoflip/quality/scene_cropping_viz.h
+++ b/mediapipe/examples/desktop/autoflip/quality/scene_cropping_viz.h
@@ -55,6 +55,14 @@ namespace autoflip {
     const mediapipe::ImageFormat::Format image_format,
     std::vector<std::unique_ptr<ImageFrame>>* viz_frames);
 
+// Draws the final smoothed path of the camera retargeter by darkening the
+// removed areas.
+::mediapipe::Status DrawDetectionAndFramingWindow(
+    const std::vector<cv::Mat>& org_scene_frames,
+    const std::vector<cv::Rect>& crop_from_locations,
+    const ImageFormat::Format image_format, const float overlay_opacity,
+    std::vector<std::unique_ptr<ImageFrame>>* viz_frames);
+
 }  // namespace autoflip
 }  // namespace mediapipe
 
diff --git a/mediapipe/examples/desktop/autoflip/quality/utils.cc b/mediapipe/examples/desktop/autoflip/quality/utils.cc
index d68ec1d92..68db4aa11 100644
--- a/mediapipe/examples/desktop/autoflip/quality/utils.cc
+++ b/mediapipe/examples/desktop/autoflip/quality/utils.cc
@@ -203,7 +203,6 @@ void RectUnion(const Rect& rect_to_add, Rect* rect) {
 }
 
 ::mediapipe::Status AggregateKeyFrameResults(
-    const std::vector<KeyFrameInfo>& key_frame_infos,
     const KeyFrameCropOptions& key_frame_crop_options,
     const std::vector<KeyFrameCropResult>& key_frame_crop_results,
     const int scene_frame_width, const int scene_frame_height,
@@ -211,11 +210,7 @@ void RectUnion(const Rect& rect_to_add, Rect* rect) {
   RET_CHECK_NE(scene_summary, nullptr)
       << "Output SceneKeyFrameCropSummary is null.";
 
-  const int num_key_frames = key_frame_infos.size();
-  RET_CHECK_EQ(num_key_frames, key_frame_crop_results.size())
-      << "Inconsistent number of key frames:"
-      << " num_key_frames = " << num_key_frames
-      << " key_frame_crop_results.size() = " << key_frame_crop_results.size();
+  const int num_key_frames = key_frame_crop_results.size();
 
   RET_CHECK_GT(scene_frame_width, 0) << "Non-positive frame width.";
   RET_CHECK_GT(scene_frame_height, 0) << "Non-positive frame height.";
@@ -255,8 +250,8 @@ void RectUnion(const Rect& rect_to_add, Rect* rect) {
   std::unique_ptr<Rect> required_crop_region_union = nullptr;
   for (int i = 0; i < num_key_frames; ++i) {
     auto* key_frame_compact_info = scene_summary->add_key_frame_compact_infos();
-    key_frame_compact_info->set_timestamp_ms(key_frame_infos[i].timestamp_ms());
     const auto& result = key_frame_crop_results[i];
+    key_frame_compact_info->set_timestamp_ms(result.timestamp_ms());
     if (result.are_required_regions_covered_in_target_size()) {
       num_success_frames++;
     }
diff --git a/mediapipe/examples/desktop/autoflip/quality/utils.h b/mediapipe/examples/desktop/autoflip/quality/utils.h
index 4761077bc..ec1373ae4 100644
--- a/mediapipe/examples/desktop/autoflip/quality/utils.h
+++ b/mediapipe/examples/desktop/autoflip/quality/utils.h
@@ -54,7 +54,6 @@ namespace autoflip {
 // Aggregates information from KeyFrameInfos and KeyFrameCropResults into
 // SceneKeyFrameCropSummary.
 ::mediapipe::Status AggregateKeyFrameResults(
-    const std::vector<KeyFrameInfo>& key_frame_infos,
     const KeyFrameCropOptions& key_frame_crop_options,
     const std::vector<KeyFrameCropResult>& key_frame_crop_results,
     const int scene_frame_width, const int scene_frame_height,
diff --git a/mediapipe/examples/desktop/autoflip/quality/utils_test.cc b/mediapipe/examples/desktop/autoflip/quality/utils_test.cc
index 03d0d5354..b10e37855 100644
--- a/mediapipe/examples/desktop/autoflip/quality/utils_test.cc
+++ b/mediapipe/examples/desktop/autoflip/quality/utils_test.cc
@@ -113,16 +113,6 @@ void AddDetectionFromScoreAndIsRequired(const double score,
   detection->set_is_required(is_required);
 }
 
-// Returns default values for KeyFrameInfos. Populates timestamps using the
-// default spacing kKeyFrameTimestampDiff starting from 0.
-std::vector<KeyFrameInfo> GetDefaultKeyFrameInfos() {
-  std::vector<KeyFrameInfo> key_frame_infos(kNumKeyFrames);
-  for (int i = 0; i < kNumKeyFrames; ++i) {
-    key_frame_infos[i].set_timestamp_ms(kKeyFrameTimestampDiff * i);
-  }
-  return key_frame_infos;
-}
-
 // Returns default settings for KeyFrameCropOptions. Populates target size to be
 // the default target size.
 KeyFrameCropOptions GetDefaultKeyFrameCropOptions() {
@@ -148,6 +138,7 @@ std::vector<KeyFrameCropResult> GetDefaultKeyFrameCropResults() {
     *(key_frame_crop_results[i].mutable_required_region()) =
         MakeRect(10, 10, 20, 20);
     key_frame_crop_results[i].set_region_score(1.0);
+    key_frame_crop_results[i].set_timestamp_ms(kKeyFrameTimestampDiff * i);
   }
   return key_frame_crop_results;
 }
@@ -502,9 +493,8 @@ TEST(UtilTest, SetKeyFrameCropTargetSetsTargetSizeCorrectly) {
 // Checks that AggregateKeyFrameResults checks output pointer is not null.
 TEST(UtilTest, AggregateKeyFrameResultsChecksOutputNotNull) {
   const auto status = AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      GetDefaultKeyFrameCropResults(), kOriginalWidth, kOriginalHeight,
-      nullptr);
+      GetDefaultKeyFrameCropOptions(), GetDefaultKeyFrameCropResults(),
+      kOriginalWidth, kOriginalHeight, nullptr);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(),
               HasSubstr("Output SceneKeyFrameCropSummary is null."));
@@ -512,36 +502,20 @@ TEST(UtilTest, AggregateKeyFrameResultsChecksOutputNotNull) {
 
 // Checks that AggregateKeyFrameResults handles the case of no key frames.
 TEST(UtilTest, AggregateKeyFrameResultsHandlesNoKeyFrames) {
-  std::vector<KeyFrameInfo> key_frame_infos(0);
   std::vector<KeyFrameCropResult> key_frame_crop_results(0);
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      key_frame_infos, GetDefaultKeyFrameCropOptions(), key_frame_crop_results,
-      kOriginalWidth, kOriginalHeight, &scene_summary));
-}
-
-// Checks that AggregateKeyFrameResults checks that number of key frames is
-// consistent between KeyFrameInfos and KeyFrameCropResults.
-TEST(UtilTest, AggregateKeyFrameResultsChecksNumKeyFramesConsistent) {
-  std::vector<KeyFrameInfo> key_frame_infos(kNumKeyFrames);
-  std::vector<KeyFrameCropResult> key_frame_crop_results(kNumKeyFrames + 1);
-  SceneKeyFrameCropSummary scene_summary;
-
-  const auto status = AggregateKeyFrameResults(
-      key_frame_infos, GetDefaultKeyFrameCropOptions(), key_frame_crop_results,
-      kOriginalWidth, kOriginalHeight, &scene_summary);
-  EXPECT_FALSE(status.ok());
-  EXPECT_THAT(status.ToString(),
-              HasSubstr("Inconsistent number of key frames"));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
 }
 
 // Checks that AggregateKeyFrameResults checks that frame size is valid.
 TEST(UtilTest, AggregateKeyFrameResultsChecksFrameSizeValid) {
   SceneKeyFrameCropSummary scene_summary;
   const auto status = AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      GetDefaultKeyFrameCropResults(), kOriginalWidth, 0, &scene_summary);
+      GetDefaultKeyFrameCropOptions(), GetDefaultKeyFrameCropResults(),
+      kOriginalWidth, 0, &scene_summary);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(), HasSubstr("Non-positive frame height."));
 }
@@ -553,9 +527,8 @@ TEST(UtilTest, AggregateKeyFrameResultsChecksTargetSizeValid) {
   SceneKeyFrameCropSummary scene_summary;
 
   const auto status = AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), key_frame_crop_options,
-      GetDefaultKeyFrameCropResults(), kOriginalWidth, kOriginalHeight,
-      &scene_summary);
+      key_frame_crop_options, GetDefaultKeyFrameCropResults(), kOriginalWidth,
+      kOriginalHeight, &scene_summary);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(), HasSubstr("Non-positive target width."));
 }
@@ -568,9 +541,8 @@ TEST(UtilTest, AggregateKeyFrameResultsChecksTargetSizeNotExceedFrameSize) {
   SceneKeyFrameCropSummary scene_summary;
 
   const auto status = AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), key_frame_crop_options,
-      GetDefaultKeyFrameCropResults(), kOriginalWidth, kOriginalHeight,
-      &scene_summary);
+      key_frame_crop_options, GetDefaultKeyFrameCropResults(), kOriginalWidth,
+      kOriginalHeight, &scene_summary);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(),
               HasSubstr("Target width exceeds frame width."));
@@ -578,19 +550,19 @@ TEST(UtilTest, AggregateKeyFrameResultsChecksTargetSizeNotExceedFrameSize) {
 
 // Checks that AggregateKeyFrameResults packs KeyFrameCompactInfos.
 TEST(UtilTest, AggregateKeyFrameResultsPacksKeyFrameCompactInfos) {
-  const auto key_frame_infos = GetDefaultKeyFrameInfos();
   const auto key_frame_crop_results = GetDefaultKeyFrameCropResults();
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      key_frame_infos, GetDefaultKeyFrameCropOptions(), key_frame_crop_results,
-      kOriginalWidth, kOriginalHeight, &scene_summary));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
 
   EXPECT_EQ(scene_summary.num_key_frames(), kNumKeyFrames);
   EXPECT_EQ(scene_summary.key_frame_compact_infos_size(), kNumKeyFrames);
   for (int i = 0; i < kNumKeyFrames; ++i) {
     const auto& compact_info = scene_summary.key_frame_compact_infos(i);
-    EXPECT_EQ(compact_info.timestamp_ms(), key_frame_infos[i].timestamp_ms());
+    EXPECT_EQ(compact_info.timestamp_ms(),
+              key_frame_crop_results[i].timestamp_ms());
     const auto center = RectCenter(key_frame_crop_results[i].region());
     EXPECT_FLOAT_EQ(compact_info.center_x(), center.first);
     EXPECT_FLOAT_EQ(compact_info.center_y(), center.second);
@@ -602,7 +574,6 @@ TEST(UtilTest, AggregateKeyFrameResultsPacksKeyFrameCompactInfos) {
 // Checks that AggregateKeyFrameResults ensures the centered region of target
 // size fits in frame bound.
 TEST(UtilTest, AggregateKeyFrameResultsEnsuresCropRegionFitsInFrame) {
-  std::vector<KeyFrameInfo> key_frame_infos(1);
   std::vector<KeyFrameCropResult> key_frame_crop_results(1);
   auto* crop_region = key_frame_crop_results[0].mutable_region();
   crop_region->set_x(0);
@@ -611,9 +582,9 @@ TEST(UtilTest, AggregateKeyFrameResultsEnsuresCropRegionFitsInFrame) {
   crop_region->set_height(10);
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      key_frame_infos, GetDefaultKeyFrameCropOptions(), key_frame_crop_results,
-      kOriginalWidth, kOriginalHeight, &scene_summary));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
 
   EXPECT_EQ(scene_summary.crop_window_width(), kTargetWidth);
   EXPECT_EQ(scene_summary.crop_window_height(), kTargetHeight);
@@ -638,14 +609,13 @@ TEST(UtilTest, AggregateKeyFrameResultsEnsuresCropRegionFitsInFrame) {
 // frames with empty regions.
 TEST(UtilTest,
      AggregateKeyFrameResultsSetsMinusOneForKeyFramesWithEmptyRegions) {
-  std::vector<KeyFrameInfo> key_frame_infos(1);
   std::vector<KeyFrameCropResult> key_frame_crop_results(1);
   key_frame_crop_results[0].set_region_is_empty(true);
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      key_frame_infos, GetDefaultKeyFrameCropOptions(), key_frame_crop_results,
-      kOriginalWidth, kOriginalHeight, &scene_summary));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
 
   const auto& compact_info = scene_summary.key_frame_compact_infos(0);
   EXPECT_FLOAT_EQ(compact_info.center_x(), -1.0f);
@@ -661,8 +631,8 @@ TEST(UtilTest, AggregateKeyFrameResultsRejectsNegativeCenter) {
   SceneKeyFrameCropSummary scene_summary;
 
   const auto status = AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      key_frame_crop_results, kOriginalWidth, kOriginalHeight, &scene_summary);
+      GetDefaultKeyFrameCropOptions(), key_frame_crop_results, kOriginalWidth,
+      kOriginalHeight, &scene_summary);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(), HasSubstr("Negative vertical center."));
 }
@@ -674,8 +644,8 @@ TEST(UtilTest, AggregateKeyFrameResultsRejectsNegativeScore) {
   SceneKeyFrameCropSummary scene_summary;
 
   const auto status = AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      key_frame_crop_results, kOriginalWidth, kOriginalHeight, &scene_summary);
+      GetDefaultKeyFrameCropOptions(), key_frame_crop_results, kOriginalWidth,
+      kOriginalHeight, &scene_summary);
   EXPECT_FALSE(status.ok());
   EXPECT_THAT(status.ToString(), HasSubstr("Negative score."));
 }
@@ -693,9 +663,9 @@ TEST(UtilTest, AggregateKeyFrameResultsSetsCenterRanges) {
   }
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      key_frame_crop_results, kOriginalWidth, kOriginalHeight, &scene_summary));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
 
   EXPECT_FLOAT_EQ(scene_summary.key_frame_center_min_x(), 25.0f);
   EXPECT_FLOAT_EQ(scene_summary.key_frame_center_max_x(), 45.0f);
@@ -712,9 +682,9 @@ TEST(UtilTest, AggregateKeyFrameResultsSetsScoreRange) {
   }
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      key_frame_crop_results, kOriginalWidth, kOriginalHeight, &scene_summary));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
 
   EXPECT_FLOAT_EQ(scene_summary.key_frame_min_score(),
                   *std::min_element(scores.begin(), scores.end()));
@@ -727,9 +697,8 @@ TEST(UtilTest, AggregateKeyFrameResultsSetsScoreRange) {
 TEST(UtilTest, AggregateKeyFrameResultsSetsCropWindowSizeToTargetSize) {
   SceneKeyFrameCropSummary scene_summary;
   MP_EXPECT_OK(AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      GetDefaultKeyFrameCropResults(), kOriginalWidth, kOriginalHeight,
-      &scene_summary));
+      GetDefaultKeyFrameCropOptions(), GetDefaultKeyFrameCropResults(),
+      kOriginalWidth, kOriginalHeight, &scene_summary));
   EXPECT_EQ(scene_summary.crop_window_width(), kTargetWidth);
   EXPECT_EQ(scene_summary.crop_window_height(), kTargetHeight);
 }
@@ -741,9 +710,9 @@ TEST(UtilTest, AggregateKeyFrameResultsSetsCropWindowSizeExceedingTargetSize) {
   key_frame_crop_results[0].mutable_region()->set_width(kTargetWidth + 1);
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      key_frame_crop_results, kOriginalWidth, kOriginalHeight, &scene_summary));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
   EXPECT_EQ(scene_summary.crop_window_width(), kTargetWidth + 1);
   EXPECT_EQ(scene_summary.crop_window_height(), kTargetHeight);
 }
@@ -753,9 +722,8 @@ TEST(UtilTest, AggregateKeyFrameResultsSetsCropWindowSizeExceedingTargetSize) {
 TEST(UtilTest, AggregateKeyFrameResultsSetsHasSalientRegionTrue) {
   SceneKeyFrameCropSummary scene_summary;
   MP_EXPECT_OK(AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      GetDefaultKeyFrameCropResults(), kOriginalWidth, kOriginalHeight,
-      &scene_summary));
+      GetDefaultKeyFrameCropOptions(), GetDefaultKeyFrameCropResults(),
+      kOriginalWidth, kOriginalHeight, &scene_summary));
   EXPECT_TRUE(scene_summary.has_salient_region());
 }
 
@@ -768,9 +736,9 @@ TEST(UtilTest, AggregateKeyFrameResultsSetsHasSalientRegionFalse) {
   }
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      key_frame_crop_results, kOriginalWidth, kOriginalHeight, &scene_summary));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
   EXPECT_FALSE(scene_summary.has_salient_region());
 }
 
@@ -779,9 +747,8 @@ TEST(UtilTest, AggregateKeyFrameResultsSetsHasSalientRegionFalse) {
 TEST(UtilTest, AggregateKeyFrameResultsSetsHasRequiredSalientRegionTrue) {
   SceneKeyFrameCropSummary scene_summary;
   MP_EXPECT_OK(AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      GetDefaultKeyFrameCropResults(), kOriginalWidth, kOriginalHeight,
-      &scene_summary));
+      GetDefaultKeyFrameCropOptions(), GetDefaultKeyFrameCropResults(),
+      kOriginalWidth, kOriginalHeight, &scene_summary));
   EXPECT_TRUE(scene_summary.has_required_salient_region());
 }
 
@@ -794,9 +761,9 @@ TEST(UtilTest, AggregateKeyFrameResultsSetsHasRequiredSalientRegionFalse) {
   }
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      key_frame_crop_results, kOriginalWidth, kOriginalHeight, &scene_summary));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
   EXPECT_FALSE(scene_summary.has_required_salient_region());
 }
 
@@ -810,9 +777,9 @@ TEST(UtilTest, AggregateKeyFrameResultsSetsKeyFrameRequiredCropRegionUnion) {
   }
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      key_frame_crop_results, kOriginalWidth, kOriginalHeight, &scene_summary));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
   const auto& required_crop_region_union =
       scene_summary.key_frame_required_crop_region_union();
   EXPECT_EQ(required_crop_region_union.x(), 0);
@@ -832,9 +799,9 @@ TEST(UtilTest, AggregateKeyFrameResultsSetsFrameSuccessRate) {
   }
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      key_frame_crop_results, kOriginalWidth, kOriginalHeight, &scene_summary));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
   EXPECT_FLOAT_EQ(scene_summary.frame_success_rate(), success_rate);
 }
 
@@ -853,9 +820,9 @@ TEST(UtilTest, AggregateKeyFrameResultsSetsMotion) {
   }
   SceneKeyFrameCropSummary scene_summary;
 
-  MP_EXPECT_OK(AggregateKeyFrameResults(
-      GetDefaultKeyFrameInfos(), GetDefaultKeyFrameCropOptions(),
-      key_frame_crop_results, kOriginalWidth, kOriginalHeight, &scene_summary));
+  MP_EXPECT_OK(AggregateKeyFrameResults(GetDefaultKeyFrameCropOptions(),
+                                        key_frame_crop_results, kOriginalWidth,
+                                        kOriginalHeight, &scene_summary));
   EXPECT_FLOAT_EQ(scene_summary.horizontal_motion_amount(), motion_x);
   EXPECT_FLOAT_EQ(scene_summary.vertical_motion_amount(), motion_y);
 }
diff --git a/mediapipe/examples/desktop/autoflip/subgraph/BUILD b/mediapipe/examples/desktop/autoflip/subgraph/BUILD
index 5c128e90b..4fea2fb92 100644
--- a/mediapipe/examples/desktop/autoflip/subgraph/BUILD
+++ b/mediapipe/examples/desktop/autoflip/subgraph/BUILD
@@ -28,6 +28,23 @@ mediapipe_simple_subgraph(
     ],
 )
 
+mediapipe_simple_subgraph(
+    name = "autoflip_front_face_detection_subgraph",
+    graph = "front_face_detection_subgraph.pbtxt",
+    register_as = "AutoFlipFrontFaceDetectionSubgraph",
+    visibility = ["//visibility:public"],
+    deps = [
+        "//mediapipe/calculators/image:image_transformation_calculator",
+        "//mediapipe/calculators/tflite:ssd_anchors_calculator",
+        "//mediapipe/calculators/tflite:tflite_converter_calculator",
+        "//mediapipe/calculators/tflite:tflite_inference_calculator",
+        "//mediapipe/calculators/tflite:tflite_tensors_to_detections_calculator",
+        "//mediapipe/calculators/util:detection_label_id_to_text_calculator",
+        "//mediapipe/calculators/util:detection_letterbox_removal_calculator",
+        "//mediapipe/calculators/util:non_max_suppression_calculator",
+    ],
+)
+
 mediapipe_simple_subgraph(
     name = "autoflip_object_detection_subgraph",
     graph = "autoflip_object_detection_subgraph.pbtxt",
diff --git a/mediapipe/examples/desktop/autoflip/subgraph/front_face_detection_subgraph.pbtxt b/mediapipe/examples/desktop/autoflip/subgraph/front_face_detection_subgraph.pbtxt
new file mode 100644
index 000000000..18d336c80
--- /dev/null
+++ b/mediapipe/examples/desktop/autoflip/subgraph/front_face_detection_subgraph.pbtxt
@@ -0,0 +1,135 @@
+# MediaPipe graph that performs face detection with TensorFlow Lite on CPU. Model paths are set up for web use.
+# TODO: parameterize input paths to support desktop use.
+input_stream: "VIDEO:input_video"
+output_stream: "DETECTIONS:output_detections"
+
+# Transforms the input image on CPU to a 128x128 image. To scale the input
+# image, the scale_mode option is set to FIT to preserve the aspect ratio,
+# resulting in potential letterboxing in the transformed image.
+node: {
+  calculator: "ImageTransformationCalculator"
+  input_stream: "IMAGE:input_video"
+  output_stream: "IMAGE:transformed_input_video_cpu"
+  output_stream: "LETTERBOX_PADDING:letterbox_padding"
+  options: {
+    [mediapipe.ImageTransformationCalculatorOptions.ext] {
+      output_width: 128
+      output_height: 128
+      scale_mode: FIT
+    }
+  }
+}
+
+# Converts the transformed input image on CPU into an image tensor stored as a
+# TfLiteTensor.
+node {
+  calculator: "TfLiteConverterCalculator"
+  input_stream: "IMAGE:transformed_input_video_cpu"
+  output_stream: "TENSORS:image_tensor"
+}
+
+# Runs a TensorFlow Lite model on CPU that takes an image tensor and outputs a
+# vector of tensors representing, for instance, detection boxes/keypoints and
+# scores.
+node {
+  calculator: "TfLiteInferenceCalculator"
+  input_stream: "TENSORS:image_tensor"
+  output_stream: "TENSORS:detection_tensors"
+  options: {
+    [mediapipe.TfLiteInferenceCalculatorOptions.ext] {
+      model_path: "face_detection_front.tflite"
+    }
+  }
+}
+
+# Generates a single side packet containing a vector of SSD anchors based on
+# the specification in the options.
+node {
+  calculator: "SsdAnchorsCalculator"
+  output_side_packet: "anchors"
+  options: {
+    [mediapipe.SsdAnchorsCalculatorOptions.ext] {
+      num_layers: 4
+      min_scale: 0.1484375
+      max_scale: 0.75
+      input_size_height: 128
+      input_size_width: 128
+      anchor_offset_x: 0.5
+      anchor_offset_y: 0.5
+      strides: 8
+      strides: 16
+      strides: 16
+      strides: 16
+      aspect_ratios: 1.0
+      fixed_anchor_size: true
+    }
+  }
+}
+
+# Decodes the detection tensors generated by the TensorFlow Lite model, based on
+# the SSD anchors and the specification in the options, into a vector of
+# detections. Each detection describes a detected object.
+node {
+  calculator: "TfLiteTensorsToDetectionsCalculator"
+  input_stream: "TENSORS:detection_tensors"
+  input_side_packet: "ANCHORS:anchors"
+  output_stream: "DETECTIONS:detections"
+  options: {
+    [mediapipe.TfLiteTensorsToDetectionsCalculatorOptions.ext] {
+      num_classes: 1
+      num_boxes: 896
+      num_coords: 16
+      box_coord_offset: 0
+      keypoint_coord_offset: 4
+      num_keypoints: 6
+      num_values_per_keypoint: 2
+      sigmoid_score: true
+      score_clipping_thresh: 100.0
+      reverse_output_order: true
+      x_scale: 128.0
+      y_scale: 128.0
+      h_scale: 128.0
+      w_scale: 128.0
+      min_score_thresh: 0.75
+    }
+  }
+}
+
+# Performs non-max suppression to remove excessive detections.
+node {
+  calculator: "NonMaxSuppressionCalculator"
+  input_stream: "detections"
+  output_stream: "filtered_detections"
+  options: {
+    [mediapipe.NonMaxSuppressionCalculatorOptions.ext] {
+      min_suppression_threshold: 0.3
+      overlap_type: INTERSECTION_OVER_UNION
+      algorithm: WEIGHTED
+      return_empty_detections: true
+    }
+  }
+}
+
+# Maps detection label IDs to the corresponding label text ("Face"). The label
+# map is provided in the label_map_path option.
+node {
+  calculator: "DetectionLabelIdToTextCalculator"
+  input_stream: "filtered_detections"
+  output_stream: "labeled_detections"
+  options: {
+    [mediapipe.DetectionLabelIdToTextCalculatorOptions.ext] {
+      label_map_path: "face_detection_front_labelmap.txt"
+    }
+  }
+}
+
+# Adjusts detection locations (already normalized to [0.f, 1.f]) on the
+# letterboxed image (after image transformation with the FIT scale mode) to the
+# corresponding locations on the same image with the letterbox removed (the
+# input image to the graph before image transformation).
+node {
+  calculator: "DetectionLetterboxRemovalCalculator"
+  input_stream: "DETECTIONS:labeled_detections"
+  input_stream: "LETTERBOX_PADDING:letterbox_padding"
+  output_stream: "DETECTIONS:output_detections"
+}
diff --git a/mediapipe/framework/calculator_graph.cc b/mediapipe/framework/calculator_graph.cc
index d5eae9ef3..3b48d617d 100644
--- a/mediapipe/framework/calculator_graph.cc
+++ b/mediapipe/framework/calculator_graph.cc
@@ -760,10 +760,6 @@ CalculatorGraph::PrepareGpu(const std::map<std::string, Packet>& side_packets) {
 }
 
 ::mediapipe::Status CalculatorGraph::WaitUntilIdle() {
-  if (has_sources_) {
-    return ::mediapipe::InvalidArgumentErrorBuilder(MEDIAPIPE_LOC)
-           << "WaitUntilIdle called on a graph with source nodes.";
-  }
   MP_RETURN_IF_ERROR(scheduler_.WaitUntilIdle());
   VLOG(2) << "Scheduler idle.";
   ::mediapipe::Status status = ::mediapipe::OkStatus();
diff --git a/mediapipe/framework/calculator_graph_test.cc b/mediapipe/framework/calculator_graph_test.cc
index b25752b4e..1adf2c0ac 100644
--- a/mediapipe/framework/calculator_graph_test.cc
+++ b/mediapipe/framework/calculator_graph_test.cc
@@ -65,6 +65,9 @@ namespace mediapipe {
 
 namespace {
 
+using testing::ElementsAre;
+using testing::HasSubstr;
+
 // Pass packets through. Note that it calls SetOffset() in Process()
 // instead of Open().
 class SetOffsetInProcessCalculator : public CalculatorBase {
diff --git a/mediapipe/framework/deps/BUILD b/mediapipe/framework/deps/BUILD
index 918799813..1573fa1f7 100644
--- a/mediapipe/framework/deps/BUILD
+++ b/mediapipe/framework/deps/BUILD
@@ -272,6 +272,14 @@ cc_library(
     ],
 )
 
+cc_library(
+    name = "re2",
+    hdrs = [
+        "re2.h",
+    ],
+    visibility = ["//visibility:public"],
+)
+
 cc_library(
     name = "status_matchers",
     testonly = 1,
@@ -280,7 +288,7 @@ cc_library(
     visibility = ["//mediapipe/framework/port:__pkg__"],
     deps = [
         ":status",
-        "@com_google_googletest//:gtest_main",
+        "@com_google_googletest//:gtest",
     ],
 )
 
diff --git a/mediapipe/framework/deps/re2.h b/mediapipe/framework/deps/re2.h
new file mode 100644
index 000000000..61f7985ee
--- /dev/null
+++ b/mediapipe/framework/deps/re2.h
@@ -0,0 +1,80 @@
+// Copyright 2019 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef MEDIAPIPE_FRAMEWORK_DEPS_RE2_H_
+#define MEDIAPIPE_FRAMEWORK_DEPS_RE2_H_
+
+#include <iterator>
+#include <mutex>  // NOLINT
+#include <regex>  // NOLINT
+#include <string>
+
+namespace mediapipe {
+
+// Implements a subset of the RE2 interface on top of std::regex. Patterns and
+// rewrite strings follow std::regex (ECMAScript) syntax, not RE2 syntax.
+class RE2 {
+ public:
+  // Compiles |pattern| with the default std::regex grammar. Implicit, so a
+  // pattern string converts to an RE2 at call sites.
+  RE2(const std::string& pattern) : std_regex_(pattern) {}  // NOLINT
+
+  // Returns true if |re| matches the whole of |text|.
+  static bool FullMatch(const std::string& text, const RE2& re) {
+    return std::regex_match(text, re.std_regex_);
+  }
+
+  // Returns true if |re| matches any substring of |text|.
+  static bool PartialMatch(const std::string& text, const RE2& re) {
+    return std::regex_search(text, re.std_regex_);
+  }
+
+  // Replaces every non-overlapping match of |re| in |*text| with |rewrite| and
+  // returns the number of replacements made.
+  static int GlobalReplace(std::string* text, const RE2& re,
+                           const std::string& rewrite) {
+    // Count the matches before rewriting; std::regex_replace walks the same
+    // std::sregex_iterator sequence but does not report how many it found.
+    const auto num_matches = std::distance(
+        std::sregex_iterator(text->begin(), text->end(), re.std_regex_),
+        std::sregex_iterator());
+    *text = std::regex_replace(*text, re.std_regex_, rewrite);
+    return static_cast<int>(num_matches);
+  }
+
+ private:
+  std::regex std_regex_;
+};
+
+// Implements LazyRE2 using std::call_once: the RE2 is compiled on first use.
+// Has no constructors; presumably meant to be aggregate-initialized from a
+// pattern as with the real LazyRE2, e.g. static LazyRE2 kRe = {"pattern"};
+class LazyRE2 {
+ public:
+  // Returns the RE2 for pattern_, constructing it on the first call. The
+  // instance is never deleted.
+  RE2& operator*() const {
+    std::call_once(once_, [&]() { ptr_ = new RE2(pattern_); });
+    return *ptr_;
+  }
+  RE2* operator->() const { return &**this; }
+
+  const char* pattern_;
+  mutable RE2* ptr_;
+  mutable std::once_flag once_;
+};
+
+}  // namespace mediapipe
+
+#endif  // MEDIAPIPE_FRAMEWORK_DEPS_RE2_H_
diff --git a/mediapipe/framework/deps/status_matchers.h b/mediapipe/framework/deps/status_matchers.h
index 179e321e7..5e7f34272 100644
--- a/mediapipe/framework/deps/status_matchers.h
+++ b/mediapipe/framework/deps/status_matchers.h
@@ -15,10 +15,44 @@
 #ifndef MEDIAPIPE_DEPS_STATUS_MATCHERS_H_
 #define MEDIAPIPE_DEPS_STATUS_MATCHERS_H_
 
+#include "gmock/gmock.h"
 #include "gtest/gtest.h"
 #include "mediapipe/framework/deps/status.h"
 
-#define MP_EXPECT_OK(statement) EXPECT_TRUE((statement).ok())
-#define MP_ASSERT_OK(statement) ASSERT_TRUE((statement).ok())
+namespace mediapipe {
+
+// Monomorphic implementation of matcher IsOk() for a given type T.
+// T can be Status, StatusOr<>, or a reference to either of them.
+template <typename T>
+class MonoIsOkMatcherImpl : public testing::MatcherInterface<T> {
+ public:
+  void DescribeTo(std::ostream* os) const override { *os << "is OK"; }
+  void DescribeNegationTo(std::ostream* os) const override {
+    *os << "is not OK";
+  }
+  bool MatchAndExplain(T actual_value,
+                       testing::MatchResultListener*) const override {
+    return actual_value.ok();
+  }
+};
+
+// Implements IsOk() as a polymorphic matcher.
+class IsOkMatcher {
+ public:
+  template <typename T>
+  operator testing::Matcher<T>() const {  // NOLINT
+    return testing::Matcher<T>(new MonoIsOkMatcherImpl<T>());
+  }
+};
+
+// Returns a gMock matcher that matches a Status or StatusOr<> which is OK.
+inline IsOkMatcher IsOk() { return IsOkMatcher(); }
+
+}  // namespace mediapipe
+
+// Macros for testing the results of functions that return mediapipe::Status or
+// mediapipe::StatusOr<T> (for any type T).
+#define MP_EXPECT_OK(expression) EXPECT_THAT(expression, mediapipe::IsOk())
+#define MP_ASSERT_OK(expression) ASSERT_THAT(expression, mediapipe::IsOk())
 
 #endif  // MEDIAPIPE_DEPS_STATUS_MATCHERS_H_
diff --git a/mediapipe/framework/encode_binary_proto.bzl b/mediapipe/framework/encode_binary_proto.bzl
index 030897bce..1ed64a954 100644
--- a/mediapipe/framework/encode_binary_proto.bzl
+++ b/mediapipe/framework/encode_binary_proto.bzl
@@ -141,7 +141,8 @@ def _generate_proto_descriptor_set_impl(ctx):
     # order of gendir before ., is needed for the proto compiler to resolve
     # import statements that reference proto files produced by a genrule.
     ctx.actions.run(
-        inputs = all_protos.to_list() + [ctx.executable._proto_compiler],
+        inputs = all_protos,
+        tools = [ctx.executable._proto_compiler],
         outputs = [descriptor],
         executable = ctx.executable._proto_compiler,
         arguments = [
diff --git a/mediapipe/framework/formats/landmark.proto b/mediapipe/framework/formats/landmark.proto
index 708a34000..bc3821609 100644
--- a/mediapipe/framework/formats/landmark.proto
+++ b/mediapipe/framework/formats/landmark.proto
@@ -26,6 +26,11 @@ message Landmark {
   optional float x = 1;
   optional float y = 2;
   optional float z = 3;
+
+  // Landmark visibility. Float score of whether landmark is visible or occluded
+  // by other objects. Depending on the model, visibility value is either a
+  // sigmoid or an argument of sigmoid.
+  optional float visibility = 4;
 }
 
 // Group of Landmark protos.
@@ -39,6 +44,7 @@ message NormalizedLandmark {
   optional float x = 1;
   optional float y = 2;
   optional float z = 3;
+  optional float visibility = 4;
 }
 
 // Group of NormalizedLandmark protos.
diff --git a/mediapipe/framework/formats/object_detection/BUILD b/mediapipe/framework/formats/object_detection/BUILD
index c073afa07..4a9f0ca50 100644
--- a/mediapipe/framework/formats/object_detection/BUILD
+++ b/mediapipe/framework/formats/object_detection/BUILD
@@ -15,10 +15,10 @@
 # Description:
 #   Working with dense optical flow in mediapipe.
 
-licenses(["notice"])  # Apache 2.0
-
 load("//mediapipe/framework/port:build_config.bzl", "mediapipe_cc_proto_library")
 
+licenses(["notice"])  # Apache 2.0
+
 package(default_visibility = ["//visibility:private"])
 
 proto_library(
diff --git a/mediapipe/framework/legacy_calculator_support.cc b/mediapipe/framework/legacy_calculator_support.cc
index b96d1e41f..13fd714ac 100644
--- a/mediapipe/framework/legacy_calculator_support.cc
+++ b/mediapipe/framework/legacy_calculator_support.cc
@@ -16,20 +16,11 @@
 
 namespace mediapipe {
 
-#if EMSCRIPTEN_WORKAROUND_FOR_B121216479
-template <>
-CalculatorContext*
-    LegacyCalculatorSupport::Scoped<CalculatorContext>::current_ = nullptr;
-template <>
-CalculatorContract*
-    LegacyCalculatorSupport::Scoped<CalculatorContract>::current_ = nullptr;
-#else
 template <>
 thread_local CalculatorContext*
     LegacyCalculatorSupport::Scoped<CalculatorContext>::current_ = nullptr;
 template <>
 thread_local CalculatorContract*
     LegacyCalculatorSupport::Scoped<CalculatorContract>::current_ = nullptr;
-#endif  // EMSCRIPTEN_WORKAROUND_FOR_B121216479
 
 }  // namespace mediapipe
diff --git a/mediapipe/framework/legacy_calculator_support.h b/mediapipe/framework/legacy_calculator_support.h
index 019473e67..6a76101bb 100644
--- a/mediapipe/framework/legacy_calculator_support.h
+++ b/mediapipe/framework/legacy_calculator_support.h
@@ -18,29 +18,6 @@
 #include "mediapipe/framework/calculator_context.h"
 #include "mediapipe/framework/calculator_contract.h"
 
-// In Emscripten builds without threading support, some member variables
-// declared "static thread_local" will not be linked correctly. To workaround
-// this we declare them only "static".
-// TODO: remove this macro and use thread_local unconditionally
-#if defined(__EMSCRIPTEN__) && !defined(__EMSCRIPTEN_PTHREADS__)
-#define EMSCRIPTEN_WORKAROUND_FOR_B121216479 1
-#endif
-
-namespace mediapipe {
-class GlCalculatorHelper;
-class MetalHelperLegacySupport;
-namespace aimatter {
-template <class T>
-class CachableAsyncLoadableObject;
-}
-}  // namespace mediapipe
-
-namespace xeno {
-namespace effect {
-class AssetRegistryServiceHelper;
-}  // namespace effect
-}  // namespace xeno
-
 namespace mediapipe {
 
 class LegacyCalculatorSupport {
@@ -55,12 +32,9 @@ class LegacyCalculatorSupport {
   // from that point, and the previous value is restored when execution leaves
   // that scope, as one would expect.
   //
-  // The current value is only accessible via this mechanism by a limited set
-  // of classes (listed as friends below). This is only meant to be used where
-  // backwards compatibility reasons prevent passing the CC directly.
-  //
-  // Only two specializations are allowed: Scoped<CalculatorContext> and
-  // Scoped<CalculatorContract>.
+  // This is only meant to be used where backwards compatibility reasons prevent
+  // passing the CC directly. Specifically, it can be used to access
+  // CalculatorContext and CalculatorContract from legacy calculator code.
   template <class C>
   class Scoped {
    public:
@@ -72,53 +46,26 @@ class LegacyCalculatorSupport {
     }
     ~Scoped() { current_ = saved_; }
 
+    // The current C* for this thread.
+    static C* current() { return current_; }
+
    private:
     // The value to restore after exiting this scope.
     C* saved_;
 
-    // The current C* for this thread.
-    //
     // This needs NOLINT because, when included in Objective-C++ files,
     // clang-tidy suggests using an Objective-C naming convention, which is
     // inappropriate. (b/116015736) No category specifier because of b/71698089.
-#if EMSCRIPTEN_WORKAROUND_FOR_B121216479
-    ABSL_CONST_INIT static C* current_;  // NOLINT
-#else
-    ABSL_CONST_INIT static thread_local C* current_;  // NOLINT
-#endif
-
-    static C* current() { return current_; }
-
-    // Only these classes are allowed to access the current CC via this
-    // mechanism.
-    friend class ::mediapipe::GlCalculatorHelper;
-    friend class ::mediapipe::MetalHelperLegacySupport;
-    template <class T>
-    friend class ::mediapipe::aimatter::CachableAsyncLoadableObject;
-    friend class ::xeno::effect::AssetRegistryServiceHelper;
+    //
+    // ABSL_CONST_INIT triggers b/155992786 with some versions of Clang on Apple
+    // platforms.
+#ifndef __APPLE__
+    ABSL_CONST_INIT
+#endif                                // !__APPLE__
+    static thread_local C* current_;  // NOLINT
   };
 };
 
-// We only declare this variable for two specializations of the template because
-// it is only meant to be used for these two types.
-#if EMSCRIPTEN_WORKAROUND_FOR_B121216479
-template <>
-CalculatorContext* LegacyCalculatorSupport::Scoped<CalculatorContext>::current_;
-template <>
-CalculatorContract*
-    LegacyCalculatorSupport::Scoped<CalculatorContract>::current_;
-#elif _MSC_VER
-// MSVC interprets these declarations as definitions and during linking it
-// generates an error about multiple definitions of current_.
-#else
-template <>
-thread_local CalculatorContext*
-    LegacyCalculatorSupport::Scoped<CalculatorContext>::current_;
-template <>
-thread_local CalculatorContract*
-    LegacyCalculatorSupport::Scoped<CalculatorContract>::current_;
-#endif  // EMSCRIPTEN_WORKAROUND_FOR_B121216479
-
 }  // namespace mediapipe
 
 #endif  // MEDIAPIPE_FRAMEWORK_LEGACY_CALCULATOR_SUPPORT_H_
diff --git a/mediapipe/framework/port/BUILD b/mediapipe/framework/port/BUILD
index 9b235be0f..68e158efd 100644
--- a/mediapipe/framework/port/BUILD
+++ b/mediapipe/framework/port/BUILD
@@ -153,6 +153,33 @@ cc_library(
     ],
 )
 
+cc_library(
+    name = "re2",
+    hdrs = [
+        "re2.h",
+    ],
+    visibility = ["//visibility:public"],
+    deps = [
+        "//mediapipe/framework/deps:re2",
+    ],
+)
+
+cc_library(
+    name = "gtest",
+    testonly = 1,
+    hdrs = [
+        "gmock.h",
+        "gtest.h",
+        "status_matchers.h",
+    ],
+    visibility = ["//visibility:public"],
+    deps = [
+        ":status_matchers",
+        "//mediapipe/framework:port",
+        "@com_google_googletest//:gtest",
+    ],
+)
+
 cc_library(
     name = "gtest_main",
     testonly = 1,
@@ -163,6 +190,7 @@ cc_library(
     ],
     visibility = ["//visibility:public"],
     deps = [
+        ":status_matchers",
         "//mediapipe/framework:port",
         "//mediapipe/framework/deps:status_matchers",
         "@com_google_googletest//:gtest_main",
@@ -369,6 +397,18 @@ cc_library(
     ],
 )
 
+cc_library(
+    name = "status_matchers",
+    testonly = 1,
+    hdrs = ["status_matchers.h"],
+    # Use this library through "mediapipe/framework/port:gtest_main".
+    visibility = ["//mediapipe/framework/port:__pkg__"],
+    deps = [
+        ":status",
+        "//mediapipe/framework/deps:status_matchers",
+    ],
+)
+
 cc_library(
     name = "threadpool",
     hdrs = ["threadpool.h"],
diff --git a/mediapipe/framework/port/build_config.bzl b/mediapipe/framework/port/build_config.bzl
index 787bbf1fc..f07c96c16 100644
--- a/mediapipe/framework/port/build_config.bzl
+++ b/mediapipe/framework/port/build_config.bzl
@@ -120,7 +120,7 @@ def mediapipe_proto_library(
 def mediapipe_py_proto_library(
         name,
         srcs,
-        visibility,
+        visibility = None,
         py_proto_deps = [],
         proto_deps = None,
         api_version = None,
@@ -147,7 +147,7 @@ def mediapipe_py_proto_library(
         testonly = testonly,
     ))
 
-def mediapipe_cc_proto_library(name, srcs, visibility, deps = [], cc_deps = [], testonly = 0):
+def mediapipe_cc_proto_library(name, srcs, visibility = None, deps = [], cc_deps = [], testonly = 0):
     """Generate cc_proto_library for mediapipe open source version.
 
       Args:
diff --git a/mediapipe/framework/port/re2.h b/mediapipe/framework/port/re2.h
new file mode 100644
index 000000000..fe2feecb4
--- /dev/null
+++ b/mediapipe/framework/port/re2.h
@@ -0,0 +1,6 @@
+#ifndef MEDIAPIPE_FRAMEWORK_PORT_RE2_H_
+#define MEDIAPIPE_FRAMEWORK_PORT_RE2_H_
+
+#include "mediapipe/framework/deps/re2.h"
+
+#endif  // MEDIAPIPE_FRAMEWORK_PORT_RE2_H_
diff --git a/mediapipe/framework/profiler/BUILD b/mediapipe/framework/profiler/BUILD
index e266fb867..aa770829a 100644
--- a/mediapipe/framework/profiler/BUILD
+++ b/mediapipe/framework/profiler/BUILD
@@ -298,3 +298,24 @@ cc_library(
         "//mediapipe:apple": [],
     }),
 )
+
+cc_test(
+    name = "reporter_test",
+    srcs = ["reporter_test.cc"],
+    data = [
+        "//mediapipe/framework/profiler/testdata:mediapipe_profile_graphs",
+    ],
+    visibility = ["//visibility:private"],
+    deps = [
+        "//mediapipe/framework:calculator_cc_proto",
+        "//mediapipe/framework:calculator_profile_cc_proto",
+        "//mediapipe/framework/deps:file_path",
+        "//mediapipe/framework/port:advanced_proto",
+        "//mediapipe/framework/port:gtest_main",
+        "//mediapipe/framework/port:parse_text_proto",
+        "//mediapipe/framework/profiler/reporter:reporter_lib",
+        "//mediapipe/framework/tool:test_util",
+        "@com_google_absl//absl/status",
+        "@com_google_absl//absl/strings",
+    ],
+)
diff --git a/mediapipe/framework/profiler/reporter/BUILD b/mediapipe/framework/profiler/reporter/BUILD
new file mode 100644
index 000000000..83f3dfe9e
--- /dev/null
+++ b/mediapipe/framework/profiler/reporter/BUILD
@@ -0,0 +1,62 @@
+# Copyright 2020 The MediaPipe Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+licenses(["notice"])  # Apache 2.0
+
+cc_library(
+    name = "reporter_lib",
+    srcs = [
+        "reporter.cc",
+        "statistic.cc",
+    ],
+    hdrs = [
+        "reporter.h",
+        "statistic.h",
+    ],
+    visibility = ["//visibility:public"],
+    deps = [
+        "//mediapipe/framework:calculator_cc_proto",
+        "//mediapipe/framework:calculator_framework",
+        "//mediapipe/framework:calculator_profile_cc_proto",
+        "//mediapipe/framework/port:advanced_proto",
+        "//mediapipe/framework/port:commandlineflags",
+        "//mediapipe/framework/port:file_helpers",
+        "//mediapipe/framework/port:parse_text_proto",
+        "//mediapipe/framework/port:re2",
+        "//mediapipe/framework/port:ret_check",
+        "//mediapipe/framework/port:status",
+        "//mediapipe/framework/port:statusor",
+        "@com_google_absl//absl/container:btree",
+        "@com_google_absl//absl/status",
+        "@com_google_absl//absl/strings",
+        "@com_google_absl//absl/strings:str_format",
+    ],
+)
+
+cc_binary(
+    name = "print_profile",
+    srcs = ["print_profile.cc"],
+    deps = [
+        ":reporter_lib",
+        "//mediapipe/framework/port:advanced_proto",
+        "//mediapipe/framework/port:commandlineflags",
+        "//mediapipe/framework/port:file_helpers",
+        "//mediapipe/framework/port:status",
+        "@com_google_absl//absl/container:btree",
+        "@com_google_absl//absl/flags:flag",
+        "@com_google_absl//absl/flags:parse",
+        "@com_google_absl//absl/flags:usage",
+    ],
+)
diff --git a/mediapipe/framework/profiler/reporter/README.md b/mediapipe/framework/profiler/reporter/README.md
new file mode 100644
index 000000000..12fa4bb06
--- /dev/null
+++ b/mediapipe/framework/profiler/reporter/README.md
@@ -0,0 +1,102 @@
+# Command Line Profiler
+
+Allows a user to analyze trace files generated by MediaPipe from the command
+line. If you would prefer to see this information visually (or if you can't
+build the tool), you can see the same information within viz.mediapipe.dev.
+For more information on this, see [Profile Visualization](https://docs.google.com/document/d/1inBoRzKDyKEjtVws8Seceoa0xRU3mqpPgM_myDBilS4/edit#heading=h.bnft45odm046) at go/mediapipe-profiler-guide
+
+See go/mediapipe-profiler-guide for a detailed user's guide.
+
+---
+
+## Building and Executing
+
+Navigate to:
+
+    //mediapipe/framework/profiler/reporter
+
+To run:
+
+    bazel run :print_profile
+
+To test:
+
+    bazel test //mediapipe/framework/profiler:reporter_test
+
+To print out the time columns and the total columns (as an example):
+
+    bazel run :print_profile -- --cols "*time*,*total*" --logfiles "<path-to-log>,<path-to-another-log>"
+
+
+---
+
+### print_profile [OPTION]... [FILE]...
+> Extract information from a set of MediaPipe trace files.
+
+**--compact**
+> print_profile will create lanes for each column, adding white space so that
+everything is easily readable. This option trims out any extra whitespace.
+
+**--cols**
+> Comma-separated set of columns to be shown. Omit to show everything. The user
+can use asterisks to match zero or more characters, or question marks to match a
+single character. (e.g., "time_*" will match "time_mean", "time_stddev", and so
+on).  "calculator" is always shown first.
+
+> Columns are listed below.
+
+#### Calculator Columns:
+
+**calculator**
+> The name of the calculator
+
+**fps**
+> The number of frames that this calculator can generate each second, on
+average. 1 / (latency_mean + time_mean) (Units are 1 / second).
+
+**frequency**
+
+> The rate that this calculator was asked to process packets per second.
+(Computed by # of calls total / (last_call_time - first_call_time)).  (Units are
+1 / second)
+
+**counter**
+> Number of times process() was called on the calculator. If the calculator
+generated outputs, then it will be reflected in "completed." If it did not, then
+this will be reflected in "dropped".
+
+**dropped**
+> Number of times the calculator was called but did not produce an output.
+
+**completed**
+> Number of times that this calculator was asked to process inputs after which
+it generated outputs.
+
+**processing_rate**
+> 1E+6 / time_mean.  The number of times per second this calculator could run
+process, on average.  (Units are 1 / second).
+
+**thread_count**
+> The number of threads that made use of each calculator.
+
+**time_mean**
+> Average time spent within a calculator (in microseconds).
+
+**time_stddev**
+> Standard deviation of time_mean (in microseconds).
+
+**time_total**
+> Total time spent within a calculator (in microseconds).
+
+**time_percent**
+> Percent of total time spent within a calculator.
+
+**input_latency_mean**
+> Average latency between earliest input packet and when calculator actually
+starts processing (in microseconds).
+
+**input_latency_stddev**
+> Standard deviation of input_latency_mean (in microseconds).
+
+**input_latency_total**
+> Total accumulated input_latency (in microseconds).
diff --git a/mediapipe/framework/profiler/reporter/print_profile.cc b/mediapipe/framework/profiler/reporter/print_profile.cc
new file mode 100644
index 000000000..86144df7b
--- /dev/null
+++ b/mediapipe/framework/profiler/reporter/print_profile.cc
@@ -0,0 +1,69 @@
+// Copyright 2019 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+//
+// This program reads one or more MediaPipe GraphProfile trace files
+// (.binarypb), accumulates their per-calculator statistics, and prints them
+// as a table on standard output.
+
+#include <algorithm>
+#include <fstream>
+
+#include "absl/container/btree_map.h"
+#include "absl/flags/flag.h"
+#include "absl/flags/parse.h"
+#include "absl/flags/usage.h"
+#include "mediapipe/framework/port/advanced_proto_inc.h"
+#include "mediapipe/framework/port/commandlineflags.h"
+#include "mediapipe/framework/port/file_helpers.h"
+#include "mediapipe/framework/port/status.h"
+#include "mediapipe/framework/profiler/reporter/reporter.h"
+
+// --logfiles: the trace files whose contents are accumulated into one report.
+ABSL_FLAG(std::vector<std::string>, logfiles, {},
+          "comma-separated list of .binarypb files to process.");
+// --cols: patterns selecting the statistics columns to print; the default "*"
+// selects every column.
+ABSL_FLAG(std::vector<std::string>, cols, {"*"},
+          "comma-separated list of columns to show. Suffix wildcards, '*', '?' "
+          "allowed.");
+// --compact: forwarded to Reporter::set_compact().
+ABSL_FLAG(bool, compact, false,
+          "if true, then don't print unnecessary whitespace.");
+
+using ::mediapipe::reporter::Reporter;
+
+// The command line utility to mine trace files of useful statistics to
+// determine bottlenecks and performance of a graph.
+//
+// Every file listed in --logfiles is parsed as a binary GraphProfile proto and
+// accumulated into a single Reporter; the combined report is then printed to
+// standard output. A file that cannot be opened or parsed is reported on
+// standard error and skipped.
+//
+// Returns 0 when every log file was processed and 1 if any file was skipped.
+int main(int argc, char** argv) {
+  absl::SetProgramUsageMessage("Display statistics from MediaPipe log files.");
+  absl::ParseCommandLine(argc, argv);
+
+  Reporter reporter;
+  reporter.set_compact(absl::GetFlag(FLAGS_compact));
+  // Invalid or unmatched column patterns only produce a warning; the columns
+  // that did match are still used.
+  const auto result = reporter.set_columns(absl::GetFlag(FLAGS_cols));
+  if (result.message().length()) {
+    std::cout << "WARNING" << std::endl << result.message();
+  }
+
+  bool all_files_ok = true;
+  const auto& flags_logfiles = absl::GetFlag(FLAGS_logfiles);
+  for (const auto& file_name : flags_logfiles) {
+    // The profiles are binary protos, so the stream must not apply any
+    // text-mode translation to the bytes it reads.
+    std::ifstream ifs(file_name.c_str(),
+                      std::ifstream::in | std::ifstream::binary);
+    // Without this check an unreadable file would look like empty input and
+    // be accumulated as an empty profile.
+    if (!ifs.is_open()) {
+      std::cerr << "Failed to open " << file_name << ".\n";
+      all_files_ok = false;
+      continue;
+    }
+    mediapipe::proto_ns::io::IstreamInputStream isis(&ifs);
+    mediapipe::proto_ns::io::CodedInputStream coded_input_stream(&isis);
+    mediapipe::GraphProfile proto;
+    if (!proto.ParseFromCodedStream(&coded_input_stream)) {
+      std::cerr << "Failed to parse proto.\n";
+      all_files_ok = false;
+    } else {
+      reporter.Accumulate(proto);
+    }
+  }
+  reporter.Report()->Print(std::cout);
+  return all_files_ok ? 0 : 1;
+}
diff --git a/mediapipe/framework/profiler/reporter/reporter.cc b/mediapipe/framework/profiler/reporter/reporter.cc
new file mode 100644
index 000000000..e9f5db6a0
--- /dev/null
+++ b/mediapipe/framework/profiler/reporter/reporter.cc
@@ -0,0 +1,448 @@
+#include "mediapipe/framework/profiler/reporter/reporter.h"
+
+#include <algorithm>
+#include <iterator>
+#include <memory>
+#include <ostream>
+#include <string>
+#include <string_view>
+#include <vector>
+
+#include "absl/container/btree_map.h"
+#include "absl/status/status.h"
+#include "absl/strings/str_format.h"
+#include "absl/strings/str_join.h"
+#include "fstream"
+#include "map"
+#include "mediapipe/framework/calculator_profile.pb.h"
+#include "mediapipe/framework/port/advanced_proto_inc.h"
+#include "mediapipe/framework/port/canonical_errors.h"
+#include "mediapipe/framework/port/re2.h"
+#include "mediapipe/framework/port/status.h"
+#include "mediapipe/framework/port/status_macros.h"
+
+namespace mediapipe {
+namespace reporter {
+
+// Accepts a column pattern made only of letters, digits, '_' and the
+// wildcards '?' and '*'.
+const LazyRE2 kValidColumnRegex = {"^[a-zA-Z0-9_?*]+$"};
+// Matches every '?' wildcard in a column pattern.
+const LazyRE2 kReplace1WildcharRegex = {"\\?"};
+// Matches every '*' wildcard in a column pattern.
+const LazyRE2 kReplace0toNWildcharRegex = {"\\*"};
+
+// Renders a value with two digits after the decimal point.
+std::string ToStringF(double d) {
+  std::string text = absl::StrFormat("%1.2f", d);
+  return text;
+}
+
+// Renders a value with no fractional digits.
+std::string ToString(double d) {
+  std::string text = absl::StrFormat("%1.0f", d);
+  return text;
+}
+
+// Maps each column name to the function that renders that column's value for
+// a single calculator. set_columns() matches patterns against these names and
+// Report() calls the functions to fill in the table cells.
+absl::btree_map<std::string,
+                std::function<const std::string(const CalculatorData&)>>
+    kColumns = {
+        {"calculator",
+         [](const CalculatorData& d) -> const std::string { return d.name; }},
+        {"counter",
+         [](const CalculatorData& d) -> const std::string {
+           return ToString(d.counter);
+         }},
+        {"completed",
+         [](const CalculatorData& d) -> const std::string {
+           return ToString(d.completed);
+         }},
+        {"dropped",
+         [](const CalculatorData& d) -> const std::string {
+           return ToString(d.dropped);
+         }},
+        {"fps",
+         [](const CalculatorData& d) -> const std::string {
+           return ToStringF(d.fps);
+         }},
+        {"frequency",
+         [](const CalculatorData& d) -> const std::string {
+           return ToStringF(d.frequency);
+         }},
+        {"processing_rate",
+         [](const CalculatorData& d) -> const std::string {
+           return ToStringF(d.processing_rate);
+         }},
+        {"thread_count",
+         [](const CalculatorData& d) -> const std::string {
+           return ToStringF(d.thread_count);
+         }},
+        {"time_mean",
+         [](const CalculatorData& d) -> const std::string {
+           return ToStringF(d.time_stat.mean());
+         }},
+        {"time_stddev",
+         [](const CalculatorData& d) -> const std::string {
+           return ToStringF(d.time_stat.stddev());
+         }},
+        {"time_total",
+         [](const CalculatorData& d) -> const std::string {
+           return ToString(d.time_stat.total());
+         }},
+        {"time_percent",
+         [](const CalculatorData& d) -> const std::string {
+           return ToStringF(d.time_percent);
+         }},
+        {"input_latency_mean",
+         [](const CalculatorData& d) -> const std::string {
+           return ToStringF(d.input_latency_stat.mean());
+         }},
+        {"input_latency_stddev",
+         [](const CalculatorData& d) -> const std::string {
+           return ToStringF(d.input_latency_stat.stddev());
+         }},
+        {"input_latency_total",
+         [](const CalculatorData& d) -> const std::string {
+           return ToString(d.input_latency_stat.total());
+         }}};
+
+// Finds the calculator trace that emitted a packet, keyed by
+// (packet timestamp, stream ID).
+using PacketKeyToCalcTrace =
+    std::map<std::pair<int64_t, int32_t>,
+             const mediapipe::GraphTrace::CalculatorTrace*>;
+
+// Finds the calculator trace carrying the start time of a PROCESS event,
+// keyed by (input timestamp, (node ID, thread ID)).
+using TimestampNodeIdToCalcTrace =
+    std::map<std::pair<int64_t, std::pair<int32_t, int32_t>>,
+             const mediapipe::GraphTrace::CalculatorTrace*>;
+
+// Maps node IDs to names.
+using NameLookup = std::map<int32_t, std::string>;
+
+// A new Reporter starts with every column selected (pattern "*").
+Reporter::Reporter() { MEDIAPIPE_CHECK_OK(set_columns({"*"})); }
+
+// Returns the earliest start time reachable from `trace` by following each of
+// its input packets back to the calculator trace that emitted it. A trace
+// without a start time contributes its finish time instead.
+//
+// `visited_calculators` collects the node IDs already expanded; a node that is
+// met a second time is not expanded again, which stops loops in the graph.
+// `profile` is only forwarded to the recursive calls.
+int64_t RecursePacketStartTime(
+    const PacketKeyToCalcTrace& output_trace_lookup,
+    const mediapipe::GraphProfile& profile,
+    const mediapipe::GraphTrace::CalculatorTrace& trace,
+    std::vector<int32_t>* visited_calculators) {
+  int64_t earliest;
+  if (trace.has_start_time()) {
+    earliest = trace.start_time();
+  } else {
+    earliest = trace.finish_time();
+  }
+
+  const int32_t current_node = trace.node_id();
+  const bool already_visited =
+      std::find(visited_calculators->begin(), visited_calculators->end(),
+                current_node) != visited_calculators->end();
+  if (already_visited) {
+    return earliest;
+  }
+  visited_calculators->push_back(current_node);
+
+  for (const auto& input : trace.input_trace()) {
+    // Look for the trace whose output produced this input packet.
+    const auto producer = output_trace_lookup.find(
+        std::make_pair(input.packet_timestamp(), input.stream_id()));
+    if (producer == output_trace_lookup.end()) {
+      continue;
+    }
+    const int64_t upstream_start = RecursePacketStartTime(
+        output_trace_lookup, profile, *producer->second, visited_calculators);
+    earliest = std::min(earliest, upstream_start);
+  }
+  return earliest;
+}
+
+// Returns how long before `trace` started the earliest upstream calculator
+// feeding it started, as found by RecursePacketStartTime(). Returns 0 when
+// `trace` has no start time, since there is then nothing to measure against.
+int64_t CalculateInputLatency(
+    const PacketKeyToCalcTrace& output_trace_lookup,
+    const mediapipe::GraphProfile& profile,
+    const mediapipe::GraphTrace::CalculatorTrace& trace) {
+  if (!trace.has_start_time()) {
+    return 0;
+  }
+
+  // Filled in by the recursion so that loops in the graph terminate.
+  std::vector<int> visited_calculators;
+  const int64_t earliest_upstream_start = RecursePacketStartTime(
+      output_trace_lookup, profile, trace, &visited_calculators);
+  return trace.start_time() - earliest_upstream_start;
+}
+
+// Fills `result` with node ID -> calculator name, where a calculator's node ID
+// is its position in the graph trace's calculator_name list. Entries from
+// later graph traces overwrite earlier ones with the same ID.
+void CacheNodeNameLookup(const mediapipe::GraphProfile& profile,
+                         NameLookup* result) {
+  for (const auto& graph_trace : profile.graph_trace()) {
+    const int name_count = graph_trace.calculator_name_size();
+    for (int node_id = 0; node_id < name_count; ++node_id) {
+      (*result)[node_id] = graph_trace.calculator_name(node_id);
+    }
+  }
+}
+
+// Indexes the PROCESS events of `profile`:
+//  - `start_time_lookup` receives every event that has a start time but no
+//    finish time, keyed by (input timestamp, (node ID, thread ID));
+//  - `output_trace_lookup` receives, for every output packet, the event that
+//    emitted it, keyed by (packet timestamp, stream ID).
+// The stored pointers refer to messages owned by `profile`.
+void CacheOutputTraceLookup(const mediapipe::GraphProfile& profile,
+                            PacketKeyToCalcTrace* output_trace_lookup,
+                            TimestampNodeIdToCalcTrace* start_time_lookup) {
+  for (const auto& graph_trace : profile.graph_trace()) {
+    for (const auto& event : graph_trace.calculator_trace()) {
+      const bool is_process_event =
+          event.event_type() == mediapipe::GraphTrace_EventType_PROCESS;
+      if (!is_process_event) {
+        continue;
+      }
+
+      const bool is_start_only =
+          event.has_start_time() && !event.has_finish_time();
+      if (is_start_only) {
+        const auto node_and_thread =
+            std::make_pair(event.node_id(), event.thread_id());
+        const auto start_key =
+            std::make_pair(event.input_timestamp(), node_and_thread);
+        (*start_time_lookup)[start_key] = &event;
+      }
+
+      for (const auto& output : event.output_trace()) {
+        const auto packet_key =
+            std::make_pair(output.packet_timestamp(), output.stream_id());
+        (*output_trace_lookup)[packet_key] = &event;
+      }
+    }
+  }
+}
+
+// Derives the summary fields of every calculator (fps, frequency,
+// time_percent, dropped, processing_rate, thread_count) from the counters and
+// statistics accumulated so far. A rate or percentage whose denominator is
+// zero is reported as 0.
+void CompleteCalculatorData(
+    const GraphData& graph_data,
+    std::map<std::string, CalculatorData>* calculator_data) {
+  // Length of the whole trace. min_time and max_time keep their sentinel
+  // values until a start or finish time has been recorded; in that case
+  // max_time < min_time, there is no duration to measure, and subtracting the
+  // sentinels would overflow.
+  const double trace_duration =
+      graph_data.max_time > graph_data.min_time
+          ? static_cast<double>(graph_data.max_time - graph_data.min_time)
+          : 0.0;
+
+  for (auto& calc_entry : *calculator_data) {
+    auto& calc_data = calc_entry.second;
+    const double mean_time = calc_data.time_stat.mean();
+    const double time_to_process =
+        mean_time + calc_data.input_latency_stat.mean();
+
+    // Times are divided by 1.0E+6 to turn them into per-second rates.
+    calc_data.fps = time_to_process == 0 ? 0 : 1.0E+6 / time_to_process;
+    calc_data.frequency =
+        trace_duration == 0 ? 0
+                            : calc_data.completed / (trace_duration / 1.0E+6);
+    calc_data.time_percent =
+        graph_data.total_time == 0
+            ? 0
+            : 100 * calc_data.time_stat.total() / graph_data.total_time;
+    calc_data.dropped = calc_data.counter - calc_data.completed;
+    calc_data.processing_rate = mean_time == 0 ? 0 : 1.0 / mean_time * 1.0E+6;
+    calc_data.thread_count = calc_data.threads.size();
+  }
+}
+
+// Folds the PROCESS events of `profile` into the per-calculator statistics and
+// the graph-wide time range held by this Reporter. Events of any other type
+// are ignored.
+void Reporter::Accumulate(const mediapipe::GraphProfile& profile) {
+  // Cache nodeID to its std::string name.
+  NameLookup name_lookup;
+  CacheNodeNameLookup(profile, &name_lookup);
+
+  // Cache some lookups so that we can quickly find the matching output stream
+  // for a given input stream, and so that we can find the start time of a
+  // given timestamp of a node.
+  PacketKeyToCalcTrace output_trace_lookup;
+  TimestampNodeIdToCalcTrace start_event_lookup;
+  CacheOutputTraceLookup(profile, &output_trace_lookup, &start_event_lookup);
+
+  // Hold the domain of all times found in the trace file.
+  auto& min_time = graph_data_.min_time;
+  auto& max_time = graph_data_.max_time;
+  auto& total_time = graph_data_.total_time;
+
+  for (const auto& graph_trace : profile.graph_trace()) {
+    for (const auto& calc_trace : graph_trace.calculator_trace()) {
+      if (calc_trace.event_type() != mediapipe::GraphTrace_EventType_PROCESS) {
+        continue;
+      }
+
+      // A node ID without a cached name yields an empty name; Report() leaves
+      // calculators with an empty name out of the table.
+      const auto& node_name = name_lookup[calc_trace.node_id()];
+      auto& calc_data = calculator_data_[node_name];
+
+      calc_data.name = node_name;
+      calc_data.threads.insert(calc_trace.thread_id());
+
+      // If there is a start time, update the domain of the trace time, and
+      // mark that we've seen a start time for this calculator.
+      if (calc_trace.has_start_time()) {
+        min_time =
+            std::min(min_time, static_cast<int64_t>(calc_trace.start_time() +
+                                                    graph_trace.base_time()));
+        ++calc_data.counter;
+      }
+
+      // If there is a finish time, update the domain and mark that an event
+      // has been completed.
+      if (calc_trace.has_finish_time()) {
+        const auto finish_time =
+            calc_trace.finish_time() + graph_trace.base_time();
+        max_time = std::max(max_time, static_cast<int64_t>(finish_time));
+
+        // The start and finish time of a PROCESS event might be split between
+        // two events. When this event has no start time of its own, look for
+        // the start-only event with the same input timestamp, node and thread.
+        absl::optional<int64_t> start_time;
+        if (calc_trace.has_start_time()) {
+          start_time.emplace(calc_trace.start_time());
+        } else {
+          const auto start_event_it = start_event_lookup.find(std::make_pair(
+              calc_trace.input_timestamp(),
+              std::make_pair(calc_trace.node_id(), calc_trace.thread_id())));
+          if (start_event_it != start_event_lookup.end()) {
+            start_time.emplace(start_event_it->second->start_time());
+          }
+        }
+
+        // Edge case -- If a finish time came in without a start time, then
+        // we know that an event started before the trace became available.
+        // But since we don't know when that is, we can't record its duration
+        // and won't count it.
+        if (start_time) {
+          ++calc_data.completed;
+          // Add up the duration of the events that led up to this start
+          // event.
+          const auto input_latency =
+              CalculateInputLatency(output_trace_lookup, profile, calc_trace);
+          calc_data.input_latency_stat.Push(input_latency);
+          const auto duration =
+              finish_time - (start_time.value() + graph_trace.base_time());
+          calc_data.time_stat.Push(duration);
+          total_time += duration;
+        }
+      }
+    }
+  }
+}
+
+// Replaces the selected report columns with those matching `columns`.
+//
+// Each entry is a column name or a pattern using '*' (any run of characters)
+// and '?' (any single character). "calculator" is always selected first; the
+// other columns follow in the order the patterns matched them, without
+// duplicates.
+//
+// Returns OK when every pattern is valid and matches at least one column.
+// Otherwise returns InvalidArgument listing the offending patterns; the
+// columns that did match are applied regardless.
+::mediapipe::Status Reporter::set_columns(
+    const std::vector<std::string>& columns) {
+  std::stringstream problems;
+  bool has_problem = false;
+  std::vector<std::string> selected({"calculator"});
+
+  for (const auto& pattern : columns) {
+    if (!RE2::PartialMatch(pattern, *kValidColumnRegex)) {
+      problems << "Column '" << pattern << "' is invalid." << std::endl;
+      has_problem = true;
+      continue;
+    }
+
+    // Translate the wildcard pattern into a regular expression.
+    std::string pattern_regex = pattern;
+    RE2::GlobalReplace(&pattern_regex, *kReplace0toNWildcharRegex, ".*");
+    RE2::GlobalReplace(&pattern_regex, *kReplace1WildcharRegex, ".");
+
+    // Select every available column the pattern matches, skipping the ones
+    // that were already selected.
+    int match_count = 0;
+    for (const auto& column : kColumns) {
+      const std::string& column_name = column.first;
+      if (!RE2::FullMatch(column_name, pattern_regex)) {
+        continue;
+      }
+      ++match_count;
+      const bool already_selected =
+          std::find(selected.begin(), selected.end(), column_name) !=
+          selected.end();
+      if (!already_selected) {
+        selected.push_back(column_name);
+      }
+    }
+    if (match_count == 0) {
+      problems << "Column '" << pattern << "' did not match any columns."
+               << std::endl;
+      has_problem = true;
+    }
+  }
+
+  // As long as there is still one column, honor the request, even if error.
+  if (!selected.empty()) {
+    columns_.swap(selected);
+  }
+  if (has_problem) {
+    return ::mediapipe::InvalidArgumentError(problems.str());
+  }
+  return ::mediapipe::OkStatus();
+}
+
+// The Report implementation built by Reporter::Report(), which fills in the
+// public *_impl members directly after construction.
+class ReportImpl : public Report {
+ public:
+  // Keeps references to (not copies of) `calculator_data` and `graph_data`,
+  // so both must outlive this report.
+  ReportImpl(const std::map<std::string, CalculatorData>& calculator_data,
+             const GraphData& graph_data)
+      : calculator_data_(calculator_data), graph_data_(graph_data) {}
+  // Writes the header row followed by one row per line to `output`.
+  void Print(std::ostream& output) override;
+  const std::vector<std::string>& headers() override { return headers_impl; }
+  const std::vector<std::vector<std::string>>& lines() override {
+    return lines_impl;
+  }
+  const GraphData& graph_data() override { return graph_data_; }
+  const std::map<std::string, CalculatorData>& calculator_data() override {
+    return calculator_data_;
+  }
+
+  // The header name of each column, copied from the Reporter's selected
+  // columns; the first one is always "calculator".
+  std::vector<std::string> headers_impl;
+
+  // Values for each calculator, corresponding to the label in headers().
+  std::vector<std::vector<std::string>> lines_impl;
+
+  // The longest std::string of any value in a given column (including the
+  // header for that column). Used for formatting the output.
+  std::vector<size_t> char_counts_impl;
+  // When true, Print() separates columns with a single space instead of
+  // aligning them.
+  bool compact_flag = false;
+
+  // Data owned by the Reporter that created this report.
+  const std::map<std::string, CalculatorData>& calculator_data_;
+  const GraphData& graph_data_;
+};
+
+// Writes the report as text: the header row first, then one row per line,
+// each terminated by std::endl. Every cell is followed by spaces up to its
+// column's widest entry plus one, or by exactly one space in compact mode.
+void ReportImpl::Print(std::ostream& output) {
+  // Header and data rows share the same layout, so one helper prints both.
+  const auto print_row = [this,
+                          &output](const std::vector<std::string>& cells) {
+    int column_number = 0;
+    // Each cell is copied because the padding is appended to it in place.
+    for (std::string cell : cells) {
+      int padding_needed =
+          char_counts_impl[column_number] + 1 - cell.length();
+      if (compact_flag) {
+        padding_needed = 1;
+      }
+      cell.append(padding_needed, ' ');
+      output << cell;
+      ++column_number;
+    }
+    output << std::endl;
+  };
+
+  print_row(headers_impl);
+  for (const auto& row : lines_impl) {
+    print_row(row);
+  }
+}
+
+// Builds a report of the statistics accumulated so far: the derived fields of
+// every calculator are recomputed, then each selected column is rendered for
+// each calculator with a non-empty name. The widest entry of every column
+// (header included) is recorded for use when printing.
+std::unique_ptr<Report> Reporter::Report() {
+  CompleteCalculatorData(graph_data_, &calculator_data_);
+
+  auto report = std::make_unique<ReportImpl>(calculator_data_, graph_data_);
+  report->compact_flag = compact_flag_;
+  report->headers_impl = columns_;
+
+  const auto& headers = report->headers_impl;
+  auto& rows = report->lines_impl;
+  auto& widths = report->char_counts_impl;
+
+  // Every column starts out as wide as its header.
+  for (const auto& header : headers) {
+    widths.push_back(header.size());
+  }
+
+  // The table is filled one column at a time; a row is created the first time
+  // a value is stored for it.
+  for (const auto& header : headers) {
+    const auto& format_cell = kColumns[header];
+    size_t row_index = 0;
+    for (const auto& entry : calculator_data_) {
+      const CalculatorData& data = entry.second;
+      const std::string cell = format_cell(data);
+      if (data.name.empty()) {
+        continue;
+      }
+      if (row_index >= rows.size()) {
+        rows.emplace_back();
+      }
+      auto& row = rows[row_index];
+      row.push_back(cell);
+      const size_t column_index = row.size() - 1;
+      widths[column_index] = std::max(widths[column_index], cell.length());
+      ++row_index;
+    }
+  }
+  return report;
+}
+
+}  // namespace reporter
+}  // namespace mediapipe
diff --git a/mediapipe/framework/profiler/reporter/reporter.h b/mediapipe/framework/profiler/reporter/reporter.h
new file mode 100644
index 000000000..8652fdbdb
--- /dev/null
+++ b/mediapipe/framework/profiler/reporter/reporter.h
@@ -0,0 +1,130 @@
+#ifndef MEDIAPIPE_FRAMEWORK_PROFILER_REPORTER_REPORTER_H_
+#define MEDIAPIPE_FRAMEWORK_PROFILER_REPORTER_REPORTER_H_
+
+#include <memory>
+#include <ostream>
+#include <set>
+
+#include "map"
+#include "mediapipe/framework/calculator.pb.h"
+#include "mediapipe/framework/calculator_profile.pb.h"
+#include "mediapipe/framework/port/status.h"
+#include "mediapipe/framework/profiler/reporter/statistic.h"
+
+namespace mediapipe {
+namespace reporter {
+
+// Timing data for the graph as a whole, updated by Reporter::Accumulate().
+struct GraphData {
+  // Earliest calculator start time recorded so far. Stays at the int64_t
+  // maximum until a start time has been seen.
+  int64_t min_time = std::numeric_limits<int64_t>::max();
+
+  // Latest calculator finish time recorded so far. Stays at the int64_t
+  // minimum until a finish time has been seen.
+  int64_t max_time = std::numeric_limits<int64_t>::min();
+
+  // Sum of the durations of all completed PROCESS events.
+  int64_t total_time = 0;
+};
+
+// Holds all of the measured data for a calculator. Every numeric field starts
+// at zero so that a default-initialized instance never holds an indeterminate
+// value.
+struct CalculatorData {
+  // Name of the calculator.
+  std::string name;
+
+  // The number of times the calculator was detected entering a PROCESS state.
+  int counter = 0;
+
+  // The number of times the calculator finished its process state.
+  int completed = 0;
+
+  // The number of PROCESS events that were started but not completed
+  // (counter - completed).
+  double dropped = 0;
+
+  // Specifies how quickly (1/s) this calculator can output events given its
+  // input latency and processing time.
+  double fps = 0;
+
+  // Reports how often this calculator was called across the lifetime of the
+  // trace (1/s).
+  double frequency = 0;
+
+  // The number of distinct threads this calculator ran on.
+  double thread_count = 0;
+
+  // Reports how fast this calculator can run in isolation. (1/s).
+  double processing_rate = 0;
+
+  // Percentage of the total time spent in this calculator.
+  double time_percent = 0;
+
+  // Records the total time this calculator spent in PROCESS (microseconds).
+  Statistic time_stat;
+
+  // Records the input latency (microseconds). This is the longest time
+  // it takes for the input packets of a calculator to reach this calculator
+  // from their origin.
+  Statistic input_latency_stat;
+
+  // The threads on which this calculator ran.
+  std::set<int> threads;
+};
+
+// A snapshot of statistics generated by Reporter.
+class Report {
+ public:
+  virtual ~Report() = default;
+
+  // Prints the data contained within the report to a given
+  // stream (e.g., std::cout).
+  virtual void Print(std::ostream& output) = 0;
+
+  // Provides the list of headers included in the report. The column
+  // "calculator" will always come first, followed by the selected
+  // columns in the order in which the column patterns matched them
+  // (alphabetical among the columns matched by a single pattern).
+  virtual const std::vector<std::string>& headers() = 0;
+
+  // Provides a line for each calculator which in turn contains the name
+  // of the calculator followed by stringified values of each column's
+  // statistics.
+  virtual const std::vector<std::vector<std::string>>& lines() = 0;
+
+  // Returns summary data for the graph. Invalidated if Report() is called again
+  // on Reporter.
+  virtual const GraphData& graph_data() = 0;
+
+  // Returns summary data for each calculator in the graph. Invalidated if
+  // Report() is called again on Reporter.
+  virtual const std::map<std::string, CalculatorData>& calculator_data() = 0;
+};
+
+// Provides a way to accumulate statistics from one or more
+// GraphProfile protobufs in order to generate a report summarizing
+// the statistics within them.
+class Reporter {
+ public:
+  // Selects every column by default.
+  Reporter();
+
+  // Adds the contents of a given profile.
+  void Accumulate(const mediapipe::GraphProfile& profile);
+
+  // Accepts names of columns or wildcard patterns (* or ?) to
+  // select which statistics columns will be included in a generated
+  // report. Returns an error status describing any pattern that is
+  // invalid or matches no column.
+  ::mediapipe::Status set_columns(const std::vector<std::string>& columns);
+
+  // Generates a report based on the current accumulated statistics.
+  std::unique_ptr<reporter::Report> Report();
+
+  // Set to true to remove decorative whitespace from the output.
+  void set_compact(bool value) { compact_flag_ = value; }
+
+ private:
+  bool compact_flag_ = false;
+
+  // Names of the columns to include in a report; "calculator" comes first.
+  std::vector<std::string> columns_;
+
+  // Maps calculator.name -> profile information for that calculator.
+  std::map<std::string, CalculatorData> calculator_data_;
+  // Time range and total processing time across all accumulated profiles.
+  GraphData graph_data_;
+};
+
+}  // namespace reporter
+}  // namespace mediapipe
+
+#endif  // MEDIAPIPE_FRAMEWORK_PROFILER_REPORTER_REPORTER_H_
diff --git a/mediapipe/framework/profiler/reporter/statistic.cc b/mediapipe/framework/profiler/reporter/statistic.cc
new file mode 100644
index 000000000..4923f9d2f
--- /dev/null
+++ b/mediapipe/framework/profiler/reporter/statistic.cc
@@ -0,0 +1,46 @@
+#include "mediapipe/framework/profiler/reporter/statistic.h"
+
+#include <cmath>
+
+#include "mediapipe/framework/calculator.pb.h"
+#include "mediapipe/framework/calculator_profile.pb.h"
+
+namespace mediapipe {
+namespace reporter {
+
+// Adds one sample to the statistic, updating the running total, the mean and
+// the sum of squared differences from which the stddev is derived.
+void Statistic::Push(double x) {
+  ++counter_;
+
+  // The first sample (re)initializes every accumulator.
+  if (counter_ == 1) {
+    total_impl_ = x;
+    mean_ = x;
+    ssd_ = 0.0;
+    return;
+  }
+
+  // Welford's online update of the mean and the sum of squared differences.
+  const double previous_mean = mean_;
+  total_impl_ += x;
+  mean_ = previous_mean + (x - previous_mean) / counter_;
+  ssd_ += (x - mean_) * (x - previous_mean);
+}
+
+// Returns the number of data points used to calculate the mean and
+// stddev.
+int Statistic::data_count() const { return counter_; }
+
+// Returns the mean of the data pushed into this statistic, or 0 if no data
+// has been pushed.
+double Statistic::mean() const { return (counter_ > 0) ? mean_ : 0.0; }
+
+// Returns the sample variance (divided by n - 1) of the data pushed into this
+// statistic, or 0 with fewer than two data points.
+double Statistic::variance() const {
+  return ((counter_ > 1) ? ssd_ / (counter_ - 1) : 0.0);
+}
+
+// Returns the standard deviation of the data pushed into this statistic.
+double Statistic::stddev() const { return std::sqrt(variance()); }
+
+// Returns the sum of the data pushed into this statistic, or 0 if no data has
+// been pushed since construction or the last Clear(). The guard mirrors
+// mean(): the stored total is only meaningful once a value has been pushed.
+double Statistic::total() const { return (counter_ > 0) ? total_impl_ : 0.0; }
+
+}  // namespace reporter
+}  // namespace mediapipe
diff --git a/mediapipe/framework/profiler/reporter/statistic.h b/mediapipe/framework/profiler/reporter/statistic.h
new file mode 100644
index 000000000..fb4bdf8db
--- /dev/null
+++ b/mediapipe/framework/profiler/reporter/statistic.h
@@ -0,0 +1,51 @@
+#ifndef MEDIAPIPE_FRAMEWORK_PROFILER_REPORTER_STATISTIC_H_
+#define MEDIAPIPE_FRAMEWORK_PROFILER_REPORTER_STATISTIC_H_
+
+#include "mediapipe/framework/calculator.pb.h"
+#include "mediapipe/framework/calculator_profile.pb.h"
+
+namespace mediapipe {
+namespace reporter {
+
+// Allows the user to push data and maintains a counter, mean, and stddev of
+// that data. A new or cleared statistic holds no data and has every
+// accumulator set to zero.
+class Statistic {
+ public:
+  Statistic() = default;
+
+  // Clears the current statistic, discarding the count, total, mean and
+  // variance accumulated so far.
+  void Clear() {
+    counter_ = 0;
+    total_impl_ = 0.0;
+    mean_ = 0.0;
+    ssd_ = 0.0;
+  }
+
+  // Pushes a single value into the statistic, updating mean and stddev.
+  void Push(double x);
+
+  // Returns the number of data points used to calculate the mean and stddev.
+  int data_count() const;
+
+  // Returns the mean of the data pushed into this statistic.
+  double mean() const;
+
+  // Returns the variance of the data pushed into this statistic.
+  double variance() const;
+
+  // Returns the standard deviation of the data pushed into this statistic.
+  double stddev() const;
+
+  // Returns the sum of values of this statistic.
+  double total() const;
+
+ private:
+  // Number of values pushed since construction or the last Clear().
+  int counter_ = 0;
+  // Sum of the pushed values.
+  double total_impl_ = 0.0;
+
+  // Welford's algorithm allows us to keep a running standard deviation. We need
+  // to hang onto the mean and sum of squared differences in between calls to
+  // push().
+  double mean_ = 0.0;
+  double ssd_ = 0.0;
+};
+
+}  // namespace reporter
+}  // namespace mediapipe
+
+#endif  // MEDIAPIPE_FRAMEWORK_PROFILER_REPORTER_STATISTIC_H_
diff --git a/mediapipe/framework/profiler/reporter_test.cc b/mediapipe/framework/profiler/reporter_test.cc
new file mode 100644
index 000000000..9bdb1557b
--- /dev/null
+++ b/mediapipe/framework/profiler/reporter_test.cc
@@ -0,0 +1,231 @@
+// Copyright 2018 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "mediapipe/framework/profiler/reporter/reporter.h"
+
+#include <fcntl.h>
+#include <unistd.h>
+
+#include <memory>
+#include <sstream>
+#include <string>
+
+#include "absl/status/status.h"
+#include "absl/strings/str_cat.h"
+#include "mediapipe/framework/calculator.pb.h"
+#include "mediapipe/framework/calculator_profile.pb.h"
+#include "mediapipe/framework/port/advanced_proto_inc.h"
+#include "mediapipe/framework/port/gmock.h"
+#include "mediapipe/framework/port/gtest.h"
+#include "mediapipe/framework/port/proto_ns.h"
+#include "mediapipe/framework/port/status_matchers.h"
+#include "mediapipe/framework/profiler/reporter/statistic.h"
+#include "mediapipe/framework/tool/test_util.h"
+
+namespace mediapipe {
+
+using ::mediapipe::reporter::Reporter;
+using ::testing::ElementsAre;
+using ::testing::HasSubstr;
+using ::testing::IsSupersetOf;
+
+void LoadGraphProfile(const std::string& path, GraphProfile* proto) {
+  int fd = open(path.c_str(), O_RDONLY);
+  if (fd == -1) {
+    LOG(ERROR) << "could not open test graph: " << path
+               << ", error: " << strerror(errno);
+    return;
+  }
+  proto_ns::io::FileInputStream input(fd);
+  bool success = proto->ParseFromZeroCopyStream(&input);
+  close(fd);
+  if (!success) {
+    LOG(ERROR) << "could not parse test graph: " << path;
+  }
+}
+
+std::unique_ptr<Reporter> loadReporter(const std::vector<std::string>& paths) {
+  auto reporter = std::make_unique<Reporter>();
+  for (const auto& path : paths) {
+    GraphProfile profile;
+    LoadGraphProfile(
+        absl::StrCat(GetTestDataDir("mediapipe/framework/profiler"), path),
+        &profile);
+    reporter->Accumulate(profile);
+  }
+  return reporter;
+}
+
+TEST(Reporter, Trivial) {
+  auto reporter = loadReporter({"profile_opencv_0.binarypb"});
+}
+
+TEST(Reporter, ReportAllColumns) {
+  auto reporter = loadReporter({"profile_opencv_0.binarypb"});
+  auto report = reporter->Report();
+
+  EXPECT_THAT(report->headers(),
+              IsSupersetOf({"calculator", "time_mean", "time_stddev",
+                            "time_total", "input_latency_mean",
+                            "input_latency_stddev", "input_latency_total"}));
+  EXPECT_EQ(report->headers()[0], "calculator");
+}
+
+// Reports only the "calculator" column and one additional column using no
+// wildcards.
+TEST(Reporter, ReportOneColumn) {
+  auto reporter = loadReporter({"profile_opencv_0.binarypb"});
+  MEDIAPIPE_CHECK_OK(reporter->set_columns({"time_mean"}));
+  auto report = reporter->Report();
+  EXPECT_THAT(report->headers(), ElementsAre("calculator", "time_mean"));
+}
+
+// Reports the "calculator" column and additional columns using wildcards.
+// After 'calculator', columns are alphabetical within each pattern's matches.
+TEST(Reporter, ReportColumnsWithWildcards) {
+  auto reporter = loadReporter({"profile_opencv_0.binarypb"});
+  MEDIAPIPE_CHECK_OK(reporter->set_columns({"*_m??n", "*l?t*cy*"}));
+  EXPECT_THAT(reporter->Report()->headers(),
+              ElementsAre("calculator", "input_latency_mean", "time_mean",
+                          "input_latency_stddev", "input_latency_total"));
+}
+
+TEST(Reporter, AggregatesAreRecorded) {
+  auto reporter = loadReporter({"profile_opencv_0.binarypb"});
+  MEDIAPIPE_CHECK_OK(reporter->set_columns({"time_*", "*latency*"}));
+  const auto& report = reporter->Report();
+  const auto& lines = report->lines();
+  EXPECT_EQ(lines.size(), 3);
+  EXPECT_THAT(lines[2],
+              ElementsAre("OpenCvWriteTextCalculator", "13823.77", "100.00",
+                          "5541.47", "1976799", "245.13", "464.27", "35054"));
+}
+
+TEST(Reporter, JoinsFiles) {
+  auto reporter = loadReporter({
+      "profile_opencv_0.binarypb",
+      "profile_opencv_1.binarypb",
+  });
+  MEDIAPIPE_CHECK_OK(reporter->set_columns({"time_*", "*latency*"}));
+  const auto& report = reporter->Report();
+  const auto& lines = report->lines();
+  EXPECT_EQ(lines.size(), 3);
+  EXPECT_THAT(lines[2],
+              ElementsAre("OpenCvWriteTextCalculator", "14707.77", "100.00",
+                          "5630.52", "3000385", "237.50", "389.35", "48449"));
+}
+
+TEST(Reporter, PrintAllColumns) {
+  auto reporter = loadReporter({"profile_opencv_0.binarypb"});
+  auto report = reporter->Report();
+
+  std::stringstream output;
+  report->Print(output);
+  output.seekg(0);  // Rewind the read position before parsing the header.
+
+  std::string header;
+  std::getline(output, header);
+  EXPECT_THAT(header,
+              AllOf(HasSubstr("calculator"), HasSubstr("input_latency_mean"),
+                    HasSubstr("input_latency_stddev"),
+                    HasSubstr("input_latency_total"), HasSubstr("time_mean"),
+                    HasSubstr("time_stddev"), HasSubstr("time_total")));
+}
+
+TEST(Reporter, CanReportBadColumns) {
+  auto reporter = loadReporter({"profile_opencv_0.binarypb"});
+  auto result = reporter->set_columns({"il[leg]al"});
+  EXPECT_EQ(result.code(), StatusCode::kInvalidArgument);
+  EXPECT_EQ(result.message(), "Column 'il[leg]al' is invalid.\n");
+}
+
+TEST(Reporter, CanReportNonMatchingColumns) {
+  auto reporter = loadReporter({"profile_opencv_0.binarypb"});
+  auto result = reporter->set_columns({"time_*", "il[leg]al"});
+  EXPECT_EQ(result.code(), StatusCode::kInvalidArgument);
+  EXPECT_EQ(result.message(), "Column 'il[leg]al' is invalid.\n");
+  // Should not affect active columns, which is currently still "*".
+  auto report = reporter->Report();
+  EXPECT_THAT(report->headers(),
+              IsSupersetOf({"calculator", "time_mean", "time_stddev"}));
+}
+
+TEST(Reporter, BadPatternsIgnored) {
+  auto reporter = loadReporter({"profile_opencv_0.binarypb"});
+  auto result = reporter->set_columns({"time_mean", "il[leg]al", "^bad"});
+  EXPECT_EQ(result.code(), StatusCode::kInvalidArgument);
+  // Can report multiple errors at once, separated by newlines.
+  EXPECT_EQ(result.message(),
+            "Column 'il[leg]al' is invalid.\n"
+            "Column '^bad' is invalid.\n");
+  // The valid "time_mean" pattern still applies; bad patterns are skipped.
+  auto report = reporter->Report();
+  EXPECT_THAT(report->headers(), ElementsAre("calculator", "time_mean"));
+}
+
+TEST(Reporter, NonMatchingColumnsIgnored) {
+  auto reporter = loadReporter({"profile_opencv_0.binarypb"});
+  auto result = reporter->set_columns({"koopa*"});
+  EXPECT_EQ(result.code(), StatusCode::kInvalidArgument);
+  EXPECT_EQ(result.message(), "Column 'koopa*' did not match any columns.\n");
+}
+
+// Tests a much simpler, fabricated log where results can easily be hand
+// calculated.
+TEST(Reporter, ProcessCalculatedCorrectly) {
+  auto reporter = loadReporter({"profile_process_test.binarypb"});
+  auto report = reporter->Report();
+  EXPECT_THAT(report->calculator_data().at("ACalculator").time_percent,
+              testing::DoubleEq(75));
+  EXPECT_THAT(report->calculator_data().at("ACalculator").time_stat.mean(),
+              testing::DoubleEq(450));
+  EXPECT_THAT(report->calculator_data().at("ACalculator").time_stat.stddev(),
+              testing::DoubleNear(70.71, 0.01));
+  EXPECT_THAT(report->calculator_data().at("ACalculator").time_stat.total(),
+              testing::DoubleEq(900));
+  EXPECT_THAT(report->calculator_data().at("BCalculator").time_percent,
+              testing::DoubleEq(25));
+  EXPECT_THAT(report->calculator_data().at("BCalculator").time_stat.mean(),
+              testing::DoubleEq(300));
+  // BCalculator has only one data point, so stddev is zero.
+  EXPECT_THAT(report->calculator_data().at("BCalculator").time_stat.stddev(),
+              testing::DoubleEq(0));
+  EXPECT_THAT(report->calculator_data().at("BCalculator").time_stat.total(),
+              testing::DoubleEq(300));
+}
+
+TEST(Reporter, LatencyCalculatedCorrectly) {
+  auto reporter = loadReporter({"profile_latency_test.binarypb"});
+  auto report = reporter->Report();
+  EXPECT_THAT(
+      report->calculator_data().at("ACalculator").input_latency_stat.mean(),
+      testing::DoubleEq(150));
+  EXPECT_THAT(
+      report->calculator_data().at("ACalculator").input_latency_stat.stddev(),
+      testing::DoubleNear(70.71, 0.01));
+  EXPECT_THAT(
+      report->calculator_data().at("ACalculator").input_latency_stat.total(),
+      testing::DoubleEq(300));
+  EXPECT_THAT(
+      report->calculator_data().at("BCalculator").input_latency_stat.mean(),
+      testing::DoubleEq(750));
+  EXPECT_THAT(
+      report->calculator_data().at("BCalculator").input_latency_stat.stddev(),
+      testing::DoubleNear(212.13, 0.01));
+  EXPECT_THAT(
+      report->calculator_data().at("BCalculator").input_latency_stat.total(),
+      testing::DoubleEq(1500));
+}
+
+}  // namespace mediapipe
diff --git a/mediapipe/framework/subgraph.h b/mediapipe/framework/subgraph.h
index dce1e536c..27bc32d43 100644
--- a/mediapipe/framework/subgraph.h
+++ b/mediapipe/framework/subgraph.h
@@ -46,7 +46,7 @@ class Subgraph {
 
   // Returns options of a specific type.
   template <typename T>
-  static T GetOptions(Subgraph::SubgraphOptions supgraph_options) {
+  static T GetOptions(const Subgraph::SubgraphOptions& supgraph_options) {
     return tool::OptionsMap().Initialize(supgraph_options).Get<T>();
   }
 };
diff --git a/mediapipe/framework/tool/BUILD b/mediapipe/framework/tool/BUILD
index 86d4a3bea..5412e24ee 100644
--- a/mediapipe/framework/tool/BUILD
+++ b/mediapipe/framework/tool/BUILD
@@ -601,6 +601,37 @@ cc_test(
     ],
 )
 
+cc_library(
+    name = "test_util",
+    testonly = 1,
+    srcs = ["test_util.cc"],
+    hdrs = ["test_util.h"],
+    visibility = ["//visibility:public"],
+    deps = [
+        "//mediapipe/framework:calculator_cc_proto",
+        "//mediapipe/framework/deps:file_path",
+        "//mediapipe/framework/formats:image_frame",
+        "//mediapipe/framework/port:advanced_proto",
+        "//mediapipe/framework/port:gtest",
+        "@com_google_absl//absl/container:flat_hash_set",
+        "@com_google_absl//absl/memory",
+        "@com_google_absl//absl/strings",
+        "//mediapipe/framework/deps:no_destructor",
+        "//mediapipe/framework/port:logging",
+    ] + select({
+        "//conditions:default": [
+            "//mediapipe/framework/port:file_helpers",
+        ],
+        "//mediapipe:android": [
+            "//mediapipe/util/android/file/base",
+        ],
+        "//mediapipe:ios": [],
+        "//mediapipe:macos": [
+            "//mediapipe/framework/port:file_helpers",
+        ],
+    }),
+)
+
 exports_files(
     ["build_defs.bzl"],
     visibility = ["//mediapipe/framework:__subpackages__"],
diff --git a/mediapipe/framework/tool/status_util.cc b/mediapipe/framework/tool/status_util.cc
index b5558fbdd..6f712c364 100644
--- a/mediapipe/framework/tool/status_util.cc
+++ b/mediapipe/framework/tool/status_util.cc
@@ -61,9 +61,11 @@ namespace tool {
       }
     }
   }
-  return ::mediapipe::Status(
+  if (error_code == StatusCode::kOk) return OkStatus();
+  Status combined = ::mediapipe::Status(
       error_code,
       absl::StrCat(general_comment, "\n", absl::StrJoin(errors, "\n")));
+  return combined;
 }
 
 }  // namespace tool
diff --git a/mediapipe/framework/tool/status_util.h b/mediapipe/framework/tool/status_util.h
index 18701c212..b9c4235a1 100644
--- a/mediapipe/framework/tool/status_util.h
+++ b/mediapipe/framework/tool/status_util.h
@@ -46,9 +46,9 @@ ABSL_DEPRECATED("Use ::mediapipe::UnknownError(error_message) instead.")
 ::mediapipe::Status AddStatusPrefix(const std::string& prefix,
                                     const ::mediapipe::Status& status);
 
-// Combine a vector of ::mediapipe::Status into a single status.  If statuses
-// is empty or all statuses are OK then ::mediapipe::OkStatus() will be
-// returned.
+// Combine a vector of ::mediapipe::Status into a single composite status.
+// If statuses is empty or all statuses are OK then ::mediapipe::OkStatus()
+// will be returned.
 // This function should be considered internal to the framework.
 // TODO Move this function to somewhere with less visibility.
 ::mediapipe::Status CombinedStatus(
diff --git a/mediapipe/framework/tool/status_util_test.cc b/mediapipe/framework/tool/status_util_test.cc
index 8ab9d1a35..27373d87a 100644
--- a/mediapipe/framework/tool/status_util_test.cc
+++ b/mediapipe/framework/tool/status_util_test.cc
@@ -27,6 +27,10 @@
 namespace mediapipe {
 namespace {
 
+using testing::ContainerEq;
+using testing::HasSubstr;
+using testing::IsEmpty;
+
 TEST(StatusTest, StatusStopIsNotOk) { EXPECT_FALSE(tool::StatusStop().ok()); }
 
 TEST(StatusTest, Prefix) {
@@ -36,13 +40,13 @@ TEST(StatusTest, Prefix) {
       ::mediapipe::StatusCode::kInvalidArgument, base_error_message);
   ::mediapipe::Status status =
       tool::AddStatusPrefix(prefix_error_message, base_status);
-  EXPECT_THAT(status.ToString(), testing::HasSubstr(base_error_message));
-  EXPECT_THAT(status.ToString(), testing::HasSubstr(prefix_error_message));
+  EXPECT_THAT(status.ToString(), HasSubstr(base_error_message));
+  EXPECT_THAT(status.ToString(), HasSubstr(prefix_error_message));
   EXPECT_EQ(::mediapipe::StatusCode::kInvalidArgument, status.code());
 }
 
 TEST(StatusTest, CombinedStatus) {
-  std::vector< ::mediapipe::Status> errors;
+  std::vector<::mediapipe::Status> errors;
   const std::string prefix_error_message("error_with_prefix: ");
   ::mediapipe::Status status;
 
@@ -51,12 +55,12 @@ TEST(StatusTest, CombinedStatus) {
                       "error_with_this_string");
   errors.emplace_back(::mediapipe::StatusCode::kInvalidArgument,
                       "error_with_that_string");
+  errors.back().SetPayload("test payload type",
+                           absl::Cord(absl::string_view("hello")));
   status = tool::CombinedStatus(prefix_error_message, errors);
-  EXPECT_THAT(status.ToString(),
-              testing::HasSubstr(std::string(errors[0].message())));
-  EXPECT_THAT(status.ToString(),
-              testing::HasSubstr(std::string(errors[1].message())));
-  EXPECT_THAT(status.ToString(), testing::HasSubstr(prefix_error_message));
+  EXPECT_THAT(status.ToString(), HasSubstr(std::string(errors[0].message())));
+  EXPECT_THAT(status.ToString(), HasSubstr(std::string(errors[1].message())));
+  EXPECT_THAT(status.ToString(), HasSubstr(prefix_error_message));
   EXPECT_EQ(::mediapipe::StatusCode::kInvalidArgument, status.code());
 
   errors.clear();
@@ -65,20 +69,17 @@ TEST(StatusTest, CombinedStatus) {
   errors.emplace_back(::mediapipe::StatusCode::kInvalidArgument,
                       "error_with_that_string");
   status = tool::CombinedStatus(prefix_error_message, errors);
-  EXPECT_THAT(status.ToString(),
-              testing::HasSubstr(std::string(errors[0].message())));
-  EXPECT_THAT(status.ToString(),
-              testing::HasSubstr(std::string(errors[1].message())));
-  EXPECT_THAT(status.ToString(), testing::HasSubstr(prefix_error_message));
+  EXPECT_THAT(status.ToString(), HasSubstr(std::string(errors[0].message())));
+  EXPECT_THAT(status.ToString(), HasSubstr(std::string(errors[1].message())));
+  EXPECT_THAT(status.ToString(), HasSubstr(prefix_error_message));
   EXPECT_EQ(::mediapipe::StatusCode::kUnknown, status.code());
   errors.clear();
   errors.emplace_back(::mediapipe::StatusCode::kOk, "error_with_this_string");
   errors.emplace_back(::mediapipe::StatusCode::kInvalidArgument,
                       "error_with_that_string");
   status = tool::CombinedStatus(prefix_error_message, errors);
-  EXPECT_THAT(status.ToString(),
-              testing::HasSubstr(std::string(errors[1].message())));
-  EXPECT_THAT(status.ToString(), testing::HasSubstr(prefix_error_message));
+  EXPECT_THAT(status.ToString(), HasSubstr(std::string(errors[1].message())));
+  EXPECT_THAT(status.ToString(), HasSubstr(prefix_error_message));
   EXPECT_EQ(::mediapipe::StatusCode::kInvalidArgument, status.code());
 
   errors.clear();
diff --git a/mediapipe/framework/tool/test_util.cc b/mediapipe/framework/tool/test_util.cc
new file mode 100644
index 000000000..e78c2cf85
--- /dev/null
+++ b/mediapipe/framework/tool/test_util.cc
@@ -0,0 +1,333 @@
+// Copyright 2019 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "mediapipe/framework/tool/test_util.h"
+
+#include <fcntl.h>
+#include <unistd.h>
+
+#include <memory>
+
+#include "absl/container/flat_hash_set.h"
+#include "absl/memory/memory.h"
+#include "absl/strings/match.h"
+#include "absl/strings/substitute.h"
+#include "mediapipe/framework/calculator.pb.h"
+#include "mediapipe/framework/deps/file_path.h"
+#include "mediapipe/framework/deps/no_destructor.h"
+#include "mediapipe/framework/port/advanced_proto_inc.h"
+#include "mediapipe/framework/port/logging.h"
+#include "mediapipe/framework/port/proto_ns.h"
+
+#ifdef __APPLE__
+#include <CoreFoundation/CoreFoundation.h>
+#elif defined(__ANDROID__)
+#include "mediapipe/util/android/file/base/helpers.h"
+#else
+#include "mediapipe/framework/port/file_helpers.h"
+#endif
+
+namespace mediapipe {
+
+namespace {
+
+// Checks if two values are equal within the specified tolerance.
+template <typename T>
+bool EqualWithTolerance(const T value1, const T value2, const T max_diff) {
+  const T diff = (value1 >= value2) ? (value1 - value2) : (value2 - value1);
+  return diff <= max_diff;
+}
+
+template <typename T>
+bool CompareDiff(const ImageFrame& image1, const ImageFrame& image2,
+                 const T max_color_diff, const T max_alpha_diff,
+                 const float max_avg_diff, std::string* error_message) {
+  // Verify image byte depth matches expected byte depth.
+  CHECK_EQ(sizeof(T), image1.ByteDepth());
+  CHECK_EQ(sizeof(T), image2.ByteDepth());
+
+  const bool return_error = error_message != nullptr;
+
+  const int width = image1.Width();
+  const int height = image1.Height();
+  const int channels1 = image1.NumberOfChannels();
+  const int channels2 = image2.NumberOfChannels();
+  const T* pixel1 = reinterpret_cast<const T*>(image1.PixelData());
+  const T* pixel2 = reinterpret_cast<const T*>(image2.PixelData());
+  const int num_channels = std::min(channels1, channels2);
+
+  // Verify the width steps are multiples of byte depth.
+  CHECK_EQ(image1.WidthStep() % image1.ByteDepth(), 0);
+  CHECK_EQ(image2.WidthStep() % image2.ByteDepth(), 0);
+  const int width_padding1 =
+      image1.WidthStep() / image1.ByteDepth() - width * channels1;
+  const int width_padding2 =
+      image2.WidthStep() / image2.ByteDepth() - width * channels2;
+
+  float avg_diff = 0;
+  uint diff_count = 0;
+  for (int row = 0; row < height; ++row) {
+    for (int col = 0; col < width; ++col) {
+      for (int channel = 0; channel < num_channels; ++channel) {
+        // Check local difference.
+        const T max_diff = channel < 3 ? max_color_diff : max_alpha_diff;
+        const T value1 = pixel1[channel];
+        const T value2 = pixel2[channel];
+        if (!EqualWithTolerance<T>(value1, value2, max_diff)) {
+          // We cast uint8 to int using this type (and leave other values as-is)
+          // to avoid printing as a single char.
+          using TypeToPrint =
+              typename std::conditional<std::is_same<T, uint8>::value, int,
+                                        T>::type;
+          std::string error = absl::Substitute(
+              "images differ: row = $0 col = $1 channel = $2 : pixel1 = $3, "
+              "pixel2 = $4",
+              row, col, channel, static_cast<TypeToPrint>(value1),
+              static_cast<TypeToPrint>(value2));
+          if (return_error) {
+            *error_message = error;
+          } else {
+            LOG(ERROR) << error;
+          }
+          return false;
+        }
+        // Check global average difference.
+        const float diff =
+            std::abs(static_cast<float>(value1) - static_cast<float>(value2));
+        avg_diff += (diff - avg_diff) / ++diff_count;
+      }
+      pixel1 += channels1;
+      pixel2 += channels2;
+    }
+    pixel1 += width_padding1;
+    pixel2 += width_padding2;
+  }
+
+  if (avg_diff > max_avg_diff) {
+    std::string error =
+        absl::Substitute("images differ: avg pixel error = $0", avg_diff);
+    if (return_error) {
+      *error_message = error;
+    } else {
+      LOG(ERROR) << error;
+    }
+    return false;
+  }
+
+  return true;
+}
+
+#if defined(__linux__)
+// Returns the directory of the running test binary.
+std::string GetBinaryDirectory() {
+  char full_path[PATH_MAX + 1];
+  int length = readlink("/proc/self/exe", full_path, PATH_MAX + 1);
+  CHECK_GT(length, 0);
+  return std::string(
+      ::mediapipe::file::Dirname(absl::string_view(full_path, length)));
+}
+#endif
+
+}  // namespace
+
+bool CompareImageFrames(const ImageFrame& image1, const ImageFrame& image2,
+                        const float max_color_diff, const float max_alpha_diff,
+                        const float max_avg_diff, std::string* error_message) {
+  const bool return_error = error_message != nullptr;
+
+  auto IsSupportedImageFormatComparison = [](const ImageFrame& image1,
+                                             const ImageFrame& image2) {
+    // Pairs of non-equal image formats that can be compared against each other.
+    static const mediapipe::NoDestructor<absl::flat_hash_set<
+        std::pair<ImageFormat::Format, ImageFormat::Format>>>
+        kCompatibleImageFormats({
+            {ImageFormat::SRGB, ImageFormat::SRGBA},
+            {ImageFormat::SRGB48, ImageFormat::SRGBA64},
+        });
+
+    auto* compatible_image_formats = kCompatibleImageFormats.get();
+
+    return image1.Format() == image2.Format() ||
+           compatible_image_formats->contains(
+               {image1.Format(), image2.Format()}) ||
+           compatible_image_formats->contains(
+               {image2.Format(), image1.Format()});
+  };
+
+  if (!IsSupportedImageFormatComparison(image1, image2)) {
+    std::string error = absl::Substitute(
+        "unsupported image format comparison; image1 = $0, image2 = $1",
+        image1.Format(), image2.Format());
+    if (return_error) {
+      *error_message = error;
+    } else {
+      LOG(ERROR) << error;
+    }
+    return false;
+  }
+
+  if (image1.Width() != image2.Width()) {
+    std::string error =
+        absl::Substitute("image width mismatch: image1 = $0, image2 = $1",
+                         image1.Width(), image2.Width());
+    if (return_error) {
+      *error_message = error;
+    } else {
+      LOG(ERROR) << error;
+    }
+    return false;
+  }
+
+  if (image1.Height() != image2.Height()) {
+    std::string error =
+        absl::Substitute("image height mismatch: image1 = $0, image2 = $1",
+                         image1.Height(), image2.Height());
+    if (return_error) {
+      *error_message = error;
+    } else {
+      LOG(ERROR) << error;
+    }
+    return false;
+  }
+
+  if (image1.ByteDepth() != image2.ByteDepth()) {
+    std::string error =
+        absl::Substitute("image byte depth mismatch: image1 = $0, image2 = $1",
+                         image1.ByteDepth(), image2.ByteDepth());
+    if (return_error) {
+      *error_message = error;
+    } else {
+      LOG(ERROR) << error;
+    }
+    return false;
+  }
+
+  switch (image1.Format()) {
+    case ImageFormat::GRAY8:
+    case ImageFormat::SRGB:
+    case ImageFormat::SRGBA:
+    case ImageFormat::LAB8:
+      return CompareDiff<uint8>(image1, image2, max_color_diff, max_alpha_diff,
+                                max_avg_diff, error_message);
+    case ImageFormat::GRAY16:
+    case ImageFormat::SRGB48:
+    case ImageFormat::SRGBA64:
+      return CompareDiff<uint16>(image1, image2, max_color_diff, max_alpha_diff,
+                                 max_avg_diff, error_message);
+    case ImageFormat::VEC32F1:
+    case ImageFormat::VEC32F2:
+      return CompareDiff<float>(image1, image2, max_color_diff, max_alpha_diff,
+                                max_avg_diff, error_message);
+    default:
+      LOG(FATAL) << ImageFrame::InvalidFormatString(image1.Format());
+  }
+}
+
+std::string GetTestRootDir() {
+#ifdef __APPLE__
+  char path[1024];
+  CFURLRef bundle_url = CFBundleCopyBundleURL(CFBundleGetMainBundle());
+  Boolean success = CFURLGetFileSystemRepresentation(
+      bundle_url, true, reinterpret_cast<UInt8*>(path), sizeof(path));
+  CHECK(success);
+  CFRelease(bundle_url);
+  return path;
+#elif defined(__ANDROID__)
+  char path[1024];
+  char* ptr = getcwd(path, sizeof(path));
+  CHECK_EQ(ptr, path);
+  return path;
+#else
+  return ::mediapipe::file::JoinPath(std::getenv("TEST_SRCDIR"), "mediapipe");
+#endif  // defined(__APPLE__)
+}
+
+std::string GetTestDataDir(const std::string& package_base_path) {
+#ifdef __APPLE__
+  return ::mediapipe::file::JoinPath(GetTestRootDir(), "testdata/");
+#elif defined(__ANDROID__)
+  std::string data_dir = GetTestRootDir();
+  std::string binary_dir = GetBinaryDirectory();
+  // In Mobile Harness, the cwd is "/" and the run dir is "/data/local/tmp".
+  if (data_dir == "/" && absl::StartsWith(binary_dir, "/data")) {
+    data_dir = binary_dir;
+  }
+  return ::mediapipe::file::JoinPath(data_dir, package_base_path, "testdata/");
+#else
+  return ::mediapipe::file::JoinPath(GetTestRootDir(), package_base_path,
+                                     "testdata/");
+#endif  // defined(__APPLE__)
+}
+
+std::unique_ptr<ImageFrame> LoadTestPng(const std::string& path,
+                                        ImageFormat::Format format) {
+  return nullptr;
+}
+
+bool LoadTestGraph(CalculatorGraphConfig* proto, const std::string& path) {
+  int fd = open(path.c_str(), O_RDONLY);
+  if (fd == -1) {
+    LOG(ERROR) << "could not open test graph: " << path
+               << ", error: " << strerror(errno);
+    return false;
+  }
+  proto_ns::io::FileInputStream input(fd);
+  bool success = proto->ParseFromZeroCopyStream(&input);
+  close(fd);
+  if (!success) {
+    LOG(ERROR) << "could not parse test graph: " << path;
+  }
+  return success;
+}
+
+std::unique_ptr<ImageFrame> GenerateLuminanceImage(
+    const ImageFrame& original_image) {
+  const int width = original_image.Width();
+  const int height = original_image.Height();
+  const int channels = original_image.NumberOfChannels();
+  if (channels != 3 && channels != 4) {
+    LOG(ERROR) << "Invalid number of image channels: " << channels;
+    return nullptr;
+  }
+  auto luminance_image =
+      absl::make_unique<ImageFrame>(original_image.Format(), width, height,
+                                    ImageFrame::kGlDefaultAlignmentBoundary);
+  const uint8* pixel1 = original_image.PixelData();
+  uint8* pixel2 = luminance_image->MutablePixelData();
+  const int width_padding1 = original_image.WidthStep() - width * channels;
+  const int width_padding2 = luminance_image->WidthStep() - width * channels;
+  for (int row = 0; row < height; ++row) {
+    for (int col = 0; col < width; ++col) {
+      float luminance =
+          pixel1[0] * 0.2125f + pixel1[1] * 0.7154f + pixel1[2] * 0.0721f;
+      uint8 luminance_byte = 255;
+      if (luminance < 255.0f) {
+        luminance_byte = static_cast<uint8>(luminance);
+      }
+      pixel2[0] = luminance_byte;
+      pixel2[1] = luminance_byte;
+      pixel2[2] = luminance_byte;
+      if (channels == 4) {
+        pixel2[3] = pixel1[3];
+      }
+      pixel1 += channels;
+      pixel2 += channels;
+    }
+    pixel1 += width_padding1;
+    pixel2 += width_padding2;
+  }
+  return luminance_image;
+}
+
+}  // namespace mediapipe
diff --git a/mediapipe/framework/tool/test_util.h b/mediapipe/framework/tool/test_util.h
new file mode 100644
index 000000000..56875ee2a
--- /dev/null
+++ b/mediapipe/framework/tool/test_util.h
@@ -0,0 +1,67 @@
+// Copyright 2019 The MediaPipe Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef MEDIAPIPE_FRAMEWORK_TEST_UTIL_H_
+#define MEDIAPIPE_FRAMEWORK_TEST_UTIL_H_
+
+#include "mediapipe/framework/calculator.pb.h"
+#include "mediapipe/framework/formats/image_frame.h"
+
+namespace mediapipe {
+using mediapipe::CalculatorGraphConfig;
+
+// Checks if two image frames are equal within the specified tolerance.
+// image1 and image2 may be of different-but-compatible image formats (e.g.,
+// SRGB and SRGBA); in that case, only the channels available in both are
+// compared.
+// max_color_diff applies to the first 3 channels; i.e., R, G, B for sRGB and
+// sRGBA, and the single gray channel for GRAY8 and GRAY16. It is the maximum
+// pixel color value difference allowed; i.e., a value from 0 to 2^8-1 for 8-bit
+// data and a value from 0 to 2^16-1 for 16-bit data.
+// max_alpha_diff applies to the 4th (alpha) channel only, if present.
+// max_avg_diff applies to all channels, normalized across all pixels.
+//
+// Note: Although max_color_diff and max_alpha_diff are floats, all uint8/uint16
+// values are exactly representable. (2^24 + 1 is the first non-representable
+// positive integral value.)
+bool CompareImageFrames(const ImageFrame& image1, const ImageFrame& image2,
+                        const float max_color_diff, const float max_alpha_diff,
+                        const float max_avg_diff = 1.0,
+                        std::string* error_message = nullptr);
+
+// Returns the absolute path to the directory that contains test source code.
+std::string GetTestRootDir();
+
+// Returns the absolute path to the contents of the package's "testdata"
+// directory.
+// This handles the different paths where test data ends up when using
+// ion_cc_test on various platforms.
+std::string GetTestDataDir(const std::string& package_base_path);
+
+// Loads a binary graph from path. Returns true iff successful.
+bool LoadTestGraph(CalculatorGraphConfig* proto, const std::string& path);
+
+// Loads a PNG image from path using the given ImageFormat. Returns nullptr in
+// case of failure.
+std::unique_ptr<ImageFrame> LoadTestPng(
+    const std::string& path, ImageFormat::Format format = ImageFormat::SRGBA);
+
+// Returns the luminance image of |original_image|.
+// The format of |original_image| must be sRGB or sRGBA.
+std::unique_ptr<ImageFrame> GenerateLuminanceImage(
+    const ImageFrame& original_image);
+
+}  // namespace mediapipe
+
+#endif  // MEDIAPIPE_FRAMEWORK_TEST_UTIL_H_
diff --git a/mediapipe/framework/transitive_protos.bzl b/mediapipe/framework/transitive_protos.bzl
index 76c04c776..e2566b123 100644
--- a/mediapipe/framework/transitive_protos.bzl
+++ b/mediapipe/framework/transitive_protos.bzl
@@ -5,20 +5,21 @@ ProtoLibsInfo = provider(fields = ["targets", "out"])
 def _get_proto_rules(deps, proto_rules = None):
     useful_deps = [dep for dep in deps if hasattr(dep, "proto_rules")]
     if proto_rules == None:
-        proto_rules = []
-    for dep in useful_deps:
-        proto_rules = proto_rules + dep.proto_rules
+        proto_rules = depset()
+    proto_rules = depset(
+        transitive = [proto_rules] + [dep.proto_rules for dep in useful_deps],
+    )
     return proto_rules
 
 def _proto_rules_aspect_impl(target, ctx):
     # Make sure the rule has a srcs attribute.
-    proto_rules = []
+    proto_rules = depset()
     found_cc_proto = False
     if hasattr(ctx.rule.attr, "srcs") and len(ctx.rule.attr.srcs) == 1:
         for f in ctx.rule.attr.srcs[0].files.to_list():
             if f.basename.endswith(".pb.cc"):
-                proto_rules = [target[CcInfo]]
-                found = True
+                proto_rules = depset([target[CcInfo]])
+                found_cc_proto = True
                 break
 
     if not found_cc_proto:
@@ -43,10 +44,10 @@ def _transitive_protos_impl(ctx):
       A proto provider (with transitive_sources and transitive_descriptor_sets filled in),
       and marks all transitive sources as default output.
     """
-    cc_infos = []
+    cc_info_sets = []
     for dep in ctx.attr.deps:
-        for dep_proto_rule in dep.proto_rules:
-            cc_infos.append(dep_proto_rule)
+        cc_info_sets.append(dep.proto_rules)
+    cc_infos = depset(transitive = cc_info_sets).to_list()
     return [cc_common.merge_cc_infos(cc_infos = cc_infos)]
 
 transitive_protos = rule(
diff --git a/mediapipe/java/com/google/mediapipe/components/FrameProcessor.java b/mediapipe/java/com/google/mediapipe/components/FrameProcessor.java
index b2fc82b3f..d9245e768 100644
--- a/mediapipe/java/com/google/mediapipe/components/FrameProcessor.java
+++ b/mediapipe/java/com/google/mediapipe/components/FrameProcessor.java
@@ -71,7 +71,7 @@ public class FrameProcessor implements TextureFrameProcessor, AudioDataProcessor
   private double audioSampleRate;
 
   /**
-   * Constructor.
+   * Constructor for video input/output.
    *
    * @param context an Android {@link Context}.
    * @param parentNativeContext a native handle to a GL context. The GL context(s) used by the
@@ -86,50 +86,41 @@ public class FrameProcessor implements TextureFrameProcessor, AudioDataProcessor
       long parentNativeContext,
       String graphName,
       String inputStream,
-      String outputStream) {
-    mediapipeGraph = new Graph();
-    videoInputStream = inputStream;
-    videoOutputStream = outputStream;
-
+      @Nullable String outputStream) {
     try {
-      if (new File(graphName).isAbsolute()) {
-        mediapipeGraph.loadBinaryGraph(graphName);
-      } else {
-        mediapipeGraph.loadBinaryGraph(
-            AndroidAssetUtil.getAssetBytes(context.getAssets(), graphName));
-      }
-
-      packetCreator = new AndroidPacketCreator(mediapipeGraph);
-      mediapipeGraph.addPacketCallback(
-          videoOutputStream,
-          new PacketCallback() {
-            @Override
-            public void process(Packet packet) {
-              List<TextureFrameConsumer> currentConsumers;
-              synchronized (this) {
-                currentConsumers = videoConsumers;
-              }
-              for (TextureFrameConsumer consumer : currentConsumers) {
-                TextureFrame frame = PacketGetter.getTextureFrame(packet);
-                if (Log.isLoggable(TAG, Log.VERBOSE)) {
-                  Log.v(
-                      TAG,
-                      String.format(
-                          "Output tex: %d width: %d height: %d to consumer %h",
-                          frame.getTextureName(), frame.getWidth(), frame.getHeight(), consumer));
-                }
-                consumer.onNewFrame(frame);
-              }
-            }
-          });
-
-      mediapipeGraph.setParentGlContext(parentNativeContext);
+      initializeGraphAndPacketCreator(context, graphName);
+      addVideoStreams(parentNativeContext, inputStream, outputStream);
     } catch (MediaPipeException e) {
       // TODO: do not suppress exceptions here!
-      Log.e(TAG, "Mediapipe error: ", e);
+      Log.e(TAG, "MediaPipe error: ", e);
     }
+  }
 
-    videoSurfaceOutput = mediapipeGraph.addSurfaceOutput(videoOutputStream);
+  /**
+   * Constructor that only loads the graph; no input/output streams are registered.
+   *
+   * @param context an Android {@link Context}.
+   * @param graphName the name of the file containing the binary representation of the graph.
+   */
+  public FrameProcessor(Context context, String graphName) {
+    initializeGraphAndPacketCreator(context, graphName);
+  }
+
+  /**
+   * Initializes a graph for processing data in real time.
+   *
+   * @param context an Android {@link Context}.
+   * @param graphName the name of the file containing the binary representation of the graph.
+   */
+  private void initializeGraphAndPacketCreator(Context context, String graphName) {
+    mediapipeGraph = new Graph();
+    if (new File(graphName).isAbsolute()) {
+      mediapipeGraph.loadBinaryGraph(graphName);
+    } else {
+      mediapipeGraph.loadBinaryGraph(
+          AndroidAssetUtil.getAssetBytes(context.getAssets(), graphName));
+    }
+    packetCreator = new AndroidPacketCreator(mediapipeGraph);
   }
 
   /** Callback for errors occurring during processing in the graph. */
@@ -167,6 +158,51 @@ public class FrameProcessor implements TextureFrameProcessor, AudioDataProcessor
             });
   }
 
+  /**
+   * Adds input streams to process video data and output streams that output processed video data.
+   *
+   * @param parentNativeContext a native handle to a GL context. The GL context(s) used by the
+   *     calculators in the graph will join the parent context's sharegroup, so that textures
+   *     generated by the calculators are available in the parent context, and vice versa.
+   * @param inputStream the graph input stream that will receive input video frames.
+   * @param outputStream the output stream producing output frames, or null for no video output.
+   */
+  public void addVideoStreams(
+      long parentNativeContext, @Nullable String inputStream, @Nullable String outputStream) {
+
+    videoInputStream = inputStream;
+    videoOutputStream = outputStream;
+
+    mediapipeGraph.setParentGlContext(parentNativeContext);
+
+    if (videoOutputStream != null) {
+      mediapipeGraph.addPacketCallback(
+          videoOutputStream,
+          new PacketCallback() {
+            @Override
+            public void process(Packet packet) {
+              List<TextureFrameConsumer> currentConsumers;
+              synchronized (this) {
+                currentConsumers = videoConsumers;
+              }
+              for (TextureFrameConsumer consumer : currentConsumers) {
+                TextureFrame frame = PacketGetter.getTextureFrame(packet);
+                if (Log.isLoggable(TAG, Log.VERBOSE)) {
+                  Log.v(
+                      TAG,
+                      String.format(
+                          "Output tex: %d width: %d height: %d to consumer %h",
+                          frame.getTextureName(), frame.getWidth(), frame.getHeight(), consumer));
+                }
+                consumer.onNewFrame(frame);
+              }
+            }
+          });
+
+      videoSurfaceOutput = mediapipeGraph.addSurfaceOutput(videoOutputStream);
+    }
+  }
+
   /**
    * Adds input streams to process audio data and output streams that output processed audio data.
    *
@@ -183,11 +219,12 @@ public class FrameProcessor implements TextureFrameProcessor, AudioDataProcessor
     audioInputStream = inputStream;
     audioOutputStream = outputStream;
     numAudioChannels = numChannels;
+    int audioChannelMask =
+        numAudioChannels == 2 ? AudioFormat.CHANNEL_IN_STEREO : AudioFormat.CHANNEL_IN_MONO;
     audioSampleRate = audioSampleRateInHz;
 
     if (audioInputStream != null) {
-      Packet audioHeader =
-          packetCreator.createTimeSeriesHeader(numAudioChannels, audioSampleRateInHz);
+      Packet audioHeader = packetCreator.createTimeSeriesHeader(numAudioChannels, audioSampleRate);
       mediapipeGraph.setStreamHeader(audioInputStream, audioHeader);
     }
 
@@ -195,8 +232,8 @@ public class FrameProcessor implements TextureFrameProcessor, AudioDataProcessor
       AudioFormat audioFormat =
           new AudioFormat.Builder()
               .setEncoding(AUDIO_ENCODING)
-              .setSampleRate((int) audioSampleRateInHz)
-              .setChannelMask(numAudioChannels)
+              .setSampleRate((int) audioSampleRate)
+              .setChannelMask(audioChannelMask)
               .build();
       mediapipeGraph.addPacketCallback(
           audioOutputStream,
diff --git a/mediapipe/models/README.md b/mediapipe/models/README.md
index 4bdd4d09b..0d15c968c 100644
--- a/mediapipe/models/README.md
+++ b/mediapipe/models/README.md
@@ -43,6 +43,7 @@ Here are the descriptions of the models used in the [example applications](../do
 ### KNIFT (Keypoint Neural Invariant Feature Transform)
   * Up to 200 keypoints: [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_float.tflite)
   * Up to 400 keypoints: [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_float_400.tflite)
+  * Up to 1000 keypoints: [TFLite model](https://github.com/google/mediapipe/tree/master/mediapipe/models/knift_float_1k.tflite)
   * [Google Developers Blog post](https://mediapipe.page.link/knift)
   * [Model card](https://mediapipe.page.link/knift-mc)
 
diff --git a/mediapipe/models/knift_float_1k.tflite b/mediapipe/models/knift_float_1k.tflite
new file mode 100644
index 000000000..b0f105359
Binary files /dev/null and b/mediapipe/models/knift_float_1k.tflite differ
diff --git a/mediapipe/models/object_detection_saved_model/README.md b/mediapipe/models/object_detection_saved_model/README.md
index afd49f132..52f8d3af4 100644
--- a/mediapipe/models/object_detection_saved_model/README.md
+++ b/mediapipe/models/object_detection_saved_model/README.md
@@ -1,25 +1,13 @@
 ## TensorFlow/TFLite Object Detection Model
 
-This is the description of the object detection model we used in the following examples:
-
-   * `Object Detection on Desktop`
-   * `Object Detection on GPU on Android`
-   * `Object Detection on CPU on Android`
-
 ### TensorFlow model
 
-This model is used in `Object Detection on Desktop TensorFlow Demo`. The model is trained on [MSCOCO 2014](http://cocodataset.org) dataset using [TensorFlow Object Detection API](https://github.com/tensorflow/models/tree/master/research/object_detection). It is a MobileNetV2-based SSD model with 0.5 depth multiplier. Detailed training configuration is in the provided `pipeline.config`. The model is a relatively compact model which has `0.171 mAP` to achieve real-time performance on mobile devices. You can compare it with other models from the [TensorFlow detection model zoo](https://github.com/tensorflow/models/blob/master/research/object_detection/g3doc/detection_model_zoo.md).
+The model is trained on the [MSCOCO 2014](http://cocodataset.org) dataset using the [TensorFlow Object Detection API](https://github.com/tensorflow/models/tree/master/research/object_detection). It is a MobileNetV2-based SSD model with a 0.5 depth multiplier. The detailed training configuration is in the provided `pipeline.config`. The model is relatively compact, with `0.171 mAP`, in order to achieve real-time performance on mobile devices. You can compare it with other models from the [TensorFlow detection model zoo](https://github.com/tensorflow/models/blob/master/research/object_detection/g3doc/detection_model_zoo.md).
 
 
 ### TFLite model
 
-The TFLite model is converted from the TensorFlow above. It is used in:
-
-   * `Object Detection on Desktop TFLite Demo`
-   * `Object Detection on GPU on Android`
-   * `Object Detection on CPU on Android`
-
-The steps needed to convert the model are similar to [this tutorial](https://medium.com/tensorflow/training-and-serving-a-realtime-mobile-object-detector-in-30-minutes-with-cloud-tpus-b78971cf1193) with minor modifications. Assuming now we have a trained TensorFlow model which includes the checkpoint files and the training configuration file, for example the files provided in this repo:
+The TFLite model is converted from the TensorFlow model above. The steps needed to convert the model are similar to [this tutorial](https://medium.com/tensorflow/training-and-serving-a-realtime-mobile-object-detector-in-30-minutes-with-cloud-tpus-b78971cf1193) with minor modifications. Assuming now we have a trained TensorFlow model which includes the checkpoint files and the training configuration file, for example the files provided in this repo:
 
    * `model.ckpt.index`
    * `model.ckpt.meta`
diff --git a/mediapipe/objc/MPPCameraInputSource.h b/mediapipe/objc/MPPCameraInputSource.h
index 7f547b2d4..9bb7439b5 100644
--- a/mediapipe/objc/MPPCameraInputSource.h
+++ b/mediapipe/objc/MPPCameraInputSource.h
@@ -34,6 +34,9 @@
 /// Whether to rotate video buffers with device rotation.
 @property(nonatomic) BOOL autoRotateBuffers;
 
+/// Whether to mirror the video or not.
+@property(nonatomic) BOOL videoMirrored;
+
 /// The camera intrinsic matrix.
 @property(nonatomic, readonly) matrix_float3x3 cameraIntrinsicMatrix;
 
diff --git a/mediapipe/objc/MPPCameraInputSource.m b/mediapipe/objc/MPPCameraInputSource.m
index 65468408c..b9718680c 100644
--- a/mediapipe/objc/MPPCameraInputSource.m
+++ b/mediapipe/objc/MPPCameraInputSource.m
@@ -34,6 +34,7 @@
   BOOL _setupDone;
   BOOL _useDepth;
   BOOL _useCustomOrientation;
+  BOOL _videoMirrored;
 }
 
 - (instancetype)init {
@@ -123,6 +124,22 @@
   }
 }
 
+- (void)setVideoMirrored:(BOOL)videoMirrored {
+  if (videoMirrored == _videoMirrored) {
+    return;
+  }
+
+  BOOL wasRunning = [self isRunning];
+  if (wasRunning) {
+    [self stop];
+  }
+  _videoMirrored = videoMirrored;
+  _setupDone = NO;
+  if (wasRunning) {
+    [self start];
+  }
+}
+
 - (void)setAutoRotateBuffers:(BOOL)autoRotateBuffers {
   if (autoRotateBuffers == _autoRotateBuffers) {
     return;  // State has not changed.
@@ -252,6 +269,11 @@
     }
   }
 
+  if (_videoMirrored) {
+    AVCaptureConnection* connection = [_videoDataOutput connectionWithMediaType:AVMediaTypeVideo];
+    connection.videoMirrored = _videoMirrored;
+  }
+
   _setupDone = YES;
 }
 
diff --git a/mediapipe/util/tflite/BUILD b/mediapipe/util/tflite/BUILD
index 04f21ff74..f5ab6c1f1 100644
--- a/mediapipe/util/tflite/BUILD
+++ b/mediapipe/util/tflite/BUILD
@@ -101,5 +101,15 @@ cc_library(
             "@org_tensorflow//tensorflow/lite/delegates/gpu/common:model",
             "@org_tensorflow//tensorflow/lite/delegates/gpu/gl:api2",
         ],
+        "//mediapipe:android": [
+            "@com_google_absl//absl/strings",
+            "//mediapipe/framework/port:ret_check",
+            "//mediapipe/framework/port:status",
+            "//mediapipe/framework/port:statusor",
+            "@org_tensorflow//tensorflow/lite:framework",
+            "@org_tensorflow//tensorflow/lite/delegates/gpu:api",
+            "@org_tensorflow//tensorflow/lite/delegates/gpu/common:model",
+            "@org_tensorflow//tensorflow/lite/delegates/gpu/gl:api2",
+        ],
     }) + ["@org_tensorflow//tensorflow/lite/core/api"],
 )
diff --git a/mediapipe/util/tflite/tflite_gpu_runner.cc b/mediapipe/util/tflite/tflite_gpu_runner.cc
index a44ac5c5b..510b291e2 100644
--- a/mediapipe/util/tflite/tflite_gpu_runner.cc
+++ b/mediapipe/util/tflite/tflite_gpu_runner.cc
@@ -51,10 +51,10 @@ ObjectDef GetSSBOObjectDef(int channels) {
 mediapipe::Status TFLiteGPURunner::InitializeWithModel(
     const tflite::FlatBufferModel& flatbuffer,
     const tflite::OpResolver& op_resolver) {
-  for (const auto& input : graph_->inputs()) {
+  for (const auto& input : graph_gl_->inputs()) {
     input_shapes_.push_back(input->tensor.shape);
   }
-  for (const auto& output : graph_->outputs()) {
+  for (const auto& output : graph_gl_->outputs()) {
     output_shapes_.push_back(output->tensor.shape);
   }
   return absl::OkStatus();
@@ -79,7 +79,18 @@ mediapipe::StatusOr<int64_t> TFLiteGPURunner::GetOutputElements(int id) {
 mediapipe::Status TFLiteGPURunner::Build() {
   // 1. Prepare inference builder.
   std::unique_ptr<InferenceBuilder> builder;
-  MP_RETURN_IF_ERROR(InitializeOpenGL(&builder));
+  // By default, we try CL first & fall back to GL if that fails.
+  absl::Status status = InitializeOpenCL(&builder);
+  if (status.ok()) {
+    LOG(INFO) << "OpenCL backend is used.";
+  } else {
+    LOG(ERROR) << "Falling back to OpenGL: " << status.message();
+    MP_RETURN_IF_ERROR(InitializeOpenGL(&builder));
+  }
+
+  // Neither graph is needed anymore. Make sure both are deleted.
+  graph_gl_.reset(nullptr);
+  graph_cl_.reset(nullptr);
 
   // 2. Describe output/input objects for created builder.
   for (int flow_index = 0; flow_index < input_shapes_.size(); ++flow_index) {
@@ -122,9 +133,13 @@ mediapipe::Status TFLiteGPURunner::InitializeOpenGL(
   gl_options.usage = options_.usage;
   MP_RETURN_IF_ERROR(
       NewInferenceEnvironment(env_options, &gl_environment_, &properties));
-  MP_RETURN_IF_ERROR(gl_environment_->NewInferenceBuilder(std::move(*graph_),
+  MP_RETURN_IF_ERROR(gl_environment_->NewInferenceBuilder(std::move(*graph_gl_),
                                                           gl_options, builder));
-  graph_.release();
+  return absl::OkStatus();
+}
+
+absl::Status TFLiteGPURunner::InitializeOpenCL(
+    std::unique_ptr<InferenceBuilder>* builder) {
   return absl::OkStatus();
 }
 
diff --git a/mediapipe/util/tflite/tflite_gpu_runner.h b/mediapipe/util/tflite/tflite_gpu_runner.h
index 12f744532..fef2a818f 100644
--- a/mediapipe/util/tflite/tflite_gpu_runner.h
+++ b/mediapipe/util/tflite/tflite_gpu_runner.h
@@ -67,12 +67,15 @@ class TFLiteGPURunner {
  private:
   mediapipe::Status InitializeOpenGL(
       std::unique_ptr<InferenceBuilder>* builder);
+  mediapipe::Status InitializeOpenCL(
+      std::unique_ptr<InferenceBuilder>* builder);
 
   InferenceOptions options_;
   std::unique_ptr<gl::InferenceEnvironment> gl_environment_;
 
   // graph_ is maintained temporarily and becomes invalid after runner_ is ready
-  std::unique_ptr<GraphFloat32> graph_;
+  std::unique_ptr<GraphFloat32> graph_gl_;
+  std::unique_ptr<GraphFloat32> graph_cl_;
   std::unique_ptr<InferenceRunner> runner_;
 
   // We keep information about input/output shapes, because they are needed
diff --git a/mediapipe/util/tracking/BUILD b/mediapipe/util/tracking/BUILD
index 8280c07cb..2e881a789 100644
--- a/mediapipe/util/tracking/BUILD
+++ b/mediapipe/util/tracking/BUILD
@@ -426,6 +426,7 @@ cc_library(
         "//mediapipe/framework/port:logging",
         "//mediapipe/framework/port:vector",
         "@com_google_absl//absl/container:node_hash_map",
+        "@com_google_absl//absl/container:node_hash_set",
         "@com_google_absl//absl/strings",
         "@eigen_archive//:eigen",
     ],
diff --git a/mediapipe/util/tracking/motion_estimation.cc b/mediapipe/util/tracking/motion_estimation.cc
index 341d91f53..18e74392d 100644
--- a/mediapipe/util/tracking/motion_estimation.cc
+++ b/mediapipe/util/tracking/motion_estimation.cc
@@ -30,6 +30,7 @@
 #include "Eigen/QR"
 #include "Eigen/SVD"
 #include "absl/container/node_hash_map.h"
+#include "absl/container/node_hash_set.h"
 #include "absl/strings/str_cat.h"
 #include "mediapipe/framework/port/logging.h"
 #include "mediapipe/util/tracking/camera_motion.h"
@@ -2132,7 +2133,7 @@ void MotionEstimation::UpdateLongFeatureBias(
   }
 
   // Tracks current ids in this frame.
-  std::unordered_set<int> curr_track_ids;
+  absl::node_hash_set<int> curr_track_ids;
 
   // Scale applied to irls weight for linear interpolation between inlier and
   // outlier bias.
diff --git a/setup_opencv.sh b/setup_opencv.sh
index 04b219c97..983ccc7cd 100644
--- a/setup_opencv.sh
+++ b/setup_opencv.sh
@@ -32,6 +32,9 @@ if [ "$1" ] && [ "$1" != "config_only" ]
     exit 0
 fi
 
+opencv_build_file="$( cd "$(dirname "$0")" ; pwd -P )"/third_party/opencv_linux.BUILD
+workspace_file="$( cd "$(dirname "$0")" ; pwd -P )"/WORKSPACE
+
 if [ -z "$1" ]
   then
     echo "Installing OpenCV from source"
@@ -76,9 +79,6 @@ fi
 # Modify the build file.
 echo "Modifying MediaPipe opencv config"
 
-opencv_build_file="$( cd "$(dirname "$0")" ; pwd -P )"/third_party/opencv_linux.BUILD
-workspace_file="$( cd "$(dirname "$0")" ; pwd -P )"/WORKSPACE
-
 sed -i "s/lib\/x86_64-linux-gnu/lib/g" $opencv_build_file
 linux_opencv_config=$(grep -n 'linux_opencv' $workspace_file | awk -F  ":" '{print $1}')
 path_line=$((linux_opencv_config + 2))
diff --git a/third_party/org_tensorflow_compatibility_fixes.diff b/third_party/org_tensorflow_compatibility_fixes.diff
index 4f8579d98..5478e3d02 100644
--- a/third_party/org_tensorflow_compatibility_fixes.diff
+++ b/third_party/org_tensorflow_compatibility_fixes.diff
@@ -23,3 +23,62 @@ index b7c22ae77b..d0ba7b48b4 100644
        pct_samples.points.push_back(pct);
      }
    }
+diff --git a/tensorflow/lite/delegates/gpu/cl/api.cc b/tensorflow/lite/delegates/gpu/cl/api.cc
+index 09c82307a5..0318c1a447 100644
+--- a/tensorflow/lite/delegates/gpu/cl/api.cc
++++ b/tensorflow/lite/delegates/gpu/cl/api.cc
+@@ -352,10 +352,10 @@ class GlBufferHolder : public TensorTie {
+ };
+ 
+ TensorObject TensorToObj(const Tensor& tensor) {
+-  if (tensor.StorageType() == TensorStorageType::BUFFER) {
++  if (tensor.GetStorageType() == TensorStorageType::BUFFER) {
+     return OpenClBuffer{tensor.GetMemoryPtr()};
+   }
+-  if (tensor.StorageType() == TensorStorageType::IMAGE_BUFFER) {
++  if (tensor.GetStorageType() == TensorStorageType::IMAGE_BUFFER) {
+     return OpenClBuffer{tensor.GetMemoryPtrForWriting()};
+   }
+   return OpenClTexture{tensor.GetMemoryPtr()};
+@@ -516,9 +516,9 @@ TensorObjectDef TensorToDef(const Tensor& tensor) {
+   def.dimensions.h = tensor.Height();
+   def.dimensions.w = tensor.Width();
+   def.dimensions.c = tensor.Channels();
+-  def.object_def.data_layout = ToDataLayout(tensor.StorageType());
+-  def.object_def.data_type = tensor.DataType();
+-  def.object_def.object_type = ToObjectType(tensor.StorageType());
++  def.object_def.data_layout = ToDataLayout(tensor.GetStorageType());
++  def.object_def.data_type = tensor.GetDataType();
++  def.object_def.object_type = ToObjectType(tensor.GetStorageType());
+   def.object_def.user_provided = false;
+   return def;
+ }
+diff --git a/tensorflow/lite/delegates/gpu/cl/tensor.cc b/tensorflow/lite/delegates/gpu/cl/tensor.cc
+index 308e1b6920..9b613c63f7 100644
+--- a/tensorflow/lite/delegates/gpu/cl/tensor.cc
++++ b/tensorflow/lite/delegates/gpu/cl/tensor.cc
+@@ -29,7 +29,7 @@ namespace cl {
+ namespace {
+ 
+ absl::Status CreateImageBufferFromBuffer(const CLContext& context,
+-                                         cl_mem memory, enum DataType data_type,
++                                         cl_mem memory, DataType data_type,
+                                          int width, cl_mem* result) {
+   cl_image_format format;
+   cl_image_desc desc;
+diff --git a/tensorflow/lite/delegates/gpu/cl/tensor.h b/tensorflow/lite/delegates/gpu/cl/tensor.h
+index a27c54a74e..39d3a04a47 100644
+--- a/tensorflow/lite/delegates/gpu/cl/tensor.h
++++ b/tensorflow/lite/delegates/gpu/cl/tensor.h
+@@ -75,8 +75,8 @@ class Tensor {
+   int4 GetWHSB() const { return int4(shape_.w, shape_.h, Slices(), shape_.b); }
+   int4 GetWHDS() const { return int4(shape_.w, shape_.h, shape_.d, Slices()); }
+ 
+-  enum DataType DataType() const { return descriptor_.data_type; }
+-  TensorStorageType StorageType() const { return descriptor_.storage_type; }
++  DataType GetDataType() const { return descriptor_.data_type; }
++  TensorStorageType GetStorageType() const { return descriptor_.storage_type; }
+ 
+   // for profiling and memory statistics
+   uint64_t GetMemorySizeInBytes() const;
+