diff --git a/.idea/.gitignore b/.idea/.gitignore
new file mode 100644
index 000000000..73f69e095
--- /dev/null
+++ b/.idea/.gitignore
@@ -0,0 +1,8 @@
+# Default ignored files
+/shelf/
+/workspace.xml
+# Datasource local storage ignored files
+/dataSources/
+/dataSources.local.xml
+# Editor-based HTTP Client requests
+/httpRequests/
diff --git a/.idea/inspectionProfiles/profiles_settings.xml b/.idea/inspectionProfiles/profiles_settings.xml
new file mode 100644
index 000000000..105ce2da2
--- /dev/null
+++ b/.idea/inspectionProfiles/profiles_settings.xml
@@ -0,0 +1,6 @@
+<component name="InspectionProjectProfileManager">
+  <settings>
+    <option name="USE_PROJECT_PROFILE" value="false" />
+    <version value="1.0" />
+  </settings>
+</component>
\ No newline at end of file
diff --git a/.idea/mediapipe.iml b/.idea/mediapipe.iml
new file mode 100644
index 000000000..8b8c39547
--- /dev/null
+++ b/.idea/mediapipe.iml
@@ -0,0 +1,12 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<module type="PYTHON_MODULE" version="4">
+  <component name="NewModuleRootManager">
+    <content url="file://$MODULE_DIR$" />
+    <orderEntry type="inheritedJdk" />
+    <orderEntry type="sourceFolder" forTests="false" />
+  </component>
+  <component name="PyDocumentationSettings">
+    <option name="format" value="PLAIN" />
+    <option name="myDocStringFormat" value="Plain" />
+  </component>
+</module>
\ No newline at end of file
diff --git a/.idea/misc.xml b/.idea/misc.xml
new file mode 100644
index 000000000..084c5288e
--- /dev/null
+++ b/.idea/misc.xml
@@ -0,0 +1,4 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<project version="4">
+  <component name="ProjectRootManager" version="2" project-jdk-name="Python 3.9 (projects python)" project-jdk-type="Python SDK" />
+</project>
\ No newline at end of file
diff --git a/.idea/modules.xml b/.idea/modules.xml
new file mode 100644
index 000000000..3c43275a1
--- /dev/null
+++ b/.idea/modules.xml
@@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<project version="4">
+  <component name="ProjectModuleManager">
+    <modules>
+      <module fileurl="file://$PROJECT_DIR$/.idea/mediapipe.iml" filepath="$PROJECT_DIR$/.idea/mediapipe.iml" />
+    </modules>
+  </component>
+</project>
\ No newline at end of file
diff --git a/.idea/vcs.xml b/.idea/vcs.xml
new file mode 100644
index 000000000..94a25f7f4
--- /dev/null
+++ b/.idea/vcs.xml
@@ -0,0 +1,6 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<project version="4">
+  <component name="VcsDirectoryMappings">
+    <mapping directory="$PROJECT_DIR$" vcs="Git" />
+  </component>
+</project>
\ No newline at end of file
diff --git a/docs/solutions/hands.md b/docs/solutions/hands.md
index 6cf2264ed..4afd390d6 100644
--- a/docs/solutions/hands.md
+++ b/docs/solutions/hands.md
@@ -36,7 +36,7 @@ and hand gesture control, and can also enable the overlay of digital content and
 information on top of the physical world in augmented reality. While coming
 naturally to people, robust real-time hand perception is a decidedly challenging
 computer vision task, as hands often occlude themselves or each other (e.g.
-finger/palm occlusions and hand shakes) and lack high contrast patterns.
+finger/palm occlusions and handshakes) and lack high contrast patterns.
 
 MediaPipe Hands is a high-fidelity hand and finger tracking solution. It employs
 machine learning (ML) to infer 21 3D landmarks of a hand from just a single
@@ -116,12 +116,12 @@ train a palm detector instead of a hand detector, since estimating bounding
 boxes of rigid objects like palms and fists is significantly simpler than
 detecting hands with articulated fingers. In addition, as palms are smaller
 objects, the non-maximum suppression algorithm works well even for two-hand
-self-occlusion cases, like handshakes. Moreover, palms can be modelled using
+self-occlusion cases, like handshakes. Moreover, palms can be modeled using
 square bounding boxes (anchors in ML terminology) ignoring other aspect ratios,
 and therefore reducing the number of anchors by a factor of 3-5. Second, an
 encoder-decoder feature extractor is used for bigger scene context awareness
 even for small objects (similar to the RetinaNet approach). Lastly, we minimize
-the focal loss during training to support a large amount of anchors resulting
+the focal loss during training to support a large number of anchors resulting
 from the high scale variance.
 
 With the above techniques, we achieve an average precision of 95.7% in palm
@@ -138,7 +138,7 @@ The model learns a consistent internal hand pose representation and is robust
 even to partially visible hands and self-occlusions.
 
 To obtain ground truth data, we have manually annotated ~30K real-world images
-with 21 3D coordinates, as shown below (we take Z-value from image depth map, if
+with 21 3D coordinates, as shown below (we take Z-value from the image depth map, if
 it exists per corresponding coordinate). To better cover the possible hand poses
 and provide additional supervision on the nature of hand geometry, we also
 render a high-quality synthetic hand model over various backgrounds and map it
@@ -172,11 +172,11 @@ unrelated, images. Default to `false`.
 
 #### max_num_hands
 
-Maximum number of hands to detect. Default to `2`.
+The maximum number of hands to detect. Default to `2`.
 
 #### model_complexity
 
-Complexity of the hand landmark model: `0` or `1`. Landmark accuracy as well as
+The complexity of the hand landmark model: `0` or `1`. Landmark accuracy as well as
 inference latency generally go up with the model complexity. Default to `1`.
 
 #### min_detection_confidence
@@ -217,7 +217,7 @@ approximate geometric center.
 
 Collection of handedness of the detected/tracked hands (i.e. is it a left or
 right hand). Each hand is composed of `label` and `score`. `label` is a string
-of value either `"Left"` or `"Right"`. `score` is the estimated probability of
+of values either `"Left"` or `"Right"`. `score` is the estimated probability of
 the predicted handedness and is always greater than or equal to `0.5` (and the
 opposite handedness has an estimated probability of `1 - score`).