Graph builder Dos and Donts / Nodes minimal direct usage

PiperOrigin-RevId: 509632450
2023-02-14 14:05:58 -08:00 · 2023-02-14 14:05:58 -08:00 · 63a57e2da3
commit 63a57e2da3
parent 9b1fe849d5
1 changed files with 184 additions and 0 deletions
--- a/docs/framework_concepts/building_graphs_cpp.md
+++ b/docs/framework_concepts/building_graphs_cpp.md
@ -409,3 +409,187 @@ CalculatorGraphConfig BuildGraph() {
  return graph.GetConfig();
 }
 ```
+
+### Keep nodes decoupled from each other
+
+In MediaPipe, packet streams and side packets are as meaningful as processing
+nodes. And any node input requirements and output products are expressed clearly
+and independently in terms of the streams and side packets it consumes and
+produces.
+
+```c++ {.bad}
+CalculatorGraphConfig BuildGraph() {
+  Graph graph;
+
+  // Inputs.
+  Stream<A> a = graph.In(0).Cast<A>();
+
+  auto& node1 = graph.AddNode("Calculator1");
+  a.ConnectTo(node1.In("INPUT"));
+
+  auto& node2 = graph.AddNode("Calculator2");
+  node1.Out("OUTPUT").ConnectTo(node2.In("INPUT"));  // Bad.
+
+  auto& node3 = graph.AddNode("Calculator3");
+  node1.Out("OUTPUT").ConnectTo(node3.In("INPUT_B"));  // Bad.
+  node2.Out("OUTPUT").ConnectTo(node3.In("INPUT_C"));  // Bad.
+
+  auto& node4 = graph.AddNode("Calculator4");
+  node1.Out("OUTPUT").ConnectTo(node4.In("INPUT_B"));  // Bad.
+  node2.Out("OUTPUT").ConnectTo(node4.In("INPUT_C"));  // Bad.
+  node3.Out("OUTPUT").ConnectTo(node4.In("INPUT_D"));  // Bad.
+
+  // Outputs.
+  node1.Out("OUTPUT").SetName("b").ConnectTo(graph.Out(0));  // Bad.
+  node2.Out("OUTPUT").SetName("c").ConnectTo(graph.Out(1));  // Bad.
+  node3.Out("OUTPUT").SetName("d").ConnectTo(graph.Out(2));  // Bad.
+  node4.Out("OUTPUT").SetName("e").ConnectTo(graph.Out(3));  // Bad.
+
+  return graph.GetConfig();
+}
+```
+
+In the above code:
+
+*   Nodes are coupled to each other, e.g. `node4` knows where its inputs are
+    coming from (`node1`, `node2`, `node3`) and it complicates refactoring,
+    maintenance and code reuse
+    *   Such usage pattern is a downgrade from proto representation, where nodes
+        are decoupled by default.
+*   `node#.Out("OUTPUT")` calls are duplicated and readability suffers as you
+    could use cleaner names instead and also provide an actual type.
+
+So, to fix the above issues you can write the following graph construction code:
+
+```c++ {.good}
+CalculatorGraphConfig BuildGraph() {
+  Graph graph;
+
+  // Inputs.
+  Stream<A> a = graph.In(0).Cast<A>();
+
+  // `node1` usage is limited to 3 lines below.
+  auto& node1 = graph.AddNode("Calculator1");
+  a.ConnectTo(node1.In("INPUT"));
+  Stream<B> b = node1.Out("OUTPUT").Cast<B>();
+
+  // `node2` usage is limited to 3 lines below.
+  auto& node2 = graph.AddNode("Calculator2");
+  b.ConnectTo(node2.In("INPUT"));
+  Stream<C> c = node2.Out("OUTPUT").Cast<C>();
+
+  // `node3` usage is limited to 4 lines below.
+  auto& node3 = graph.AddNode("Calculator3");
+  b.ConnectTo(node3.In("INPUT_B"));
+  c.ConnectTo(node3.In("INPUT_C"));
+  Stream<D> d = node3.Out("OUTPUT").Cast<D>();
+
+  // `node4` usage is limited to 5 lines below.
+  auto& node4 = graph.AddNode("Calculator4");
+  b.ConnectTo(node4.In("INPUT_B"));
+  c.ConnectTo(node4.In("INPUT_C"));
+  d.ConnectTo(node4.In("INPUT_D"));
+  Stream<E> e = node4.Out("OUTPUT").Cast<E>();
+
+  // Outputs.
+  b.SetName("b").ConnectTo(graph.Out(0));
+  c.SetName("c").ConnectTo(graph.Out(1));
+  d.SetName("d").ConnectTo(graph.Out(2));
+  e.SetName("e").ConnectTo(graph.Out(3));
+
+  return graph.GetConfig();
+}
+```
+
+Now, if needed, you can easily remove `node1` and make `b` a graph input and no
+updates are needed to `node2`, `node3`, `node4` (same as in proto representation
+by the way), because they are decoupled from each other.
+
+Overall, the above code replicates the proto graph more closely:
+
+```proto
+input_stream: "a"
+
+node {
+  calculator: "Calculator1"
+  input_stream: "INPUT:a"
+  output_stream: "OUTPUT:b"
+}
+
+node {
+  calculator: "Calculator2"
+  input_stream: "INPUT:b"
+  output_stream: "OUTPUT:C"
+}
+
+node {
+  calculator: "Calculator3"
+  input_stream: "INPUT_B:b"
+  input_stream: "INPUT_C:c"
+  output_stream: "OUTPUT:d"
+}
+
+node {
+  calculator: "Calculator4"
+  input_stream: "INPUT_B:b"
+  input_stream: "INPUT_C:c"
+  input_stream: "INPUT_D:d"
+  output_stream: "OUTPUT:e"
+}
+
+output_stream: "b"
+output_stream: "c"
+output_stream: "d"
+output_stream: "e"
+```
+
+On top of that, now you can extract utility functions for further reuse in other graphs:
+
+```c++ {.good}
+Stream<B> RunCalculator1(Stream<A> a, Graph& graph) {
+  auto& node = graph.AddNode("Calculator1");
+  a.ConnectTo(node.In("INPUT"));
+  return node.Out("OUTPUT").Cast<B>();
+}
+
+Stream<C> RunCalculator2(Stream<B> b, Graph& graph) {
+  auto& node = graph.AddNode("Calculator2");
+  b.ConnectTo(node.In("INPUT"));
+  return node.Out("OUTPUT").Cast<C>();
+}
+
+Stream<D> RunCalculator3(Stream<B> b, Stream<C> c, Graph& graph) {
+  auto& node = graph.AddNode("Calculator3");
+  b.ConnectTo(node.In("INPUT_B"));
+  c.ConnectTo(node.In("INPUT_C"));
+  return node.Out("OUTPUT").Cast<D>();
+}
+
+Stream<E> RunCalculator4(Stream<B> b, Stream<C> c, Stream<D> d, Graph& graph) {
+  auto& node = graph.AddNode("Calculator4");
+  b.ConnectTo(node.In("INPUT_B"));
+  c.ConnectTo(node.In("INPUT_C"));
+  d.ConnectTo(node.In("INPUT_D"));
+  return node.Out("OUTPUT").Cast<E>();
+}
+
+CalculatorGraphConfig BuildGraph() {
+  Graph graph;
+
+  // Inputs.
+  Stream<A> a = graph.In(0).Cast<A>();
+
+  Stream<B> b = RunCalculator1(a, graph);
+  Stream<C> c = RunCalculator2(b, graph);
+  Stream<D> d = RunCalculator3(b, c, graph);
+  Stream<E> e = RunCalculator4(b, c, d, graph);
+
+  // Outputs.
+  b.SetName("b").ConnectTo(graph.Out(0));
+  c.SetName("c").ConnectTo(graph.Out(1));
+  d.SetName("d").ConnectTo(graph.Out(2));
+  e.SetName("e").ConnectTo(graph.Out(3));
+
+  return graph.GetConfig();
+}
+```