
Commit 191d2dd

util: function to extract part of an ONNX model (onnx#2994)
* util: function to extract part of an ONNX model

  Sometimes, people would like to _extract_ part of a model for development,
  validation or other purposes. With `onnx.util.extract`, this is doable by
  specifying the input and output tensor names of the subgraph.

  Signed-off-by: Zhenhua Wang <zhenhuaw@nvidia.com>

* Address review comments onnx#1

* Re-style function of Extractor

* Reject empty input/output names

* Misc change for readability

* Type annotation

Signed-off-by: Zhenhua Wang <zhenhuaw@nvidia.com>
1 parent 6d16b32 commit 191d2dd

File tree: 4 files changed (+229, -4 lines)

  docs/PythonAPIOverview.md
  onnx/__init__.py
  onnx/test/utils_test.py
  onnx/utils.py

docs/PythonAPIOverview.md (20 additions, 1 deletion)

````diff
@@ -257,13 +257,32 @@ Function `polish_model` runs model checker, optimizer, shape inference engine on
 and also strips the doc_string for you.
 ```python
 import onnx
-import onnx.utils
 
 
 model = onnx.load('path/to/the/model.onnx')
 polished_model = onnx.utils.polish_model(model)
 ```
 
+### Extracting Sub-model with Inputs Outputs Tensor Names
+
+Function `extract_model()` extracts sub-model from an ONNX model.
+The sub-model is defined by the names of the input and output tensors *exactly*.
+
+```python
+import onnx
+
+input_path = 'path/to/the/original/model.onnx'
+output_path = 'path/to/save/the/extracted/model.onnx'
+input_names = ['input_0', 'input_1', 'input_2']
+output_names = ['output_0', 'output_1']
+
+onnx.utils.extract_model(input_path, output_path, input_names, output_names)
+```
+
+Note: For control-flow operators, e.g. If and Loop, the _boundary of sub-model_,
+which is defined by the input and output tensors, should not _cut through_ the
+subgraph that is connected to the _main graph_ as attributes of these operators.
+
 ## Tools
 ### Updating Model's Inputs Outputs Dimension Sizes with Variable Length
 Function `update_inputs_outputs_dims` updates the dimension of the inputs and outputs of the model,
````
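The documented `extract_model()` call works on file paths. When the model is already in memory, the `Extractor` class that this commit adds to `onnx/utils.py` can be driven directly. A minimal sketch, reusing the hypothetical tensor names from the example above; note that this in-memory path skips the checker runs that the module-level function performs:

```python
import onnx
import onnx.utils

model = onnx.load('path/to/the/original/model.onnx')  # placeholder path

# Extractor runs shape inference on construction, so intermediate
# activations have ValueInfo entries and can be promoted to
# graph inputs/outputs of the sub-model.
extractor = onnx.utils.Extractor(model)
extracted = extractor.extract_model(['input_0', 'input_1', 'input_2'],
                                    ['output_0', 'output_1'])

# The module-level extract_model() validates for us; here we do it by hand.
onnx.checker.check_model(extracted)
onnx.save(extracted, 'path/to/save/the/extracted/model.onnx')
```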

onnx/__init__.py (2 additions, 1 deletion)

````diff
@@ -13,9 +13,10 @@
 from .version import version as __version__  # noqa
 
 # Import common subpackages so they're available when you 'import onnx'
-import onnx.helper  # noqa
 import onnx.checker  # noqa
 import onnx.defs  # noqa
+import onnx.helper  # noqa
+import onnx.utils  # noqa
 
 import google.protobuf.message
 
````
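Besides alphabetizing the subpackage imports, this change makes `onnx.utils` available as soon as `onnx` itself is imported, which is why the documentation example above could drop its explicit `import onnx.utils`. A small sketch (the model path is a placeholder):

```python
import onnx  # onnx.utils is now imported automatically

model = onnx.load('path/to/the/model.onnx')
# Both the existing polish_model and the new extract_model are
# reachable without a separate `import onnx.utils`:
polished = onnx.utils.polish_model(model)
```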
onnx/test/utils_test.py (52 additions, 1 deletion)

````diff
@@ -3,8 +3,12 @@
 from __future__ import print_function
 from __future__ import unicode_literals
 
+import os
+import shutil
+import tempfile
 import unittest
-import onnx.utils
+
+import onnx
 from onnx import helper, TensorProto
 
 
@@ -23,6 +27,53 @@ def test_polish_model(self):  # type: () -> None
         self.assertEqual(len(polished_def.graph.node), 1)
         self.assertFalse(polished_def.graph.node[0].HasField('doc_string'))
 
+    def test_extract_model(self):  # type: () -> None
+        def create_tensor(name):  # type: ignore
+            return helper.make_tensor_value_info(name, TensorProto.FLOAT, [1, 2])
+        A0 = create_tensor("A0")
+        A1 = create_tensor("A1")
+        B0 = create_tensor("B0")
+        B1 = create_tensor("B1")
+        B2 = create_tensor("B2")
+        C0 = create_tensor("C0")
+        C1 = create_tensor("C1")
+        D0 = create_tensor("D0")
+        L0_0 = helper.make_node("Add", ["A0", "A1"], ["B0"])
+        L0_1 = helper.make_node("Sub", ["A0", "A1"], ["B1"])
+        L0_2 = helper.make_node("Mul", ["A0", "A1"], ["B2"])
+        L1_0 = helper.make_node("Add", ["B0", "B1"], ["C0"])
+        L1_1 = helper.make_node("Sub", ["B1", "B2"], ["C1"])
+        L2_0 = helper.make_node("Mul", ["C0", "C1"], ["D0"])
+
+        g0 = helper.make_graph(
+            [L0_0, L0_1, L0_2, L1_0, L1_1, L2_0],
+            "test",
+            [A0, A1],
+            [D0])
+        m0 = helper.make_model(g0, producer_name='test')
+        tdir = tempfile.mkdtemp()
+        p0 = os.path.join(tdir, "original.onnx")
+        onnx.save(m0, p0)
+
+        p1 = os.path.join(tdir, "extracted.onnx")
+        input_names = ["B0", "B1", "B2"]
+        output_names = ["C0", "C1"]
+        onnx.utils.extract_model(p0, p1, input_names, output_names)
+
+        m1 = onnx.load(p1)
+        self.assertEqual(m1.producer_name, 'onnx.utils.extract_model')
+        self.assertEqual(m1.ir_version, m0.ir_version)
+        self.assertEqual(m1.opset_import, m0.opset_import)
+        self.assertEqual(len(m1.graph.node), 2)
+        self.assertEqual(len(m1.graph.input), 3)
+        self.assertEqual(len(m1.graph.output), 2)
+        self.assertEqual(m1.graph.input[0], B0)
+        self.assertEqual(m1.graph.input[1], B1)
+        self.assertEqual(m1.graph.input[2], B2)
+        self.assertEqual(m1.graph.output[0], C0)
+        self.assertEqual(m1.graph.output[1], C1)
+        shutil.rmtree(tdir, ignore_errors=True)
+
 
 if __name__ == '__main__':
     unittest.main()
````
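To see why the assertions expect exactly two nodes, three inputs and two outputs: the test graph is three layers deep, and the requested boundary (inputs B0/B1/B2, outputs C0/C1) encloses only the middle layer, i.e. the Add producing C0 and the Sub producing C1:

```
A0, A1 --(Add, Sub, Mul)--> B0, B1, B2 --(Add, Sub)--> C0, C1 --(Mul)--> D0
                            |<------ extracted sub-model ----->|
```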

onnx/utils.py (155 additions, 1 deletion)

````diff
@@ -3,12 +3,15 @@
 from __future__ import print_function
 from __future__ import unicode_literals
 
+import os
+from typing import List, Tuple, Text
+
 import onnx.checker
 import onnx.helper
 import onnx.optimizer
 import onnx.shape_inference
 
-from onnx import ModelProto
+from onnx import ModelProto, NodeProto, TensorProto, ValueInfoProto
 
 
 def polish_model(model):  # type: (ModelProto) -> ModelProto
@@ -21,3 +24,154 @@ def polish_model(model):  # type: (ModelProto) -> ModelProto
     model = onnx.optimizer.optimize(model)
     onnx.checker.check_model(model)
     return model
+
+
+class Extractor:
+    def __init__(self, model):  # type: (ModelProto) -> None
+        self.model = onnx.shape_inference.infer_shapes(model)
+        self.graph = self.model.graph
+        self.wmap = self._build_name2obj_dict(self.graph.initializer)
+        self.vimap = self._build_name2obj_dict(self.graph.value_info)
+
+    @staticmethod
+    def _build_name2obj_dict(objs):  # type: ignore
+        return {obj.name: obj for obj in objs}
+
+    def _collect_new_io_core(self, original_io, io_names_to_extract):  # type: ignore
+        original_io_map = self._build_name2obj_dict(original_io)
+        original_io_names = set(original_io_map.keys())
+        s_io_names_to_extract = set(io_names_to_extract)
+        io_names_to_keep = s_io_names_to_extract & original_io_names
+        new_io_names_to_add = s_io_names_to_extract - original_io_names
+
+        new_io_tensors = []
+        for name in io_names_to_keep:
+            new_io_tensors.append(original_io_map[name])
+        for name in new_io_names_to_add:
+            # activation become input or output
+            new_io_tensors.append(self.vimap[name])
+
+        # adjust sequence
+        new_io_tensors_map = self._build_name2obj_dict(new_io_tensors)
+        return [new_io_tensors_map[name] for name in io_names_to_extract]
+
+    def _collect_new_inputs(self, names):  # type: (List[Text]) -> List[ValueInfoProto]
+        return self._collect_new_io_core(self.graph.input, names)  # type: ignore
+
+    def _collect_new_outputs(self, names):  # type: (List[Text]) -> List[ValueInfoProto]
+        return self._collect_new_io_core(self.graph.output, names)  # type: ignore
+
+    def _dfs_search_reachable_nodes(
+        self,
+        node_output_name,  # type: Text
+        graph_input_names,  # type: List[Text]
+        reachable_nodes,  # type: List[NodeProto]
+    ):  # type: (...) -> None
+        if node_output_name in graph_input_names:
+            return
+        for node in self.graph.node:
+            if node in reachable_nodes:
+                continue
+            if node_output_name not in node.output:
+                continue
+            reachable_nodes.append(node)
+            for name in node.input:
+                self._dfs_search_reachable_nodes(name, graph_input_names, reachable_nodes)
+
+    def _collect_reachable_nodes(
+        self,
+        input_names,  # type: List[Text]
+        output_names,  # type: List[Text]
+    ):  # type: (...) -> List[NodeProto]
+        reachable_nodes = list()  # type: ignore
+        for name in output_names:
+            self._dfs_search_reachable_nodes(name, input_names, reachable_nodes)
+        # needs to be topology sorted.
+        nodes = [n for n in self.graph.node if n in reachable_nodes]
+        return nodes
+
+    def _collect_reachable_tensors(
+        self,
+        nodes,  # type: List[NodeProto]
+    ):  # type: (...) -> Tuple[List[TensorProto], List[ValueInfoProto]]
+        all_tensors_name = set()
+        for node in nodes:
+            for name in node.input:
+                all_tensors_name.add(name)
+            for name in node.output:
+                all_tensors_name.add(name)
+
+        initializer = [self.wmap[t] for t in self.wmap.keys() if t in all_tensors_name]
+        value_info = [self.vimap[t] for t in self.vimap.keys() if t in all_tensors_name]
+        assert(len(self.graph.sparse_initializer) == 0)
+        assert(len(self.graph.quantization_annotation) == 0)
+        return (initializer, value_info)
+
+    def _make_model(
+        self,
+        nodes,  # type: List[NodeProto]
+        inputs,  # type: List[ValueInfoProto]
+        outputs,  # type: List[ValueInfoProto]
+        initializer,  # type: List[TensorProto]
+        value_info  # type: List[ValueInfoProto]
+    ):  # type: (...) -> ModelProto
+        name = 'Extracted from {' + self.graph.name + '}'
+        graph = onnx.helper.make_graph(nodes, name, inputs, outputs, initializer=initializer,
+                                       value_info=value_info)
+
+        meta = {
+            'ir_version': self.model.ir_version,
+            'opset_imports': self.model.opset_import,
+            'producer_name': 'onnx.utils.extract_model',
+        }
+        return onnx.helper.make_model(graph, **meta)
+
+    def extract_model(
+        self,
+        input_names,  # type: List[Text]
+        output_names,  # type: List[Text]
+    ):  # type: (...) -> ModelProto
+        inputs = self._collect_new_inputs(input_names)
+        outputs = self._collect_new_outputs(output_names)
+        nodes = self._collect_reachable_nodes(input_names, output_names)
+        initializer, value_info = self._collect_reachable_tensors(nodes)
+        model = self._make_model(nodes, inputs, outputs, initializer, value_info)
+
+        return model
+
+
+def extract_model(
+    input_path,  # type: Text
+    output_path,  # type: Text
+    input_names,  # type: List[Text]
+    output_names  # type: List[Text]
+):  # type: (...) -> None
+    """Extracts sub-model from an ONNX model.
+
+    The sub-model is defined by the names of the input and output tensors *exactly*.
+
+    Note: For control-flow operators, e.g. If and Loop, the _boundary of sub-model_,
+    which is defined by the input and output tensors, should not _cut through_ the
+    subgraph that is connected to the _main graph_ as attributes of these operators.
+
+    Arguments:
+        input_path (string): The path to original ONNX model.
+        output_path (string): The path to save the extracted ONNX model.
+        input_names (list of string): The names of the input tensors that to be extracted.
+        output_names (list of string): The names of the output tensors that to be extracted.
+    """
+    if not os.path.exists(input_path):
+        raise ValueError("Invalid input model path: %s" % input_path)
+    if not output_path:
+        raise ValueError("Output model path shall not be empty!")
+    if not output_names:
+        raise ValueError("Output tensor names shall not be empty!")
+
+    onnx.checker.check_model(input_path)
+    model = onnx.load(input_path)
+
+    e = Extractor(model)
+    extracted = e.extract_model(input_names, output_names)
+
+    onnx.save(extracted, output_path)
+    onnx.checker.check_model(output_path)
````
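The heart of the implementation is `_dfs_search_reachable_nodes`: starting from each requested output, it walks backwards through the node that produces each tensor and stops once it reaches a requested input. A minimal standalone sketch of the same idea on a toy node representation (plain tuples instead of `NodeProto`; the graph and names are made up):

```python
# Toy nodes as (op, inputs, outputs); mirrors the backward DFS in Extractor.
nodes = [
    ("Add", ["A0", "A1"], ["B0"]),
    ("Sub", ["A0", "A1"], ["B1"]),
    ("Mul", ["B0", "B1"], ["C0"]),
]

def search(tensor, boundary_inputs, reached):
    if tensor in boundary_inputs:   # stop at the sub-model boundary
        return
    for node in nodes:
        if node in reached or tensor not in node[2]:
            continue                # already visited, or not the producer
        reached.append(node)
        for name in node[1]:        # recurse into the producer's inputs
            search(name, boundary_inputs, reached)

reached = []                        # nodes reached from the requested outputs
for name in ["C0"]:                 # requested outputs
    search(name, ["A0", "A1"], reached)
# Re-filter in original order: graph.node is topologically sorted, so this
# keeps the extracted node list topologically sorted too.
ordered = [n for n in nodes if n in reached]
print([n[0] for n in ordered])      # ['Add', 'Sub', 'Mul']
```

One consequence of the recursive traversal worth noting: recursion depth grows with graph depth, so an extremely deep model could in principle hit Python's default recursion limit, though for typical models this is not a concern.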
