Support set schema inference function in python #5940

Open · wants to merge 12 commits into main
132 changes: 132 additions & 0 deletions onnx/cpp2py_export.cc
@@ -2,6 +2,7 @@
//
// SPDX-License-Identifier: Apache-2.0

#include <pybind11/functional.h>
#include <pybind11/pybind11.h>
#include <pybind11/stl.h>

@@ -15,6 +16,7 @@
#include "onnx/defs/parser.h"
#include "onnx/defs/printer.h"
#include "onnx/defs/schema.h"
#include "onnx/defs/shape_inference.h"
#include "onnx/inliner/inliner.h"
#include "onnx/py_utils.h"
#include "onnx/shape_inference/implementation.h"
@@ -114,6 +116,9 @@ PYBIND11_MODULE(onnx_cpp2py_export, onnx_cpp2py_export) {
#endif // ONNX_ML
);

// Avoid a segmentation fault if we do not free the Python functions held by custom schemas
onnx_cpp2py_export.add_object("_cleanup", py::capsule([] { OpSchemaRegistry::OpSchemaDeregisterAll(); }));
Contributor Author:

Perhaps a more graceful approach would be to collect the schemas registered from Python and deregister them during cleanup. However, I'm not sure if it's worth the effort. In most cases, invoking cleanup implies that Python is exiting.

Contributor:

Can you clarify when this gets invoked?

Contributor Author:

I think the segfault is caused by the following: the Python object (the inference function in the custom schema) must be destroyed before the Python interpreter is destroyed. The static container inside the schema factory is destroyed after the main function exits but before the interpreter is torn down, so we need to release the Python object manually.

About '_cleanup' : https://pybind11.readthedocs.io/en/stable/advanced/misc.html#module-destructors
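For reference, a minimal sketch of the lifetime problem, assuming the API added in this PR (`set_type_and_shape_inference_function` plus the existing `onnx.defs.register_schema`): the Python callable is captured by a `std::function` stored in the static `OpSchemaRegistry`, so without the `_cleanup` capsule it would only be released during C++ static teardown, after the interpreter has already been finalized.

```python
import onnx
from onnx.defs import OpSchema

def infer(ctx):
    # Python callable that will be held by the C++ schema registry.
    pass

schema = OpSchema("CustomOp", "", 1)
schema.set_type_and_shape_inference_function(infer)  # C++ std::function now references `infer`
onnx.defs.register_schema(schema)                    # stored in the static OpSchemaRegistry

# On interpreter exit, the `_cleanup` capsule calls OpSchemaDeregisterAll(),
# dropping the reference to `infer` while Python is still alive; without it the
# reference would be released during static destruction, after finalization.
```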


// Submodule `schema`
auto defs = onnx_cpp2py_export.def_submodule("defs");
defs.doc() = "Schema submodule";
@@ -394,6 +399,12 @@ PYBIND11_MODULE(onnx_cpp2py_export, onnx_cpp2py_export) {
func_proto.SerializeToString(&func_bytes);
}
return py::bytes(func_bytes);
})
.def(
"set_type_and_shape_inference_function",
[](OpSchema* op, const std::function<void(InferenceContext*)>& func) {
auto wrapper = [=](InferenceContext& ctx) { func(&ctx); };
return op->TypeAndShapeInferenceFunction(wrapper);
});

defs.def(
@@ -625,6 +636,127 @@ PYBIND11_MODULE(onnx_cpp2py_export, onnx_cpp2py_export) {
shape_inference.doc() = "Shape Inference submodule";
py::register_exception<InferenceError>(shape_inference, "InferenceError");

py::class_<InferenceContext> inference_ctx(shape_inference, "InferenceContext", "Inference context");

inference_ctx.def("__get_attribute", [](InferenceContext* ctx, std::string name) {
if (ctx == nullptr) {
fail_shape_inference("Internal error: `ctx` is nullptr in `__get_attribute`");
}
auto attr = ctx->getAttribute(name);
if (attr == nullptr) {
fail_shape_inference("Internal error: `attr` is nullptr in `__get_attribute`");
Contributor:

This is not an error situation. In C++, this single method plays a dual role, both to check if an attribute is present, and to get its value. Is it possible to return None in this situation?

Contributor:

Or, just return a C++ pointer (using pybind's conventions ... it must have some standard approach).

}
std::string data;
attr->SerializeToString(&data);
return py::bytes(data);
});
inference_ctx.def("get_num_inputs", &InferenceContext::getNumInputs);
inference_ctx.def("has_input", &InferenceContext::hasInput);
inference_ctx.def("__get_input_type", [](InferenceContext* ctx, size_t index) {
if (ctx == nullptr) {
fail_shape_inference("Internal error: `ctx` is nullptr in `__get_input_type`");
}
auto type = ctx->getInputType(index);
if (type == nullptr) {
fail_shape_inference("Internal error: `type` is nullptr in `__get_input_type`");
}
std::string data;
type->SerializeToString(&data);
return py::bytes(data);
});
inference_ctx.def("__get_input_data", [](InferenceContext* ctx, size_t index) {
if (ctx == nullptr) {
fail_shape_inference("Internal error: `ctx` is nullptr in `__get_input_data`");
}
auto tensor = ctx->getInputData(index);
if (tensor == nullptr) {
fail_shape_inference("Internal error: `tensor` is nullptr in `__get_input_data`");
Contributor:

Again, not an error. It signifies that no static constant value is known for this input. Best to map this to None or something similar.

}
std::string data;
tensor->SerializeToString(&data);
return py::bytes(data);
});
inference_ctx.def("__get_input_sparse_data", [](InferenceContext* ctx, size_t index) {
if (ctx == nullptr) {
fail_shape_inference("Internal error: `ctx` is nullptr in `__get_input_sparse_data`");
}
auto stensor = ctx->getInputSparseData(index);
if (stensor == nullptr) {
fail_shape_inference("Internal error: `stensor` is nullptr in `__get_input_sparse_data`");
Contributor:

As above. Map to None?

}
std::string data;
stensor->SerializeToString(&data);
return py::bytes(data);
});
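To illustrate the reviewers' suggestion above, a hypothetical sketch of the None-returning behavior (not what this PR currently implements; the bindings here raise an inference error when the attribute or constant value is absent); `ctx` is assumed to be the InferenceContext passed to a registered inference function:

```python
# Hypothetical: absent attributes / input data map to None instead of raising.
attr = ctx.get_attribute("out_len")  # AttributeProto, or None if the attribute is not present
data = ctx.get_input_data(0)         # TensorProto, or None if no static constant value is known

out_len = list(attr.ints) if attr is not None else [1]  # fall back to a default
if data is not None:
    pass  # value-dependent shape inference could use the constant here
```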
inference_ctx.def("__get_symbolic_input", [](InferenceContext* ctx, size_t index) {
if (ctx == nullptr) {
fail_shape_inference("Internal error: `ctx` is nullptr in `__get_symbolic_input`");
}
auto shape = ctx->getSymbolicInput(index);
if (shape == nullptr) {
fail_shape_inference("Internal error: `shape` is nullptr in `__get_symbolic_input`");
}
std::string data;
shape->SerializeToString(&data);
return py::bytes(data);
});
inference_ctx.def("__get_graph_attribute_inferencer", &InferenceContext::getGraphAttributeInferencer);
inference_ctx.def("get_num_outputs", &InferenceContext::getNumOutputs);
inference_ctx.def("__get_output_type", [](InferenceContext* ctx, size_t index) {
if (ctx == nullptr) {
fail_shape_inference("Internal error: `ctx` is nullptr in `__get_output_type`");
}
auto type = ctx->getOutputType(index);
if (type == nullptr) {
fail_shape_inference("Internal error: `type` is nullptr in `__get_output_type`");
}
std::string data;
type->SerializeToString(&data);
return py::bytes(data);
});
inference_ctx.def("__set_output_type", [](InferenceContext* ctx, size_t index, py::bytes bytes) {
if (ctx == nullptr) {
fail_shape_inference("Internal error: `ctx` is nullptr in `__set_output_type`");
}
auto type = ctx->getOutputType(index);
if (type == nullptr) {
fail_shape_inference("Internal error: `type` is nullptr in `__set_output_type`");
}
ParseProtoFromPyBytes(type, bytes);
});

py::class_<GraphInferencer> graph_inferencer(shape_inference, "GraphInferencer", "Graph Inferencer");
graph_inferencer.def(
"__do_inferencing",
[](GraphInferencer* inferencer,
const std::vector<py::bytes>& input_types,
const std::vector<py::bytes>& input_data) {
std::vector<TypeProto> type_proto;
std::vector<TensorProto> tensor_proto;
std::vector<const TypeProto*> type_inputs;
std::vector<const TensorProto*> tensor_inputs;
for (const auto& bytes : input_types) {
TypeProto proto{};
ParseProtoFromPyBytes(&proto, bytes);
type_proto.emplace_back(proto);
type_inputs.emplace_back(&type_proto.back());
}
for (const auto& bytes : input_data) {
TensorProto proto{};
ParseProtoFromPyBytes(&proto, bytes);
tensor_proto.emplace_back(proto);
tensor_inputs.emplace_back(&tensor_proto.back());
}
auto ret = inferencer->doInferencing(type_inputs, tensor_inputs);
std::vector<py::bytes> out;
for (const auto& type : ret) {
std::string data;
type->SerializeToString(&data);
out.emplace_back(py::bytes(data));
}
return out;
});

shape_inference.def(
"infer_shapes",
[](const py::bytes& bytes, bool check_type, bool strict_mode, bool data_prop) {
1 change: 1 addition & 0 deletions onnx/onnx_cpp2py_export/defs.pyi
@@ -68,6 +68,7 @@
) -> dict[str, bytes]: ...
@property
def function_body(self) -> FunctionProto: ...
def set_type_and_shape_inference_function(self, func) -> None: ...

class TypeConstraintParam:
def __init__(
32 changes: 32 additions & 0 deletions onnx/onnx_cpp2py_export/shape_inference.pyi
@@ -1,6 +1,38 @@
from typing import List

from onnx import AttributeProto, TypeProto, TensorProto, SparseTensorProto, TensorShapeProto

class InferenceError(Exception): ...

class GraphInferencer:
# Impl in cpp (onnx/cpp2py_export.cc)
def __do_inferencing(self, input_types: List[bytes], input_data: List[bytes]) -> List[bytes]: ...
# Impl in py (onnx/shape_inference.py)
def do_inferencing(self, input_types: List[TypeProto], input_data: List[TensorProto]) -> List[TypeProto]: ...

class InferenceContext:
# Impl in cpp (onnx/cpp2py_export.cc)
def get_num_inputs(self) -> int: ...
def has_input(self, idx: int) -> bool: ...
def get_num_outputs(self) -> int: ...
def __get_attribute(self, name: str) -> bytes: ...
def __get_input_type(self, idx: int) -> bytes: ...
def __get_input_data(self, idx: int) -> bytes: ...
def __get_input_sparse_data(self, idx: int) -> bytes: ...
def __get_symbolic_input(self, idx: int) -> bytes: ...
def __get_graph_attribute_inferencer(self) -> GraphInferencer: ...
def __get_output_type(self, idx: int) -> bytes: ...
def __set_output_type(self, idx: int, output: bytes) -> None: ...
# Impl in py (onnx/shape_inference.py)
def get_attribute(self, name: str) -> AttributeProto: ...
def get_input_type(self, idx: int) -> TypeProto: ...
def get_input_data(self, idx: int) -> TensorProto: ...
def get_input_sparse_data(self, idx: int) -> SparseTensorProto: ...
def get_symbolic_input(self, idx: int) -> TensorShapeProto: ...
def get_graph_attribute_inferencer(self) -> GraphInferencer: ...
def get_output_type(self, idx: int) -> TypeProto: ...
def set_output_type(self, idx: int, output: TypeProto) -> None: ...

def infer_shapes(
b: bytes, check_type: bool, strict_mode: bool, data_prop: bool
) -> bytes: ...
53 changes: 52 additions & 1 deletion onnx/shape_inference.py
@@ -14,7 +14,58 @@

import onnx
import onnx.onnx_cpp2py_export.shape_inference as C # noqa: N812
from onnx import AttributeProto, FunctionProto, ModelProto, TypeProto
from onnx import (
AttributeProto,
FunctionProto,
ModelProto,
SparseTensorProto,
TensorProto,
TensorShapeProto,
TypeProto,
)

GraphInferencer = C.GraphInferencer


def _do_inferencing(
self, input_types: list[TypeProto], input_data: list[TensorProto]
) -> list[TypeProto]:
input_types_bytes = [proto.SerializeToString() for proto in input_types]
input_data_bytes = [proto.SerializeToString() for proto in input_data]
ret = self.__impl.__do_inferencing(input_types_bytes, input_data_bytes)

return [TypeProto.FromString(data) for data in ret]


GraphInferencer.do_inferencing = _do_inferencing # type: ignore


def _parse_to_proto(attr, proto_type):
def impl(self, *args, **kwargs):
data = getattr(self, attr)(*args, **kwargs)
return proto_type.FromString(data)

return impl


InferenceContext = C.InferenceContext
InferenceContext.get_attribute = _parse_to_proto("__get_attribute", AttributeProto) # type: ignore
InferenceContext.get_input_type = _parse_to_proto("__get_input_type", TypeProto) # type: ignore
InferenceContext.get_input_data = _parse_to_proto("__get_input_data", TensorProto) # type: ignore
InferenceContext.get_input_sparse_data = _parse_to_proto( # type: ignore
"__get_input_sparse_data", SparseTensorProto
)
InferenceContext.get_symbolic_input = _parse_to_proto( # type: ignore
"__get_symbolic_input", TensorShapeProto
)
InferenceContext.get_output_type = _parse_to_proto("__get_output_type", TypeProto) # type: ignore


def _op_set_output_type(self, idx: int, output: TypeProto):
data = output.SerializeToString()
self.__set_output_type(idx, data)


InferenceContext.set_output_type = _op_set_output_type # type: ignore
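To make the bridging pattern explicit, a small sketch (assuming `ctx` is an InferenceContext handed to a registered inference function): each public accessor calls the byte-returning C++ binding and parses the result into the corresponding proto class.

```python
# Roughly what ctx.get_attribute("out_len") does after the monkeypatching above:
raw = getattr(ctx, "__get_attribute")("out_len")  # serialized bytes from the C++ binding
attr = AttributeProto.FromString(raw)             # parsed back into a proto on the Python side
assert attr.ints == ctx.get_attribute("out_len").ints
```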


def infer_shapes(
97 changes: 97 additions & 0 deletions onnx/test/shape_inference_test.py
@@ -10172,6 +10172,103 @@ def test_check_type_when_schema_has_empty_io(self):
op_schema.name, op_schema.since_version, op_schema.domain
)

def test_custom_schema_shape_inference(self) -> None:
# CustomOp schema:
# attrs:
# out_len: [L0, L1, ...]
# inputs:
# a[N, La]
# b[N, Lb]
# outputs:
# out0[N, La * Lb, L0]
# out1[N, La * Lb, L1]
# ...
N = 3
La = 32
Lb = 64
out_len = [1, 2]
outs = [f"out{i}" for i in range(len(out_len))]
graph = self._make_graph(
[
("a", TensorProto.FLOAT, (N, La)),
("b", TensorProto.FLOAT, (N, Lb)),
],
[make_node("CustomOp", ["a", "b"], outs, out_len=out_len)],
[],
)
with self.assertRaises(onnx.checker.ValidationError):
self._assert_inferred(
graph,
[
make_tensor_value_info(
f"out{i}", TensorProto.FLOAT, (N, La * Lb, Li)
)
for i, Li in enumerate(out_len)
],
)

schema = OpSchema(
"CustomOp",
"",
1,
inputs=[
defs.OpSchema.FormalParameter("a", "float"),
defs.OpSchema.FormalParameter("b", "float"),
],
outputs=[
defs.OpSchema.FormalParameter(
"out", "float", param_option=OpSchema.FormalParameterOption.Variadic
),
],
attributes=[
defs.OpSchema.Attribute("out_len", defs.OpSchema.AttrType.INTS)
],
)

def func(ctx: onnx.shape_inference.InferenceContext):
def parse_tensor_input(t: TypeProto):
assert isinstance(t, TypeProto)
return (
t.tensor_type.elem_type,
[
d.dim_value if d.HasField("dim_value") else None
for d in t.tensor_type.shape.dim
],
)

assert ctx.get_num_inputs() == 2
in0 = ctx.get_input_type(0)
Contributor:

My concern with this is that it goes through serialization to access the type information, which is not really efficient. I would change the API so that it does not return a TypeProto but instead the type and the shape as regular Python objects.

Contributor:

I think I agree with Xavier, but I am a bit confused also. I see the method implementation serializes proto values to string and returns them. We could just return a pointer to the C++ Proto object (wrapped as a Python object). Is that your suggestion Xavier?

Contributor Author:

Should we closely mimic the C++ API design, or should we use Python's native types for interactions? Using the proto pointer for interactions may require additional code to bind it to Python (if there is another way, please correct me), or we would need to pull in a third-party library.

in1 = ctx.get_input_type(1)
in0_type, in0_shape = parse_tensor_input(in0)
in1_type, in1_shape = parse_tensor_input(in1)
assert in0_type == in1_type == TensorProto.FLOAT
assert len(in0_shape) == len(in1_shape) == 2
assert in0_shape[0] == in1_shape[0]
N, La = in0_shape
_, Lb = in1_shape
attr = ctx.get_attribute("out_len")
out_len = attr.ints
assert len(out_len) == ctx.get_num_outputs()
for i in range(ctx.get_num_outputs()):
out = ctx.get_output_type(i)
out.tensor_type.elem_type = in0_type
out.tensor_type.shape.dim.add().dim_value = N
out.tensor_type.shape.dim.add().dim_value = La * Lb
out.tensor_type.shape.dim.add().dim_value = out_len[i]
ctx.set_output_type(i, out)
Contributor:

Same comment here: we should avoid serialization with something like set_output_type_and_shape(in0_type, (N, La*Lb, out_len[i])). The type would be created on the C++ side, there would be no serialization, and it would be more efficient.
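To make that concrete, a hypothetical sketch of a serialization-free variant of `func` from the test above; `set_output_type_and_shape(index, elem_type, shape)` is assumed here and is not part of this PR, and `parse_tensor_input` is the helper defined inside `func`:

```python
# Hypothetical, serialization-free inference function (sketch only):
def func_no_serialization(ctx):
    elem_type, (n, la) = parse_tensor_input(ctx.get_input_type(0))
    _, (_, lb) = parse_tensor_input(ctx.get_input_type(1))
    out_len = ctx.get_attribute("out_len").ints
    for i, li in enumerate(out_len):
        # assumed signature: (output_index, elem_type, shape)
        ctx.set_output_type_and_shape(i, elem_type, (n, la * lb, li))
```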


schema.set_type_and_shape_inference_function(func)
onnx.defs.register_schema(schema)

self._assert_inferred(
graph,
[
make_tensor_value_info(f"out{i}", TensorProto.FLOAT, (N, La * Lb, Li))
for i, Li in enumerate(out_len)
],
)
onnx.defs.deregister_schema(schema.name, schema.since_version, schema.domain)


if __name__ == "__main__":
unittest.main()