5.6. 开发 Custom Operation
PopRT 支持用户开发自定义算子, 用于对 PopRT 做扩展.
典型的应用场景是: 用户有一个 ONNX 模型, 其中某个算子在 PopRT 中不支持, 此时用户就可以编写一个自定义算子, 并编译成动态链接库, PopRT 支持通过命令行的方式把这个自定义算子动态链接进 PopRT.
下面通过一个例子来描述为 PopRT 开发自定义算子的流程.
5.6.1. 编写自定义算子
由于 PopRT 是用 PopART 作为 backend, 因此为 PopRT 开发自定义算子的流程和 PopART 一致, 请参考 Creating Custom OP in PopART.
以名为 LeakyRelu
的自定义算子为例, 首先需要编写一个自定义算子的 C++ 代码:
1// Copyright (c) 2020 Graphcore Ltd. All rights reserved.
2
3// This example demonstrates how to create a custom operator for PopART, in this
4// case a Leaky ReLU op that returns `x` for any element `x >= 0` and `x *
5// alpha` for any element `x < 0`, where `alpha` is provided as a scalar
6// attribute to the operator.
7#include <popart/operatoridentifier.hpp>
8#include <popart/opmanager.hpp>
9#include <popart/opserialiser.hpp>
10#include <popart/popx/opxmanager.hpp>
11
12#include <popops/ElementWise.hpp>
13#include <popart/popx/opx.hpp>
14
15namespace CustomOperators {
16const popart::OperatorIdentifier LeakyReluId = {popart::Domain::ai_graphcore,
17 "LeakyRelu",
18 1};
19} // namespace CustomOperators
20
21class LeakyReluOp;
22class LeakyReluOpx;
23
24class LeakyReluOp : public popart::Op {
25public:
26 LeakyReluOp(const popart::OperatorIdentifier &_opid,
27 float _alpha,
28 const popart::Op::Settings &settings_)
29 : popart::Op(_opid, settings_), alpha(_alpha) {}
30
31 std::unique_ptr<Op> clone() const final {
32 return std::make_unique<LeakyReluOp>(*this);
33 }
34
35 void setup() final { outInfo(0) = inInfo(0); }
36
37 void appendAttributes(popart::OpSerialiserBase &os) const override {
38 Op::appendAttributes(os);
39 os.appendAttribute("alpha", getAlpha());
40 }
41
42 void appendOutlineAttributes(popart::OpSerialiserBase &os) const override {
43 Op::appendOutlineAttributes(os);
44 os.appendAttribute("alpha", getAlpha());
45 }
46
47 float getSubgraphValue() const final { return getHighSubgraphValue(); }
48
49 bool requiresRandomSeed() const override { return false; }
50
51 // Attributes
52 float getAlpha() const { return alpha; }
53
54private:
55 float alpha;
56};
57
58namespace {
59using popart::DataType;
60using popart::OpDefinition;
61
62static OpDefinition::DataTypes T = {DataType::FLOAT16, DataType::FLOAT};
63
64static OpDefinition
65 leakyReluOpDef({OpDefinition::Inputs({{"input", T}}),
66 OpDefinition::Outputs({{"output", T}}),
67 OpDefinition::Attributes({{"alpha", {"*"}}})});
68
69static popart::OpCreator<LeakyReluOp> leakyReluOpCreator(
70 popart::OpDefinitions({{CustomOperators::LeakyReluId, leakyReluOpDef}}),
71 [](const popart::OpCreatorInfo &info) {
72 // default alpha is 10**(-2)
73 float alpha = info.attributes.getAttribute<popart::Attributes::Float>(
74 "alpha", 1e-2f);
75 return std::make_unique<LeakyReluOp>(info.opid, alpha, info.settings);
76 },
77 true);
78} // namespace
79
80namespace pe = popops::expr;
81
82class LeakyReluOpx : public popart::popx::Opx {
83public:
84 LeakyReluOpx(popart::Op *op, popart::popx::Devicex *devicex)
85 : popart::popx::Opx(op, devicex) {
86 verifyOp<LeakyReluOp>(op, {CustomOperators::LeakyReluId});
87 }
88
89 void grow(poplar::program::Sequence &prog) const final {
90
91 auto op = getOp<LeakyReluOp>();
92
93 poplar::Tensor input = getInTensor(0);
94
95 float alpha = op.getAlpha();
96
97 // x < 0.0f ? alpha * x : x
98 auto expression = pe::Select(pe::Mul(pe::Const(alpha), pe::_1),
99 pe::_1,
100 pe::Lt(pe::_1, pe::Const(0.0f)));
101
102 popops::mapInPlace(graph(),
103 expression,
104 {input},
105 prog,
106 debugContext("LeakyRelu"),
107 poplar::OptionFlags());
108
109 setOutTensor(0, input);
110 }
111};
112
113static popart::popx::OpxCreator<LeakyReluOpx>
114 LeakyReluOpxCreator({CustomOperators::LeakyReluId});
Download leaky_relu_custom_op.cpp
编写 Makefile 并通过 make
命令生成 custom_ops.so
:
1CXX ?= g++
2CXXFLAGS = -std=c++14 -fPIC -g
3LDLIBS = -shared -lpopart
4ONNX_NAMESPACE = -DONNX_NAMESPACE=onnx
5
6BUILD_DIR = build
7SOURCES = leaky_relu_custom_op.cpp
8TARGET = $(BUILD_DIR)/custom_ops.so
9
10all: create_build_dir leaky_relu_custom_op
11
12.PHONY: create_build_dir
13create_build_dir:
14 mkdir -p $(BUILD_DIR)
15
16leaky_relu_custom_op: leaky_relu_custom_op.cpp
17 $(CXX) $(SOURCES) $(LDLIBS) $(CXXFLAGS) $(ONNX_NAMESPACE) -o $(TARGET)
18
19.PHONY: clean
20clean:
21 rm -rf $(BUILD_DIR)
编写自定义算子的 Shape-Inference 文件:
1# Copyright (c) 2022 Graphcore Ltd. All rights reserved.
2from typing import Tuple
3
4import onnx
5
6from poprt.passes.onnx_helper import get_dtype, get_shape
7from poprt.passes.shape_inference import ShapeInference, register
8
9
10@register(['LeakyRelu'])
11class LeakyRelu(ShapeInference):
12 """Function based on ONNX to infer the shape and dtype of Custom Op."""
13
14 def __init__(self) -> None:
15 super().__init__()
16
17 def __call__(
18 self,
19 model: onnx.ModelProto,
20 node: onnx.NodeProto,
21 ) -> Tuple[onnx.ModelProto, bool]:
22 graph = model.graph
23 input_name = node.input[0]
24 output_name = node.output[0]
25 # If the Op already has known shape and dtype of output, return True
26 if get_shape(model.graph, output_name) and get_dtype(model.graph, output_name):
27 return model, True
28
29 input_dtype = get_dtype(graph, input_name)
30 input_shape = get_shape(graph, input_name)
31 # If the Op is able to be inferred shape and dtype, return True
32 if input_dtype and input_shape and 0 not in input_shape:
33 # ![Shape-Inference Function begin]
34
35 # Step.1: Write the method following ONNX-Protobuf standard,
36 # to calc shape and dtype of output in terms of shape and dtype of input
37 # The LeakyRelu Op has same shape and dtype with input and output
38
39 # Step.2: Create new TensorProto with inferred shape and dtype of output
40 output_tensor = onnx.helper.make_tensor_value_info(
41 output_name, input_dtype, input_shape
42 )
43 # Step.3: Call update_value_info to update
44 model = self.update_value_info(model, output_tensor)
45 # Step.4: Call infer_shapes function
46 model = onnx.shape_inference.infer_shapes(model)
47 # ![Shape-Inference Function end]
48 return model, True
49 # If the Op is not able to be inferred, return False
50 else:
51 return model, False
Download custom_shape_inference.py
创建一个带有 LeakyRelu
OP 的 ONNX 模型文件
通过 Python3 运行以下测试代码生成用于测试的 ONNX 模型文件 custom_op_test.onnx
:
1# Copyright (c) 2022 Graphcore Ltd. All rights reserved.
2import argparse
3import os
4
5import onnx
6
7from onnx import helper
8
9
10def create_onnx_model_with_custom_op():
11 TensorProto = onnx.TensorProto
12
13 attributes = {"alpha": 0.01}
14 leaky_relu = helper.make_node(
15 "LeakyRelu", ["X"], ["Y"], domain="ai.graphcore", **attributes
16 )
17 relu = helper.make_node("Relu", ["Y"], ["Z"])
18
19 graph = helper.make_graph(
20 [leaky_relu, relu],
21 "custom_op_test",
22 [
23 helper.make_tensor_value_info("X", TensorProto.FLOAT, (8, 8)),
24 ],
25 [
26 helper.make_tensor_value_info("Z", TensorProto.FLOAT, (8, 8)),
27 ],
28 )
29 opset_imports = [helper.make_opsetid("", 11)]
30 model = helper.make_model(graph, opset_imports=opset_imports)
31 model.opset_import.append(onnx.helper.make_opsetid("ai.graphcore", 1))
32 return model
33
34
35if __name__ == '__main__':
36 parser = argparse.ArgumentParser(
37 description='Convert onnx model and run it on IPU.'
38 )
39 parser.add_argument(
40 '--output_dir',
41 type=str,
42 default='./',
43 help="Full path of the onnx model will be saved to.",
44 )
45 args = parser.parse_args()
46
47 if not os.path.isdir(args.output_dir):
48 raise ValueError("--output_dir should be an exist folder")
49
50 model_path = os.path.join(args.output_dir, 'custom_op_test.onnx')
51
52 model = create_onnx_model_with_custom_op()
53 onnx.save(model, model_path)
54
55 # Convert and Run
56 compile_cmd = "bash build.sh"
57 os.system(compile_cmd)
58 abs_path = os.path.abspath(os.path.dirname(__file__))
59 run_cmd = rf"""python -m poprt.cli \
60--input_model {model_path} \
61--custom_shape_inference {abs_path}/custom_shape_inference.py \
62--custom_library_so_paths {abs_path}/custom_ops.so \
63--run"""
64 os.system(run_cmd)
65 # 2022-12-30 07:01:54,408 INFO cli.py:446] Bs: 8
66 # 2022-12-30 07:01:54,408 INFO cli.py:449] Latency: 0.23ms
67 # 2022-12-30 07:01:54,408 INFO cli.py:450] Tput: 35469
在 PopRT 中使用自定义算子
可以通过 PopRT 的命令行 --custom_library_so_paths
来动态链接自定义算子的库文件, 并通过 --custom_shape_inference
来注册自定义算子的 Shape-Inference.
可以通过如下命令来执行上述生成的 ONNX 模型文件:
python -m poprt.cli \
--input_model custom_op_test.onnx \
--custom_library_so_paths custom_ops.so \
--custom_shape_inference custom_shape_inference.py \
--run