-
Notifications
You must be signed in to change notification settings - Fork 3.8k
[QNN] Requantize operator #3531
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from all commits
847dd52
ed11cd7
91b58a5
13fcc70
ac4dfdc
01cad3a
6405755
7a49bee
154e64f
324e75c
ffec47f
72436ff
9a721ad
fb9cece
be7101f
0a5642a
a9c1ce0
a0d0324
513b544
435ca27
e4f6a4e
10a20d3
927825d
48f5a52
1422f6d
66a4d76
99483c2
f8439e6
e756843
5d7938f
10ce99d
f2e09d1
65c0b46
8d2c3ad
2d15b54
ff17a91
c46b56c
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,71 @@ | ||
| /* | ||
| * Licensed to the Apache Software Foundation (ASF) under one | ||
| * or more contributor license agreements. See the NOTICE file | ||
| * distributed with this work for additional information | ||
| * regarding copyright ownership. The ASF licenses this file | ||
| * to you under the Apache License, Version 2.0 (the | ||
| * "License"); you may not use this file except in compliance | ||
| * with the License. You may obtain a copy of the License at | ||
| * | ||
| * http://www.apache.org/licenses/LICENSE-2.0 | ||
| * | ||
| * Unless required by applicable law or agreed to in writing, | ||
| * software distributed under the License is distributed on an | ||
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
| * KIND, either express or implied. See the License for the | ||
| * specific language governing permissions and limitations | ||
| * under the License. | ||
| */ | ||
|
|
||
| /*! | ||
| * \file tvm/relay/qnn/attrs.h | ||
| * \brief Auxiliary attributes for qnn operators. | ||
| */ | ||
| #ifndef TVM_RELAY_QNN_ATTRS_H_ | ||
| #define TVM_RELAY_QNN_ATTRS_H_ | ||
|
|
||
| #include <tvm/attrs.h> | ||
| #include <string> | ||
|
|
||
| namespace tvm { | ||
| namespace relay { | ||
| namespace qnn { | ||
|
|
||
| /*! | ||
| * \brief Attributes for the requantize operator. | ||
| * | ||
| * Carries the quantization parameters (scale and zero point) of the input | ||
| * and output tensors, the rounding mode and the output data type. | ||
| */ | ||
| struct RequantizeAttrs : public tvm::AttrsNode<RequantizeAttrs> { | ||
| /*! \brief The scale of the input tensor. */ | ||
| double input_scale; | ||
| /*! \brief The zero point of the input tensor. */ | ||
| int32_t input_zero_point; | ||
| /*! \brief The scale of the output tensor. */ | ||
| double output_scale; | ||
| /*! \brief The zero point of the output tensor. */ | ||
| int32_t output_zero_point; | ||
| /*! \brief Rounding mode applied at midpoints: "UPWARD" or "TONEAREST". */ | ||
| std::string rounding; | ||
| /*! \brief Output data type. */ | ||
| DataType out_dtype; | ||
|
|
||
| TVM_DECLARE_ATTRS(RequantizeAttrs, "relay.attrs.RequantizeAttrs") { | ||
| TVM_ATTR_FIELD(input_scale) | ||
| .describe("The scale of the input tensor."); | ||
| TVM_ATTR_FIELD(input_zero_point) | ||
| .describe("The zero point of the input tensor."); | ||
| TVM_ATTR_FIELD(output_scale) | ||
| .describe("The scale of the output tensor."); | ||
| TVM_ATTR_FIELD(output_zero_point) | ||
| .describe("The zero point of the output tensor."); | ||
| // Adjacent string literals are concatenated verbatim, so every fragment of | ||
| // the description except the last one must end with a space. | ||
| TVM_ATTR_FIELD(rounding).set_default("TONEAREST") | ||
|
Member
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Please double check the choice of enums "TONEAREST", are there existing API choices that are similar? I do not have preference but would be great to survey the related APIs should it be "TO_NEAREST"? (The TF API convention seems to be TO_NEAREST)
Contributor
Author
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I had similar question while coding this. I used TONEAREST because the supporting document - https://www.gnu.org/software/libc/manual/html_node/Rounding.html |
||
| .describe("Defines the rounding direction when the value is midway between " | ||
| "two representable values. There are two supported modes - UPWARD " | ||
| "or TONEAREST. Both modes behave exactly same except at the " | ||
| "midpoints between the two representable values. At the midpoint, " | ||
| "UPWARD rounds towards positive infinity (for example -1.5 will be " | ||
| "rounded to -1). TONEAREST is the standard rounding where the " | ||
| "value is rounded away from zero at midpoints (for example, -1.5 " | ||
| "rounds to -2). More context can be found at following glibc manual " | ||
| "https://www.gnu.org/software/libc/manual/html_node/Rounding.html."); | ||
| TVM_ATTR_FIELD(out_dtype) | ||
| .set_default(NullValue<DataType>()) | ||
| .describe("Output data type, set to explicit type under mixed precision setting"); | ||
| } | ||
| }; | ||
|
|
||
| } // namespace qnn | ||
| } // namespace relay | ||
| } // namespace tvm | ||
| #endif // TVM_RELAY_QNN_ATTRS_H_ | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,20 @@ | ||
| # Licensed to the Apache Software Foundation (ASF) under one | ||
| # or more contributor license agreements. See the NOTICE file | ||
| # distributed with this work for additional information | ||
| # regarding copyright ownership. The ASF licenses this file | ||
| # to you under the Apache License, Version 2.0 (the | ||
| # "License"); you may not use this file except in compliance | ||
| # with the License. You may obtain a copy of the License at | ||
| # | ||
| # http://www.apache.org/licenses/LICENSE-2.0 | ||
| # | ||
| # Unless required by applicable law or agreed to in writing, | ||
| # software distributed under the License is distributed on an | ||
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
| # KIND, either express or implied. See the License for the | ||
| # specific language governing permissions and limitations | ||
| # under the License. | ||
| # pylint: disable=wildcard-import | ||
| """QNN dialect operators and IR passes.""" | ||
| from __future__ import absolute_import as _abs | ||
| from . import op |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,20 @@ | ||
| # Licensed to the Apache Software Foundation (ASF) under one | ||
| # or more contributor license agreements. See the NOTICE file | ||
| # distributed with this work for additional information | ||
| # regarding copyright ownership. The ASF licenses this file | ||
| # to you under the Apache License, Version 2.0 (the | ||
| # "License"); you may not use this file except in compliance | ||
| # with the License. You may obtain a copy of the License at | ||
| # | ||
| # http://www.apache.org/licenses/LICENSE-2.0 | ||
| # | ||
| # Unless required by applicable law or agreed to in writing, | ||
| # software distributed under the License is distributed on an | ||
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
| # KIND, either express or implied. See the License for the | ||
| # specific language governing permissions and limitations | ||
| # under the License. | ||
| # pylint: disable=wildcard-import | ||
| """QNN dialect related operators.""" | ||
| from __future__ import absolute_import as _abs | ||
| from .qnn import * | ||
anijain2305 marked this conversation as resolved.
Show resolved
Hide resolved
|
||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,20 @@ | ||
| # Licensed to the Apache Software Foundation (ASF) under one | ||
| # or more contributor license agreements. See the NOTICE file | ||
| # distributed with this work for additional information | ||
| # regarding copyright ownership. The ASF licenses this file | ||
| # to you under the Apache License, Version 2.0 (the | ||
| # "License"); you may not use this file except in compliance | ||
| # with the License. You may obtain a copy of the License at | ||
| # | ||
| # http://www.apache.org/licenses/LICENSE-2.0 | ||
| # | ||
| # Unless required by applicable law or agreed to in writing, | ||
| # software distributed under the License is distributed on an | ||
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
| # KIND, either express or implied. See the License for the | ||
| # specific language governing permissions and limitations | ||
| # under the License. | ||
| """Constructor APIs""" | ||
| from ...._ffi.function import _init_api | ||
|
|
||
| # NOTE(review): presumably exposes the functions registered under the "relay.qnn.op._make" prefix as attributes of this module - confirm against _init_api. | ||
| _init_api("relay.qnn.op._make", __name__) |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,74 @@ | ||
| # Licensed to the Apache Software Foundation (ASF) under one | ||
| # or more contributor license agreements. See the NOTICE file | ||
| # distributed with this work for additional information | ||
| # regarding copyright ownership. The ASF licenses this file | ||
| # to you under the Apache License, Version 2.0 (the | ||
| # "License"); you may not use this file except in compliance | ||
| # with the License. You may obtain a copy of the License at | ||
| # | ||
| # http://www.apache.org/licenses/LICENSE-2.0 | ||
| # | ||
| # Unless required by applicable law or agreed to in writing, | ||
| # software distributed under the License is distributed on an | ||
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
| # KIND, either express or implied. See the License for the | ||
| # specific language governing permissions and limitations | ||
| # under the License. | ||
| #pylint: disable=invalid-name | ||
| """QNN dialect operators.""" | ||
anijain2305 marked this conversation as resolved.
Show resolved
Hide resolved
|
||
|
|
||
| from __future__ import absolute_import as _abs | ||
| from . import _make | ||
|
|
||
| def requantize(data, | ||
| input_scale, | ||
| input_zero_point, | ||
| output_scale, | ||
| output_zero_point, | ||
| rounding="TONEAREST", | ||
| out_dtype="int8"): | ||
| r"""Requantized operator. | ||
|
|
||
| The requantize operator converts one quantized tensor representation to | ||
| another quantized tensor representation. For the output tensor, we are | ||
| provided with output scale and zero point. The computation is as follows | ||
|
|
||
| Q_output = zp_output + (scale_input)/(scale_output) * (Q_input - zp_input) | ||
|
|
||
| Parameters | ||
| ---------- | ||
| data : tvm.relay.Expr | ||
| The input data to the operator. | ||
anijain2305 marked this conversation as resolved.
Show resolved
Hide resolved
|
||
|
|
||
| input_scale: float | ||
| The quantization scale for the input tensor. | ||
|
|
||
| input_zero_point: int | ||
| The zero point of the input tensor. | ||
|
|
||
| output_scale: float | ||
| The quantization scale for the output tensor. | ||
|
|
||
| output_zero_point: int | ||
| The zero point of the output tensor. | ||
|
|
||
| rounding : string, optional | ||
| Defines the rounding direction when the value is midway between two | ||
| representable values. | ||
|
|
||
| out_dtype : str, optional | ||
| Specifies the output data type. | ||
|
|
||
| Returns | ||
| ------- | ||
| result : tvm.relay.Expr | ||
| The computed result. | ||
| """ | ||
|
|
||
| return _make.requantize(data, | ||
| input_scale, | ||
| input_zero_point, | ||
| output_scale, | ||
| output_zero_point, | ||
| rounding, | ||
| out_dtype) | ||
Uh oh!
There was an error while loading. Please reload this page.