- 
                Notifications
    You must be signed in to change notification settings 
- Fork 3.7k
[QNN] Requantize operator #3531
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from all commits
847dd52
              ed11cd7
              91b58a5
              13fcc70
              ac4dfdc
              01cad3a
              6405755
              7a49bee
              154e64f
              324e75c
              ffec47f
              72436ff
              9a721ad
              fb9cece
              be7101f
              0a5642a
              a9c1ce0
              a0d0324
              513b544
              435ca27
              e4f6a4e
              10a20d3
              927825d
              48f5a52
              1422f6d
              66a4d76
              99483c2
              f8439e6
              e756843
              5d7938f
              10ce99d
              f2e09d1
              65c0b46
              8d2c3ad
              2d15b54
              ff17a91
              c46b56c
              File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change | 
|---|---|---|
| @@ -0,0 +1,71 @@ | ||
| /* | ||
| * Licensed to the Apache Software Foundation (ASF) under one | ||
| * or more contributor license agreements. See the NOTICE file | ||
| * distributed with this work for additional information | ||
| * regarding copyright ownership. The ASF licenses this file | ||
| * to you under the Apache License, Version 2.0 (the | ||
| * "License"); you may not use this file except in compliance | ||
| * with the License. You may obtain a copy of the License at | ||
| * | ||
| * http://www.apache.org/licenses/LICENSE-2.0 | ||
| * | ||
| * Unless required by applicable law or agreed to in writing, | ||
| * software distributed under the License is distributed on an | ||
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
| * KIND, either express or implied. See the License for the | ||
| * specific language governing permissions and limitations | ||
| * under the License. | ||
| */ | ||
|  | ||
| /*! | ||
| * \file tvm/relay/qnn/attrs.h | ||
| * \brief Auxiliary attributes for qnn operators. | ||
| */ | ||
| #ifndef TVM_RELAY_QNN_ATTRS_H_ | ||
| #define TVM_RELAY_QNN_ATTRS_H_ | ||
|  | ||
| #include <tvm/attrs.h> | ||
| #include <string> | ||
|  | ||
| namespace tvm { | ||
| namespace relay { | ||
| namespace qnn { | ||
|  | ||
| /*! \brief Attribute for requantize operator */ | ||
| struct RequantizeAttrs : public tvm::AttrsNode<RequantizeAttrs> { | ||
| double input_scale; | ||
| int32_t input_zero_point; | ||
| double output_scale; | ||
| int32_t output_zero_point; | ||
| std::string rounding; | ||
| DataType out_dtype; | ||
|  | ||
| TVM_DECLARE_ATTRS(RequantizeAttrs, "relay.attrs.RequantizeAttrs") { | ||
| TVM_ATTR_FIELD(input_scale) | ||
| .describe("The scale of the input tensor."); | ||
| TVM_ATTR_FIELD(input_zero_point) | ||
| .describe("The zero point of the input tensor."); | ||
| TVM_ATTR_FIELD(output_scale) | ||
| .describe("The scale of the output tensor."); | ||
| TVM_ATTR_FIELD(output_zero_point) | ||
| .describe("The zero point of the output tensor."); | ||
| TVM_ATTR_FIELD(rounding).set_default("TONEAREST") | ||
| There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Please double check the choice of enums "TONEAREST", are there existing API choices that are similar? I do not have preference but would be great to survey the related APIs should it be "TO_NEAREST"? (The TF API convention seems to be TO_NEAREST) There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I had similar question while coding this. I used TONEAREST because the supporting document - https://www.gnu.org/software/libc/manual/html_node/Rounding.html | ||
| .describe("Defines the rounding direction when the value is midway between" | ||
| "two representable values. There are two supported modes - UPWARD" | ||
| "or TONEAREST. Both modes behave exactly same except at the" | ||
| "midpoints between the two representable values. At the midpoint," | ||
| "UPWARD rounds towards positive infinity (for example -1.5 will be" | ||
| "rounded to -1). TONEAREST is the standard rounding where the" | ||
| "value is rounded away from zero at midpoints (for example, -1.5" | ||
| "rounds to -2). More context can be found at following gblic manual" | ||
| "https://www.gnu.org/software/libc/manual/html_node/Rounding.html."); | ||
| TVM_ATTR_FIELD(out_dtype) | ||
| .set_default(NullValue<DataType>()) | ||
| .describe("Output data type, set to explicit type under mixed precision setting"); | ||
| } | ||
| }; | ||
|  | ||
| } // namespace qnn | ||
| } // namespace relay | ||
| } // namespace tvm | ||
| #endif // TVM_RELAY_QNN_ATTRS_H_ | ||
| Original file line number | Diff line number | Diff line change | 
|---|---|---|
| @@ -0,0 +1,20 @@ | ||
| # Licensed to the Apache Software Foundation (ASF) under one | ||
| # or more contributor license agreements. See the NOTICE file | ||
| # distributed with this work for additional information | ||
| # regarding copyright ownership. The ASF licenses this file | ||
| # to you under the Apache License, Version 2.0 (the | ||
| # "License"); you may not use this file except in compliance | ||
| # with the License. You may obtain a copy of the License at | ||
| # | ||
| # http://www.apache.org/licenses/LICENSE-2.0 | ||
| # | ||
| # Unless required by applicable law or agreed to in writing, | ||
| # software distributed under the License is distributed on an | ||
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
| # KIND, either express or implied. See the License for the | ||
| # specific language governing permissions and limitations | ||
| # under the License. | ||
| # pylint: disable=wildcard-import | ||
| """QNN dialect operators and IR passes.""" | ||
| from __future__ import absolute_import as _abs | ||
| from . import op | 
| Original file line number | Diff line number | Diff line change | 
|---|---|---|
| @@ -0,0 +1,20 @@ | ||
| # Licensed to the Apache Software Foundation (ASF) under one | ||
| # or more contributor license agreements. See the NOTICE file | ||
| # distributed with this work for additional information | ||
| # regarding copyright ownership. The ASF licenses this file | ||
| # to you under the Apache License, Version 2.0 (the | ||
| # "License"); you may not use this file except in compliance | ||
| # with the License. You may obtain a copy of the License at | ||
| # | ||
| # http://www.apache.org/licenses/LICENSE-2.0 | ||
| # | ||
| # Unless required by applicable law or agreed to in writing, | ||
| # software distributed under the License is distributed on an | ||
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
| # KIND, either express or implied. See the License for the | ||
| # specific language governing permissions and limitations | ||
| # under the License. | ||
| # pylint: disable=wildcard-import | ||
| """Neural network related operators.""" | ||
| from __future__ import absolute_import as _abs | ||
| from .qnn import * | ||
|         
                  anijain2305 marked this conversation as resolved.
              Show resolved
            Hide resolved | ||
| Original file line number | Diff line number | Diff line change | 
|---|---|---|
| @@ -0,0 +1,20 @@ | ||
| # Licensed to the Apache Software Foundation (ASF) under one | ||
| # or more contributor license agreements. See the NOTICE file | ||
| # distributed with this work for additional information | ||
| # regarding copyright ownership. The ASF licenses this file | ||
| # to you under the Apache License, Version 2.0 (the | ||
| # "License"); you may not use this file except in compliance | ||
| # with the License. You may obtain a copy of the License at | ||
| # | ||
| # http://www.apache.org/licenses/LICENSE-2.0 | ||
| # | ||
| # Unless required by applicable law or agreed to in writing, | ||
| # software distributed under the License is distributed on an | ||
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
| # KIND, either express or implied. See the License for the | ||
| # specific language governing permissions and limitations | ||
| # under the License. | ||
| """Constructor APIs""" | ||
| from ...._ffi.function import _init_api | ||
|  | ||
| _init_api("relay.qnn.op._make", __name__) | 
| Original file line number | Diff line number | Diff line change | 
|---|---|---|
| @@ -0,0 +1,74 @@ | ||
| # Licensed to the Apache Software Foundation (ASF) under one | ||
| # or more contributor license agreements. See the NOTICE file | ||
| # distributed with this work for additional information | ||
| # regarding copyright ownership. The ASF licenses this file | ||
| # to you under the Apache License, Version 2.0 (the | ||
| # "License"); you may not use this file except in compliance | ||
| # with the License. You may obtain a copy of the License at | ||
| # | ||
| # http://www.apache.org/licenses/LICENSE-2.0 | ||
| # | ||
| # Unless required by applicable law or agreed to in writing, | ||
| # software distributed under the License is distributed on an | ||
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
| # KIND, either express or implied. See the License for the | ||
| # specific language governing permissions and limitations | ||
| # under the License. | ||
| #pylint: disable=invalid-name | ||
| """QNN dialect operators.""" | ||
|         
                  anijain2305 marked this conversation as resolved.
              Show resolved
            Hide resolved | ||
|  | ||
| from __future__ import absolute_import as _abs | ||
| from . import _make | ||
|  | ||
def requantize(data,
               input_scale,
               input_zero_point,
               output_scale,
               output_zero_point,
               rounding="TONEAREST",
               out_dtype="int8"):
    r"""Re-express a quantized tensor with a new scale and zero point.

    Given a tensor quantized with (input_scale, input_zero_point), build the
    operator that yields the same values quantized with
    (output_scale, output_zero_point):

        Q_output = zp_output + (scale_input)/(scale_output) * (Q_input - zp_input)

    Parameters
    ----------
    data : tvm.relay.Expr
        The quantized input expression.

    input_scale : float
        Quantization scale of the input tensor.

    input_zero_point : int
        Zero point of the input tensor.

    output_scale : float
        Quantization scale of the output tensor.

    output_zero_point : int
        Zero point of the output tensor.

    rounding : string, optional
        How a value exactly midway between two representable values is
        rounded. The operator attributes describe two modes: "UPWARD"
        (midpoints go towards positive infinity) and "TONEAREST"
        (midpoints go away from zero).

    out_dtype : str, optional
        Data type of the output tensor.

    Returns
    -------
    result : tvm.relay.Expr
        The requantized expression.
    """
    # Arguments are forwarded positionally, in the order the constructor expects.
    call_args = (
        data,
        input_scale,
        input_zero_point,
        output_scale,
        output_zero_point,
        rounding,
        out_dtype,
    )
    return _make.requantize(*call_args)
Uh oh!
There was an error while loading. Please reload this page.