2021.3/ngraph_cpp_api/fake__quantize_8hpp_source.html

 //*****************************************************************************

 // Copyright 2017-2021 Intel Corporation

 //

 // Licensed under the Apache License, Version 2.0 (the "License");

 // you may not use this file except in compliance with the License.

 // You may obtain a copy of the License at

 //

 //     http://www.apache.org/licenses/LICENSE-2.0

 //

 // Unless required by applicable law or agreed to in writing, software

 // distributed under the License is distributed on an "AS IS" BASIS,

 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 // See the License for the specific language governing permissions and

 // limitations under the License.

 //*****************************************************************************


 #pragma once


 #include "ngraph/node.hpp"

 #include "ngraph/op/util/attr_types.hpp"

 #include "ngraph/op/util/fused_op.hpp"


 NGRAPH_SUPPRESS_DEPRECATED_START


 namespace ngraph

 {

     namespace op

     {

         namespace v0

         {

             ///

             /// \brief      Class performing element-wise linear quantization.

             ///

             /// \note       Input floating point values are quantized into a discrete

             ///             set of floating point values.

             ///

             /// \paragraph Implementation This class creates a node which performs the following

             ///            operation:

             ///

             ///            round((data - input_low) / (input_high - input_low) * (levels-1)) /

             ///                 (levels-1) * (output_high - output_low) + output_low

             ///

             ///

             class NGRAPH_API FakeQuantize : public ngraph::op::Op

             {

             public:

                 NGRAPH_RTTI_DECLARATION;


                 FakeQuantize();

                 ///

                 /// \brief      Constructs a FakeQuantize operation node.

                 ///

                 /// \param[in]  data            The input data tensor.

                 /// \param[in]  input_low       The minimum limit for input values.

                 /// \param[in]  input_high      The maximum limit for input values.

                 /// \param[in]  output_low      The minimum quantized value.

                 /// \param[in]  output_high     The maximum quantized value.

                 /// \param[in]  levels          The number of quantization levels.

                 /// \param[in]  auto_broadcast  AutoBroadcast mode to be used for broadcasting

                 ///                             limit values

                 ///

                 FakeQuantize(const Output<Node>& data,

                              const Output<Node>& input_low,

                              const Output<Node>& input_high,

                              const Output<Node>& output_low,

                              const Output<Node>& output_high,

                              std::size_t levels,

                              const AutoBroadcastSpec& auto_broadcast =

                                  AutoBroadcastSpec(AutoBroadcastType::NUMPY));


                 bool visit_attributes(AttributeVisitor& visitor) override;

                 virtual void validate_and_infer_types() override;


                 virtual std::shared_ptr<Node>

                     clone_with_new_inputs(const OutputVector& new_args) const override;


                 std::size_t get_levels() const { return m_levels; }

                 void set_levels(std::size_t levels) { m_levels = levels; }

                 const AutoBroadcastSpec& get_auto_broadcast() const { return m_auto_broadcast; }

                 void set_auto_broadcast(const AutoBroadcastSpec& auto_broadcast)

                 {

                     m_auto_broadcast = auto_broadcast;

                 }


             private:

                 std::size_t m_levels;

                 AutoBroadcastSpec m_auto_broadcast = op::AutoBroadcastType::NUMPY;

             };

         }

         using v0::FakeQuantize;

     }

 }


 NGRAPH_SUPPRESS_DEPRECATED_END

ngraph::AttributeVisitor
Visits the attributes of a node, primarily for serialization-like tasks.
Definition: attribute_visitor.hpp:71

ngraph::Output< Node >
A handle for one of a node's outputs.
Definition: node_output.hpp:42

ngraph::op::Op
Root of all actual ops.
Definition: op.hpp:29

ngraph::op::v0::FakeQuantize
Class performing element-wise linear quantization.
Definition: fake_quantize.hpp:45

ngraph::op::v0::FakeQuantize::FakeQuantize
FakeQuantize(const Output< Node > &data, const Output< Node > &input_low, const Output< Node > &input_high, const Output< Node > &output_low, const Output< Node > &output_high, std::size_t levels, const AutoBroadcastSpec &auto_broadcast=AutoBroadcastSpec(AutoBroadcastType::NUMPY))
Constructs a FakeQuantize operation node.

ngraph::op::v0::FakeQuantize::validate_and_infer_types
virtual void validate_and_infer_types() override
Verifies that attributes and inputs are consistent and computes output shapes and element types....

ngraph
The Intel nGraph C++ API.
Definition: attribute_adapter.hpp:28

ngraph::op::AutoBroadcastSpec
Implicit broadcast specification.
Definition: attr_types.hpp:323