pytorch/caffe2/quantization/server/quantization_error_minimization.h

#pragma once

#include "caffe2/quantization/server/dnnlowp.h"

namespace dnnlowp {

/**
 * Abstract interface for strategies that derive TensorQuantizationParams
 * from a Histogram.
 *
 * Concrete strategies implement ChooseQuantizationParams().
 */
class QuantizationErrorMinimization {
 public:
  /**
   * Selects quantization parameters for the data summarized by @p hist.
   *
   * @param hist histogram the parameters are chosen from.
   * @param preserve_sparsity strategy-specific flag; defaults to false in
   *        this declaration.
   * @param precision defaults to 8 (presumably the target bit width --
   *        confirm against the implementations).
   * @return the chosen quantization parameters.
   *
   * NOTE: default arguments of a virtual function are taken from the static
   * type used at the call site, not from the dynamic type. An override that
   * declares different defaults (P99 does so for preserve_sparsity) will
   * therefore see different values depending on whether it is called through
   * this interface or through the derived type. Pass the arguments
   * explicitly when that matters.
   */
  virtual TensorQuantizationParams ChooseQuantizationParams(
      const Histogram& hist,
      bool preserve_sparsity = false,
      int precision = 8) = 0;

  /** Virtual so that deleting through a base pointer is well-defined. */
  virtual ~QuantizationErrorMinimization() = default;
};

/**
 * QuantizationErrorMinimization strategy configured with a Kind (L1 or L2)
 * that is fixed at construction and stored in kind_.
 *
 * Presumably Kind names the error norm being minimized -- confirm against
 * the implementation file.
 */
class NormMinimization : public QuantizationErrorMinimization {
 public:
  /** Selector stored by the constructor. */
  enum Kind {
    L1,
    L2,
  };

  /** Stores @p kind for later use by the search routines. */
  NormMinimization(Kind kind) : kind_{kind} {}

  /**
   * Implementation of the QuantizationErrorMinimization interface.
   *
   * @param hist histogram the parameters are chosen from.
   * @param preserve_sparsity defaults to false.
   * @param precision defaults to 8.
   */
  TensorQuantizationParams ChooseQuantizationParams(
      const Histogram& hist,
      bool preserve_sparsity = false,
      int precision = 8) override;

  /**
   * Faster approximate search.
   *
   * Non-virtual; takes the same parameters and defaults as
   * ChooseQuantizationParams().
   */
  TensorQuantizationParams NonlinearQuantizationParamsSearch(
      const Histogram& hist,
      bool preserve_sparsity = false,
      int precision = 8);

 protected:
  /** Kind supplied at construction; accessible to derived classes. */
  Kind kind_;
};

class L1ErrorMinimization : public NormMinimization {
 public:
  L1ErrorMinimization() : NormMinimization(L1) {}
};

/**
 * QuantizationErrorMinimization strategy configured with a single float
 * threshold.
 *
 * Presumably the threshold is the fraction of the histogram to retain when
 * choosing the range -- confirm against the implementation file.
 */
class P99 : public QuantizationErrorMinimization {
 public:
  /**
   * @param p99_threshold value stored in threshold_; defaults to 0.99.
   */
  P99(float p99_threshold = 0.99) : threshold_{p99_threshold} {}

  /**
   * Implementation of the QuantizationErrorMinimization interface.
   *
   * NOTE: preserve_sparsity defaults to true in this declaration, whereas
   * the base-class declaration defaults it to false. Default arguments are
   * picked from the static type at the call site, so a call through a
   * QuantizationErrorMinimization pointer or reference that omits the
   * argument passes false, while a call on a P99 object passes true.
   *
   * @param hist histogram the parameters are chosen from.
   * @param preserve_sparsity defaults to true (see note above).
   * @param precision defaults to 8.
   */
  TensorQuantizationParams ChooseQuantizationParams(
      const Histogram& hist,
      bool preserve_sparsity = true,
      int precision = 8) override;

  /** Threshold given to the constructor. Public data member. */
  float threshold_;
}; // class P99

} // namespace dnnlowp
Migrate dnnlowp code to open source directory (#13500) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/13500 This diff migrate dnnlowp related files and operators from deeplearning/quantization/caffe2 and deeplearning/quantization/dnnlowp to the open source directory. Reviewed By: jspark1105 Differential Revision: D10842192 fbshipit-source-id: 53d0666d0ae47a01db9c48114345d746b0a4f11f 2018-11-02 16:32:30 +00:00			`#pragma once`

Remove AutoHeaders.RECURSIVE_GLOB from caffe2/ (#73227) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/73227 Reviewed By: christycylee Differential Revision: D34016914 fbshipit-source-id: 277937f3c13a54ea1180afac253ee9927e56e99e (cherry picked from commit d97777318170a406d89755e577386cde857dd59b) 2022-03-01 18:57:26 +00:00			`#include "caffe2/quantization/server/dnnlowp.h"`
Migrate dnnlowp code to open source directory (#13500) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/13500 This diff migrate dnnlowp related files and operators from deeplearning/quantization/caffe2 and deeplearning/quantization/dnnlowp to the open source directory. Reviewed By: jspark1105 Differential Revision: D10842192 fbshipit-source-id: 53d0666d0ae47a01db9c48114345d746b0a4f11f 2018-11-02 16:32:30 +00:00
			`namespace dnnlowp {`

			`class QuantizationErrorMinimization {`
			`public:`
			`virtual TensorQuantizationParams ChooseQuantizationParams(`
clang-format (#14160) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/14160 clang-format of C++ files Reviewed By: hx89 Differential Revision: D13115201 fbshipit-source-id: d2ad65f66209e00578ef90f87f41272de2d24aa9 2018-11-20 08:53:29 +00:00			`const Histogram& hist,`
			`bool preserve_sparsity = false,`
			`int precision = 8) = 0;`
			`virtual ~QuantizationErrorMinimization(){};`
Migrate dnnlowp code to open source directory (#13500) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/13500 This diff migrate dnnlowp related files and operators from deeplearning/quantization/caffe2 and deeplearning/quantization/dnnlowp to the open source directory. Reviewed By: jspark1105 Differential Revision: D10842192 fbshipit-source-id: 53d0666d0ae47a01db9c48114345d746b0a4f11f 2018-11-02 16:32:30 +00:00			`};`

			`class NormMinimization : public QuantizationErrorMinimization {`
			`public:`
			`enum Kind {`
			`L1,`
			`L2,`
			`};`

			`NormMinimization(Kind kind) : kind_(kind) {}`

			`/**`
			`* Faster approximate search`
			`*/`
			`TensorQuantizationParams NonlinearQuantizationParamsSearch(`
clang-format (#14160) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/14160 clang-format of C++ files Reviewed By: hx89 Differential Revision: D13115201 fbshipit-source-id: d2ad65f66209e00578ef90f87f41272de2d24aa9 2018-11-20 08:53:29 +00:00			`const Histogram& hist,`
			`bool preserve_sparsity = false,`
			`int precision = 8);`
Migrate dnnlowp code to open source directory (#13500) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/13500 This diff migrate dnnlowp related files and operators from deeplearning/quantization/caffe2 and deeplearning/quantization/dnnlowp to the open source directory. Reviewed By: jspark1105 Differential Revision: D10842192 fbshipit-source-id: 53d0666d0ae47a01db9c48114345d746b0a4f11f 2018-11-02 16:32:30 +00:00
			`TensorQuantizationParams ChooseQuantizationParams(`
clang-format (#14160) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/14160 clang-format of C++ files Reviewed By: hx89 Differential Revision: D13115201 fbshipit-source-id: d2ad65f66209e00578ef90f87f41272de2d24aa9 2018-11-20 08:53:29 +00:00			`const Histogram& hist,`
			`bool preserve_sparsity = false,`
			`int precision = 8) override;`
Migrate dnnlowp code to open source directory (#13500) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/13500 This diff migrate dnnlowp related files and operators from deeplearning/quantization/caffe2 and deeplearning/quantization/dnnlowp to the open source directory. Reviewed By: jspark1105 Differential Revision: D10842192 fbshipit-source-id: 53d0666d0ae47a01db9c48114345d746b0a4f11f 2018-11-02 16:32:30 +00:00
			`protected:`
			`Kind kind_;`
			`};`

			`class L1ErrorMinimization : public NormMinimization {`
			`public:`
			`L1ErrorMinimization() : NormMinimization(L1) {}`
			`};`

			`class P99 : public QuantizationErrorMinimization {`
			`public:`
Add P99 method with configurable thresholds Summary: Update the P99 quantization method with configurable thresholds. Add dnnlowp options for the configuration. Test Plan: buck run mode/opt experimental/summerdeng/xray_image:test_net_quantization -- --model_path=/mnt/public/summerdeng/xray_image/models/oct_resnext101_50_2B_pretrained.mdl --batch_size=1 --test_max_images=100 --octave_conv --octave_conv_ratio=0.5 --output_dir=/mnt/public/summerdeng/xray_image/output --quantize --histogram_file=/mnt/public/summerdeng/xray_image/activation_histograms/oct_resnext101_50_2B_pretrained_hist_200k_compiled.txt --int8_model_type="mdl" --int8_model_mdl_name="int8_oct_resnext101_50_2B_l2_nongroupwise.mdl" --skip_first_conv --weight_quant="l2" --activation_quant="p99" --activation_p99_threshold=0.999 --measure_quantization_error Reviewed By: amylittleyang Differential Revision: D16626158 fbshipit-source-id: 7718dcf429f73aa54e82a6b6f6e631d94e3a134c 2019-09-27 22:51:34 +00:00			`float threshold_;`
			`P99(float p99_threshold = 0.99) : threshold_(p99_threshold) {}`
Migrate dnnlowp code to open source directory (#13500) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/13500 This diff migrate dnnlowp related files and operators from deeplearning/quantization/caffe2 and deeplearning/quantization/dnnlowp to the open source directory. Reviewed By: jspark1105 Differential Revision: D10842192 fbshipit-source-id: 53d0666d0ae47a01db9c48114345d746b0a4f11f 2018-11-02 16:32:30 +00:00			`TensorQuantizationParams ChooseQuantizationParams(`
clang-format (#14160) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/14160 clang-format of C++ files Reviewed By: hx89 Differential Revision: D13115201 fbshipit-source-id: d2ad65f66209e00578ef90f87f41272de2d24aa9 2018-11-20 08:53:29 +00:00			`const Histogram& hist,`
			`bool preserve_sparsity = true,`
			`int precision = 8) override;`
Migrate dnnlowp code to open source directory (#13500) Summary: Pull Request resolved: https://github.com/pytorch/pytorch/pull/13500 This diff migrate dnnlowp related files and operators from deeplearning/quantization/caffe2 and deeplearning/quantization/dnnlowp to the open source directory. Reviewed By: jspark1105 Differential Revision: D10842192 fbshipit-source-id: 53d0666d0ae47a01db9c48114345d746b0a4f11f 2018-11-02 16:32:30 +00:00			`}; // class P99QuantizationFactory`

			`} // namespace dnnlowp`