forked from pytorch/pytorch
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathQScheme.h
50 lines (44 loc) · 1.53 KB
/
QScheme.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
#pragma once
#include <c10/util/Exception.h>
#include <cstdint>
#include <string>
namespace c10 {
/**
 * QScheme identifies the kind of quantization that is in use.
 *
 * Each scheme has a one-to-one correspondence with a Quantizer; see
 * ATen/quantized/Quantizer.h for the Quantizer classes.
 *
 * The numeric values are spelled out explicitly because this list has to be
 * kept in sync with torch/nn/_qscheme.py.
 */
enum class QScheme : std::uint8_t {
  PER_TENSOR_AFFINE = 0,
  PER_CHANNEL_AFFINE = 1,
  PER_TENSOR_SYMMETRIC = 2,
  PER_CHANNEL_SYMMETRIC = 3,
  PER_CHANNEL_AFFINE_FLOAT_QPARAMS = 4,
  // Sentinel: equals the number of schemes listed above. It is not a scheme
  // itself and must remain the last enumerator.
  COMPILE_TIME_NUM_QSCHEMES = 5,
};
constexpr auto kPerTensorAffine = QScheme::PER_TENSOR_AFFINE;
constexpr auto kPerChannelAffine = QScheme::PER_CHANNEL_AFFINE;
constexpr auto kPerTensorSymmetric = QScheme::PER_TENSOR_SYMMETRIC;
constexpr auto kPerChannelSymmetric = QScheme::PER_CHANNEL_SYMMETRIC;
constexpr auto kPerChannelAffineFloatQParams =
QScheme::PER_CHANNEL_AFFINE_FLOAT_QPARAMS;
constexpr int COMPILE_TIME_NUM_QSCHEMES =
static_cast<int>(QScheme::COMPILE_TIME_NUM_QSCHEMES);
/**
 * Returns the lower-case textual name of a quantization scheme.
 *
 * @param qscheme The scheme to describe.
 * @return The snake_case name, e.g. "per_tensor_affine" for
 *         QScheme::PER_TENSOR_AFFINE.
 *
 * Any value that is not one of the five named schemes (including the
 * COMPILE_TIME_NUM_QSCHEMES sentinel) is reported through TORCH_CHECK with
 * the message "Unrecognized qscheme: <numeric value>".
 */
inline std::string toString(QScheme qscheme) {
  switch (qscheme) {
    case QScheme::PER_TENSOR_AFFINE:
      return "per_tensor_affine";
    case QScheme::PER_CHANNEL_AFFINE:
      return "per_channel_affine";
    case QScheme::PER_TENSOR_SYMMETRIC:
      return "per_tensor_symmetric";
    case QScheme::PER_CHANNEL_SYMMETRIC:
      return "per_channel_symmetric";
    case QScheme::PER_CHANNEL_AFFINE_FLOAT_QPARAMS:
      return "per_channel_affine_float_qparams";
    // The sentinel is not a real scheme; it is handled like any other
    // unknown value.
    case QScheme::COMPILE_TIME_NUM_QSCHEMES:
    default:
      TORCH_CHECK(false, "Unrecognized qscheme: ", static_cast<int>(qscheme));
  }
}
} // namespace c10