summary refs log tree commit diff stats
diff options
context:
space:
mode:
author Feng Liu <fengliuai@google.com> 2019-07-18 11:25:53 -0700
committer Mehdi Amini <joker.eph@gmail.com> 2019-07-19 11:39:54 -0700
commit 701266c47abab7180d36ae174f19d76a113a77a4 (patch)
tree 697c3673664e24484f80ba7a58fdc74c68c1531a
parent 90b5a381ce1ae04c4d67071c1098c946848cb342 (diff)
download bcm5719-llvm-701266c47abab7180d36ae174f19d76a113a77a4.tar.gz
bcm5719-llvm-701266c47abab7180d36ae174f19d76a113a77a4.zip
Add an "is_signed" attribute to the quant_ConstFakeQuant op
Some TensorFlow simulated quantize ops, such as QuantizeAndDequantizeV2Op, have an attribute for the sign of the quantization, so quant_ConstFakeQuant should be able to represent it; a new "is_signed" attribute is added for this purpose. The method for converting these attributes to a QuantizedType is updated to handle this new argument. PiperOrigin-RevId: 258810290
-rw-r--r-- mlir/include/mlir/Dialect/QuantOps/QuantOps.td | 4
-rw-r--r-- mlir/lib/Dialect/QuantOps/Transforms/ConvertSimQuant.cpp | 2
-rw-r--r-- mlir/lib/Dialect/QuantOps/Utils/FakeQuantSupport.cpp | 12
-rw-r--r-- mlir/test/Dialect/QuantOps/convert-fakequant.mlir | 47
4 files changed, 59 insertions, 6 deletions
diff --git a/mlir/include/mlir/Dialect/QuantOps/QuantOps.td b/mlir/include/mlir/Dialect/QuantOps/QuantOps.td
index c76ad2d32cc..394d3a18ced 100644
--- a/mlir/include/mlir/Dialect/QuantOps/QuantOps.td
+++ b/mlir/include/mlir/Dialect/QuantOps/QuantOps.td
@@ -122,7 +122,9 @@ def quant_ConstFakeQuant : quant_Op<"const_fake_quant",
// The bitwidth of the quantization; between 2 and 16, inclusive.
I64Attr:$num_bits,
// Quantization range starts from 0 or 1; starts from 1 if true.
- DefaultValuedAttr<BoolAttr, "false">:$narrow_range
+ DefaultValuedAttr<BoolAttr, "false">:$narrow_range,
+ // Whether the quantized storage is signed; unsigned if false (the default).
+ DefaultValuedAttr<BoolAttr, "false">:$is_signed
);
let results = (outs
diff --git a/mlir/lib/Dialect/QuantOps/Transforms/ConvertSimQuant.cpp b/mlir/lib/Dialect/QuantOps/Transforms/ConvertSimQuant.cpp
index 0c93146a232..32d8c8a81c1 100644
--- a/mlir/lib/Dialect/QuantOps/Transforms/ConvertSimQuant.cpp
+++ b/mlir/lib/Dialect/QuantOps/Transforms/ConvertSimQuant.cpp
@@ -70,7 +70,7 @@ public:
UniformQuantizedType uniformElementType = fakeQuantAttrsToType(
fqOp.getLoc(), fqOp.num_bits().getSExtValue(),
fqOp.min().convertToFloat(), fqOp.max().convertToFloat(),
- fqOp.narrow_range(), converter.expressedType);
+ fqOp.narrow_range(), converter.expressedType, fqOp.is_signed());
if (!uniformElementType) {
// Note that the fakeQuantAttrsToType will have emitted the error.
diff --git a/mlir/lib/Dialect/QuantOps/Utils/FakeQuantSupport.cpp b/mlir/lib/Dialect/QuantOps/Utils/FakeQuantSupport.cpp
index 13c622e50d1..2667da98242 100644
--- a/mlir/lib/Dialect/QuantOps/Utils/FakeQuantSupport.cpp
+++ b/mlir/lib/Dialect/QuantOps/Utils/FakeQuantSupport.cpp
@@ -45,9 +45,15 @@ mlir::quant::fakeQuantAttrsToType(Location loc, unsigned numBits, double rmin,
}
} else if (numBits <= 16) {
storageType = IntegerType::get(16, ctx);
- flags = QuantizationFlags::Signed;
- qmin = -32768;
- qmax = 32767;
+ if (isSigned) {
+ flags = QuantizationFlags::Signed;
+ qmin = -32768;
+ qmax = 32767;
+ } else {
+ flags = 0;
+ qmin = 0;
+ qmax = 65535;
+ }
} else {
emitError(loc, "unsupported FakeQuant number of bits: ") << numBits;
return nullptr;
diff --git a/mlir/test/Dialect/QuantOps/convert-fakequant.mlir b/mlir/test/Dialect/QuantOps/convert-fakequant.mlir
index bd28c2c3516..61561c5e359 100644
--- a/mlir/test/Dialect/QuantOps/convert-fakequant.mlir
+++ b/mlir/test/Dialect/QuantOps/convert-fakequant.mlir
@@ -46,6 +46,51 @@ func @fakeQuantArgs_Quint8_SymmetricRange(tensor<8x4x3xf32>) -> tensor<8x4x3xf32
}
// -----
+// Verifies a qint8 asymmetric 0..1 range.
+// CHECK-LABEL: fakeQuantArgs_Qint8_0_1
+func @fakeQuantArgs_Qint8_0_1(tensor<8x4x3xf32>) -> tensor<8x4x3xf32> {
+^bb0(%arg0: tensor<8x4x3xf32>):
+ // CHECK: %0 = "quant.qcast"(%arg0) : (tensor<8x4x3xf32>)
+ // CHECK-SAME: -> tensor<8x4x3x!quant.uniform<i8:f32, 0.0039215686274509803:-128>>
+ // CHECK-NEXT: %1 = "quant.dcast"(%0) : (tensor<8x4x3x!quant.uniform<i8:f32, 0.0039215686274509803:-128>>)
+ // CHECK-SAME: -> tensor<8x4x3xf32>
+ %0 = "quant.const_fake_quant"(%arg0) {
+ min = 0.0 : f32, max = 1.0 : f32, num_bits = 8, is_signed = true
+ } : (tensor<8x4x3xf32>) -> tensor<8x4x3xf32>
+ return %0 : tensor<8x4x3xf32>
+}
+
+// -----
+// Verifies a qint8 asymmetric 0..1 range (with narrow_range = true).
+// CHECK-LABEL: fakeQuantArgs_Qint8_NarrowRange
+func @fakeQuantArgs_Qint8_NarrowRange(tensor<8x4x3xf32>) -> tensor<8x4x3xf32> {
+^bb0(%arg0: tensor<8x4x3xf32>):
+ // CHECK: %0 = "quant.qcast"(%arg0) : (tensor<8x4x3xf32>)
+ // CHECK-SAME: -> tensor<8x4x3x!quant.uniform<i8<-127:127>:f32, 0.003937007874015748:-127>>
+ // CHECK-NEXT: %1 = "quant.dcast"(%0) : (tensor<8x4x3x!quant.uniform<i8<-127:127>:f32, 0.003937007874015748:-127>>)
+ // CHECK-SAME: -> tensor<8x4x3xf32>
+ %0 = "quant.const_fake_quant"(%arg0) {
+ min = 0.0 : f32, max = 1.0 : f32, num_bits = 8, narrow_range = true, is_signed = true
+ } : (tensor<8x4x3xf32>) -> tensor<8x4x3xf32>
+ return %0 : tensor<8x4x3xf32>
+}
+
+// -----
+// Verifies a qint8 symmetric range of -1..127/128.
+// CHECK-LABEL: fakeQuantArgs_Qint8_SymmetricRange
+func @fakeQuantArgs_Qint8_SymmetricRange(tensor<8x4x3xf32>) -> tensor<8x4x3xf32> {
+^bb0(%arg0: tensor<8x4x3xf32>):
+ // CHECK: %0 = "quant.qcast"(%arg0) : (tensor<8x4x3xf32>)
+ // CHECK-SAME: -> tensor<8x4x3x!quant.uniform<i8:f32, 7.812500e-03>>
+ // CHECK-NEXT: %1 = "quant.dcast"(%0) : (tensor<8x4x3x!quant.uniform<i8:f32, 7.812500e-03>>)
+ // CHECK-SAME: -> tensor<8x4x3xf32>
+ %0 = "quant.const_fake_quant"(%arg0) {
+ min = -1.0 : f32, max = 0.9921875 : f32, num_bits = 8, narrow_range = false, is_signed = true
+ } : (tensor<8x4x3xf32>) -> tensor<8x4x3xf32>
+ return %0 : tensor<8x4x3xf32>
+}
+
+// -----
// Verifies a commonly used -1..1 symmetric 16bit range with a zero point of
// 0 and range -1.0 .. 32767/32768.
// CHECK-LABEL: fakeQuantArgs_Qint16_Symmetric
@@ -56,7 +101,7 @@ func @fakeQuantArgs_Qint16_Symmetric(tensor<8x4x3xf32>) -> tensor<8x4x3xf32> {
// CHECK-NEXT: %1 = "quant.dcast"(%0) : (tensor<8x4x3x!quant.uniform<i16:f32, 3.0517578125E-5>>)
// CHECK-SAME: -> tensor<8x4x3xf32>
%0 = "quant.const_fake_quant"(%arg0) {
- min = -1.0 : f32, max = 0.999969482 : f32, num_bits = 16
+ min = -1.0 : f32, max = 0.999969482 : f32, num_bits = 16, is_signed = true
} : (tensor<8x4x3xf32>) -> tensor<8x4x3xf32>
return %0 : tensor<8x4x3xf32>
}
OpenPOWER on IntegriCloud