Add a Tactivation attribute to QuantizedMatMul and QuantizedMatmulMinMax to explicitly indicate which quantizedtype the activation function following the op will produce as its output.
Change: 142073731
This commit is contained in:
parent
a7cd5f671e
commit
811629aed4
@ -2245,6 +2245,7 @@ REGISTER_OP("QuantizedMatMul")
|
|||||||
.Attr("Toutput: quantizedtype = DT_QINT32")
|
.Attr("Toutput: quantizedtype = DT_QINT32")
|
||||||
.Attr("transpose_a: bool = false")
|
.Attr("transpose_a: bool = false")
|
||||||
.Attr("transpose_b: bool = false")
|
.Attr("transpose_b: bool = false")
|
||||||
|
.Attr("Tactivation: quantizedtype = DT_QUINT8")
|
||||||
.SetShapeFn([](InferenceContext* c) {
|
.SetShapeFn([](InferenceContext* c) {
|
||||||
TF_RETURN_IF_ERROR(shape_inference::MatMulShape(c));
|
TF_RETURN_IF_ERROR(shape_inference::MatMulShape(c));
|
||||||
ShapeHandle unused;
|
ShapeHandle unused;
|
||||||
@ -2275,6 +2276,8 @@ min_b: The float value that the lowest quantized `b` value represents.
|
|||||||
max_b: The float value that the highest quantized `b` value represents.
|
max_b: The float value that the highest quantized `b` value represents.
|
||||||
min_out: The float value that the lowest quantized output value represents.
|
min_out: The float value that the lowest quantized output value represents.
|
||||||
max_out: The float value that the highest quantized output value represents.
|
max_out: The float value that the highest quantized output value represents.
|
||||||
|
Tactivation: The type of output produced by activation function
|
||||||
|
following this operation.
|
||||||
|
|
||||||
)doc");
|
)doc");
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user