mlir/lib/Quantization/Transforms/LowerTF.cpp

//===- LowerTF.cpp - Passes for lowering from TensorFlow ------------------===//
//
// Copyright 2019 The MLIR Authors.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//   http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================

#include "mlir/IR/Attributes.h"
#include "mlir/IR/PatternMatch.h"
#include "mlir/IR/StandardTypes.h"
#include "mlir/Pass/Pass.h"
#include "mlir/Quantization/FakeQuantSupport.h"
#include "mlir/Quantization/Passes.h"
#include "mlir/Quantization/QuantOps.h"
#include "mlir/Quantization/UniformSupport.h"
#include "mlir/TensorFlow/TFOps.h"

using namespace mlir;
using namespace mlir::quant;

namespace {

class LowerTFPass : public FunctionPass<LowerTFPass> {
public:
  void runOnFunction() override;
};

} // end anonymous namespace

/// Rewrites TensorFlow FakeQuantWithMinMaxArgs into a qbarrier/dbarrier pair.
class FakeQuantWithMinMaxArgsRewrite : public RewritePattern {
public:
  bool *hadFailure;

  FakeQuantWithMinMaxArgsRewrite(MLIRContext *context, bool *hadFailure)
      : RewritePattern(TF::FakeQuantWithMinMaxArgsOp::getOperationName(), 1,
                       context),
        hadFailure(hadFailure) {}

  PatternMatchResult match(Operation *op) const override {
    return matchSuccess();
  }

  void rewrite(Operation *op, PatternRewriter &rewriter) const override {
    // TODO: If this pattern comes up more frequently, consider adding core
    // support for failable rewrites.
    if (failableRewrite(op, rewriter)) {
      *hadFailure = true;
    }
  }

  bool failableRewrite(Operation *op, PatternRewriter &rewriter) const {
    auto fqOp = op->template cast<TF::FakeQuantWithMinMaxArgsOp>();

    auto converter =
        ExpressedToUniformQuantizedConverter::forInputType(fqOp.getType());
    if (!converter) {
      return (op->emitError("unsupported quantized type conversion"), true);
    }

    UniformQuantizedType uniformElementType = fakeQuantAttrsToType(
        fqOp.getLoc(), fqOp.num_bits().getSExtValue(),
        fqOp.min().convertToDouble(), fqOp.max().convertToDouble(),
        fqOp.narrow_range(), converter.expressedType);

    if (!uniformElementType) {
      // Note that the fakeQuantAttrsToType will have emitted the error.
      return true;
    }

    Type quantizedType = converter.convert(uniformElementType);
    assert(quantizedType &&
           "Converter accepted a type that it did not convert");

    // TODO: Map to a qbarrier with an attribute like [Forced] to signal that
    // this is a forced/hard-coded constraint.
    auto qbarrier = rewriter.create<QuantizeBarrierOp>(
        op->getLoc(), quantizedType, fqOp.inputs());
    rewriter.replaceOpWithNewOp<DequantizeBarrierOp>(op, converter.inputType,
                                                     qbarrier.getResult());

    return false;
  }
};

void LowerTFPass::runOnFunction() {
  bool hadFailure = false;
  OwningRewritePatternList patterns;
  auto &func = getFunction();
  auto *context = &getContext();
  patterns.push_back(
      llvm::make_unique<FakeQuantWithMinMaxArgsRewrite>(context, &hadFailure));
  applyPatternsGreedily(func, std::move(patterns));
  if (hadFailure)
    signalPassFailure();
}

FunctionPassBase *createLowerTFPass() { return new LowerTFPass(); }

static PassRegistration<LowerTFPass>
    pass("quant-lower-tf",
         "Lowers TensorFlow constraint ops to the quantization dialect");
Initial release of the Quantization dialect Includes a draft of documentation for the quantization setup. Given how many comments such docs have garnered in the past, I've biased towards a lightly edited first-draft so that people can argue about terminology, approach and structure without having spent too much time on it. Note that the sections under "Uniform quantization" were cribbed nearly verbatim from internal documentation that Daniel wrote. PiperOrigin-RevId: 241768668 2019-04-03 11:16:32 -07:00			`//===- LowerTF.cpp - Passes for lowering from TensorFlow ------------------===//`
			`//`
			`// Copyright 2019 The MLIR Authors.`
			`//`
			`// Licensed under the Apache License, Version 2.0 (the "License");`
			`// you may not use this file except in compliance with the License.`
			`// You may obtain a copy of the License at`
			`//`
			`// http://www.apache.org/licenses/LICENSE-2.0`
			`//`
			`// Unless required by applicable law or agreed to in writing, software`
			`// distributed under the License is distributed on an "AS IS" BASIS,`
			`// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`// See the License for the specific language governing permissions and`
			`// limitations under the License.`
			`// =============================================================================`

			`#include "mlir/IR/Attributes.h"`
			`#include "mlir/IR/PatternMatch.h"`
			`#include "mlir/IR/StandardTypes.h"`
			`#include "mlir/Pass/Pass.h"`
			`#include "mlir/Quantization/FakeQuantSupport.h"`
			`#include "mlir/Quantization/Passes.h"`
			`#include "mlir/Quantization/QuantOps.h"`
			`#include "mlir/Quantization/UniformSupport.h"`
			`#include "mlir/TensorFlow/TFOps.h"`

			`using namespace mlir;`
			`using namespace mlir::quant;`

			`namespace {`

			`class LowerTFPass : public FunctionPass<LowerTFPass> {`
			`public:`
			`void runOnFunction() override;`
			`};`

			`} // end anonymous namespace`

			`/// Rewrites TensorFlow FakeQuantWithMinMaxArgs into a qbarrier/dbarrier pair.`
			`class FakeQuantWithMinMaxArgsRewrite : public RewritePattern {`
			`public:`
			`bool *hadFailure;`

			`FakeQuantWithMinMaxArgsRewrite(MLIRContext context, bool hadFailure)`
			`: RewritePattern(TF::FakeQuantWithMinMaxArgsOp::getOperationName(), 1,`
			`context),`
			`hadFailure(hadFailure) {}`

			`PatternMatchResult match(Operation *op) const override {`
			`return matchSuccess();`
			`}`

			`void rewrite(Operation *op, PatternRewriter &rewriter) const override {`
			`// TODO: If this pattern comes up more frequently, consider adding core`
			`// support for failable rewrites.`
			`if (failableRewrite(op, rewriter)) {`
			`*hadFailure = true;`
			`}`
			`}`

			`bool failableRewrite(Operation *op, PatternRewriter &rewriter) const {`
			`auto fqOp = op->template cast<TF::FakeQuantWithMinMaxArgsOp>();`

			`auto converter =`
			`ExpressedToUniformQuantizedConverter::forInputType(fqOp.getType());`
			`if (!converter) {`
			`return (op->emitError("unsupported quantized type conversion"), true);`
			`}`

			`UniformQuantizedType uniformElementType = fakeQuantAttrsToType(`
			`fqOp.getLoc(), fqOp.num_bits().getSExtValue(),`
			`fqOp.min().convertToDouble(), fqOp.max().convertToDouble(),`
			`fqOp.narrow_range(), converter.expressedType);`

			`if (!uniformElementType) {`
			`// Note that the fakeQuantAttrsToType will have emitted the error.`
			`return true;`
			`}`

			`Type quantizedType = converter.convert(uniformElementType);`
			`assert(quantizedType &&`
			`"Converter accepted a type that it did not convert");`

			`// TODO: Map to a qbarrier with an attribute like [Forced] to signal that`
			`// this is a forced/hard-coded constraint.`
			`auto qbarrier = rewriter.create<QuantizeBarrierOp>(`
			`op->getLoc(), quantizedType, fqOp.inputs());`
			`rewriter.replaceOpWithNewOp<DequantizeBarrierOp>(op, converter.inputType,`
			`qbarrier.getResult());`

			`return false;`
			`}`
			`};`

			`void LowerTFPass::runOnFunction() {`
			`bool hadFailure = false;`
			`OwningRewritePatternList patterns;`
			`auto &func = getFunction();`
			`auto *context = &getContext();`
			`patterns.push_back(`
			`llvm::make_unique<FakeQuantWithMinMaxArgsRewrite>(context, &hadFailure));`
			`applyPatternsGreedily(func, std::move(patterns));`
			`if (hadFailure)`
			`signalPassFailure();`
			`}`

			`FunctionPassBase *createLowerTFPass() { return new LowerTFPass(); }`

			`static PassRegistration<LowerTFPass>`
			`pass("quant-lower-tf",`
			`"Lowers TensorFlow constraint ops to the quantization dialect");`