// [extraction artifact] The following text is Doxygen page chrome captured by
// the HTML-to-text conversion, not part of the original source file:
//   CIRCT 23.0.0git | Loading... | Searching... | No Matches
//   DatapathFolds.cpp -- "Go to the documentation of this file."
1//===----------------------------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
13#include "mlir/IR/Matchers.h"
14#include "mlir/IR/PatternMatch.h"
15#include "llvm/Support/Casting.h"
16#include "llvm/Support/KnownBits.h"
17#include <algorithm>
18
19using namespace mlir;
20using namespace circt;
21using namespace datapath;
22using namespace matchers;
23
24//===----------------------------------------------------------------------===//
25// Utility Functions
26//===----------------------------------------------------------------------===//
27static FailureOr<size_t> calculateNonZeroBits(Value operand,
28 size_t numResults) {
29 // If the extracted bits are all known, then return the result.
30 auto knownBits = comb::computeKnownBits(operand);
31 if (knownBits.isUnknown())
32 return failure(); // Skip if we don't know anything about the bits
33
34 size_t nonZeroBits = operand.getType().getIntOrFloatBitWidth() -
35 knownBits.Zero.countLeadingOnes();
36
37 // If all bits non-zero we will not reduce the number of results
38 if (nonZeroBits == numResults)
39 return failure();
40
41 return nonZeroBits;
42}
43
44// Check if the operand is sext() and return the unextended operand:
45// signBit = comb.extract(baseValue, width-1, 1)
46// ext = comb.replicate(signBit, width-baseWidth)
47// sext = comb.concat(ext, baseValue)
48static FailureOr<Value> isSext(Value operand) {
49 // Check if operand is a concat operation
50 auto concatOp = operand.getDefiningOp<comb::ConcatOp>();
51 if (!concatOp)
52 return failure();
53
54 auto operands = concatOp.getOperands();
55 // ConcatOp must have exactly 2 operands: (sign_bits, original_value)
56 if (operands.size() != 2)
57 return failure();
58
59 Value signBits = operands[0];
60 Value originalValue = operands[1];
61 auto originalWidth = originalValue.getType().getIntOrFloatBitWidth();
62
63 // Check if signBits is a replicate operation
64 auto replicateOp = signBits.getDefiningOp<comb::ReplicateOp>();
65 if (!replicateOp)
66 return failure();
67
68 Value signBit = replicateOp.getInput();
69
70 // Check if signBit is the msb of originalValue
71 auto extractOp = signBit.getDefiningOp<comb::ExtractOp>();
72 if (!extractOp)
73 return failure();
74
75 if ((extractOp.getInput() != originalValue) ||
76 (extractOp.getLowBit() != originalWidth - 1) ||
77 (extractOp.getType().getIntOrFloatBitWidth() != 1))
78 return failure();
79
80 // Return the original unextended value
81 return originalValue;
82}
83
84// zext(input<<trailingZeros) to targetWidth
85static Value zeroPad(PatternRewriter &rewriter, Location loc, Value input,
86 size_t targetWidth, size_t trailingZeros) {
87 assert(trailingZeros > 0 && "zeroPad called with zero trailing zeros");
88 auto trailingZerosValue =
89 hw::ConstantOp::create(rewriter, loc, APInt::getZero(trailingZeros));
90 auto padTrailing = comb::ConcatOp::create(
91 rewriter, loc, ValueRange{input, trailingZerosValue});
92 return comb::createZExt(rewriter, loc, padTrailing, targetWidth);
93}
94
95//===----------------------------------------------------------------------===//
96// Compress Operation
97//===----------------------------------------------------------------------===//
98// Check that all compressor results are included in this list of operands
99// If not we must take care as manipulating compressor results independently
100// could easily introduce a non-equivalent representation.
101static bool areAllCompressorResultsSummed(ValueRange compressResults,
102 ValueRange operands) {
103 for (auto result : compressResults) {
104 if (!llvm::is_contained(operands, result))
105 return false;
106 }
107 return true;
108}
109
111 : public OpRewritePattern<datapath::CompressOp> {
112 using OpRewritePattern::OpRewritePattern;
113
114 // compress(compress(a,b,c), add(e,f)) -> compress(a,b,c,e,f)
115 LogicalResult matchAndRewrite(datapath::CompressOp compOp,
116 PatternRewriter &rewriter) const override {
117 auto operands = compOp.getOperands();
118 llvm::SmallSetVector<Value, 8> processedCompressorResults;
119 SmallVector<Value, 8> newCompressOperands;
120
121 for (Value operand : operands) {
122
123 // Skip if already processed this compressor
124 if (processedCompressorResults.contains(operand))
125 continue;
126
127 // If the operand has multiple uses, we do not fold it into a compress
128 // operation, so we treat it as a regular operand to maintain sharing.
129 if (!operand.hasOneUse()) {
130 newCompressOperands.push_back(operand);
131 continue;
132 }
133
134 // Found a compress op - add its operands to our new list
135 if (auto compressOp = operand.getDefiningOp<datapath::CompressOp>()) {
136
137 // Check that all results of the compressor are summed in this add
138 if (!areAllCompressorResultsSummed(compressOp.getResults(), operands))
139 return failure();
140
141 llvm::append_range(newCompressOperands, compressOp.getOperands());
142 // Only process each compressor once as multiple operands will point
143 // to the same defining operation
144 processedCompressorResults.insert(compressOp.getResults().begin(),
145 compressOp.getResults().end());
146 continue;
147 }
148
149 if (auto addOp = operand.getDefiningOp<comb::AddOp>()) {
150 llvm::append_range(newCompressOperands, addOp.getOperands());
151 continue;
152 }
153
154 // Regular operand - just add it to our list
155 newCompressOperands.push_back(operand);
156 }
157
158 // If unable to collect more operands then this pattern doesn't apply
159 if (newCompressOperands.size() <= compOp.getNumOperands())
160 return failure();
161
162 // Create a new CompressOp with all collected operands
163 rewriter.replaceOpWithNewOp<datapath::CompressOp>(
164 compOp, newCompressOperands, compOp.getNumResults());
165 return success();
166 }
167};
168
// Folds add operands that are single-use compressor results or nested adds
// into one wider compressor feeding a 2-row add:
// add(compress(a,b,c), d, e) -> add(compress(a,b,c,d,e)).
struct FoldAddIntoCompress : public OpRewritePattern<comb::AddOp> {
  using OpRewritePattern::OpRewritePattern;

  // add(compress(a,b,c),d) -> add(compress(a,b,c,d))
  // FIXME: This should be implemented as a canonicalization pattern for
  // compress op. Currently `hasDatapathOperand` flag prevents introducing
  // datapath operations from comb operations.
  LogicalResult matchAndRewrite(comb::AddOp addOp,
                                PatternRewriter &rewriter) const override {
    // comb.add canonicalization patterns handle folding add operations
    if (addOp.getNumOperands() <= 2)
      return failure();

    // Get operands of the AddOp
    auto operands = addOp.getOperands();
    // Results of compressors already inlined, so each defining compressor is
    // expanded only once.
    llvm::SmallSetVector<Value, 8> processedCompressorResults;
    SmallVector<Value, 8> newCompressOperands;
    // Only construct compressor if can form a larger compressor than what
    // is currently an input of this add. Also check that there is at least
    // one datapath operand.
    bool shouldFold = false, hasDatapathOperand = false;

    for (Value operand : operands) {

      // Skip if already processed this compressor
      if (processedCompressorResults.contains(operand))
        continue;

      // Track whether any operand is produced by a datapath op - without
      // one, folding would introduce datapath ops into pure comb IR.
      if (auto *op = operand.getDefiningOp())
        if (isa_and_nonnull<datapath::DatapathDialect>(op->getDialect()))
          hasDatapathOperand = true;

      // If the operand has multiple uses, we do not fold it into a compress
      // operation, so we treat it as a regular operand.
      if (!operand.hasOneUse()) {
        // shouldFold becomes true once a second source joins the compressor,
        // i.e. the rewrite would actually merge something.
        shouldFold |= !newCompressOperands.empty();
        newCompressOperands.push_back(operand);
        continue;
      }

      // Found a compress op - add its operands to our new list
      if (auto compressOp = operand.getDefiningOp<datapath::CompressOp>()) {

        // Check that all results of the compressor are summed in this add
        if (!areAllCompressorResultsSummed(compressOp.getResults(), operands))
          return failure();

        // If we've already added one operand it should be folded
        shouldFold |= !newCompressOperands.empty();
        llvm::append_range(newCompressOperands, compressOp.getOperands());
        // Only process each compressor once
        processedCompressorResults.insert(compressOp.getResults().begin(),
                                          compressOp.getResults().end());
        continue;
      }

      // Nested adds are summations too - inline their addends.
      if (auto addOp = operand.getDefiningOp<comb::AddOp>()) {
        shouldFold |= !newCompressOperands.empty();
        llvm::append_range(newCompressOperands, addOp.getOperands());
        continue;
      }

      // Regular operand - just add it to our list
      shouldFold |= !newCompressOperands.empty();
      newCompressOperands.push_back(operand);
    }

    // Only fold if we have constructed a larger compressor than what was
    // already there
    if (!shouldFold || !hasDatapathOperand)
      return failure();

    // Create a new CompressOp with all collected operands, reduced to the
    // canonical two-row redundant form.
    auto newCompressOp = datapath::CompressOp::create(rewriter, addOp.getLoc(),
                                                      newCompressOperands, 2);

    // Replace the original AddOp with a new add(compress(inputs))
    rewriter.replaceOpWithNewOp<comb::AddOp>(addOp, newCompressOp.getResults(),
                                             true);
    return success();
  }
};
251
252struct ConstantFoldCompress : public OpRewritePattern<CompressOp> {
253 using OpRewritePattern::OpRewritePattern;
254
255 LogicalResult matchAndRewrite(CompressOp op,
256 PatternRewriter &rewriter) const override {
257 auto inputs = op.getInputs();
258 auto size = inputs.size();
259
260 APInt value;
261
262 // compress(..., 0) -> compress(...) -- identity
263 if (matchPattern(inputs.back(), m_ConstantInt(&value)) && value.isZero()) {
264
265 // If only reducing by one row and contains zero - pass through operands
266 if (size - 1 == op.getNumResults()) {
267 rewriter.replaceOp(op, inputs.drop_back());
268 return success();
269 }
270
271 // Default create a compressor with fewer arguments
272 rewriter.replaceOpWithNewOp<CompressOp>(op, inputs.drop_back(),
273 op.getNumResults());
274 return success();
275 }
276
277 return failure();
278 }
279};
280
281void CompressOp::getCanonicalizationPatterns(RewritePatternSet &results,
282 MLIRContext *context) {
283 results
285 context);
286}
287
288//===----------------------------------------------------------------------===//
289// Partial Product Operation
290//===----------------------------------------------------------------------===//
291struct ReduceNumPartialProducts : public OpRewritePattern<PartialProductOp> {
292 using OpRewritePattern::OpRewritePattern;
293
294 // pp(concat(0,a), concat(0,b)) -> reduced number of results
295 LogicalResult matchAndRewrite(PartialProductOp op,
296 PatternRewriter &rewriter) const override {
297 auto operands = op.getOperands();
298 unsigned inputWidth = operands[0].getType().getIntOrFloatBitWidth();
299
300 // TODO: implement a constant multiplication for the PartialProductOp
301
302 auto op0NonZeroBits = calculateNonZeroBits(operands[0], op.getNumResults());
303 auto op1NonZeroBits = calculateNonZeroBits(operands[1], op.getNumResults());
304
305 if (failed(op0NonZeroBits) || failed(op1NonZeroBits))
306 return failure();
307
308 // Need the +1 for the carry-out
309 size_t maxNonZeroBits = std::max(*op0NonZeroBits, *op1NonZeroBits);
310
311 auto newPP = datapath::PartialProductOp::create(
312 rewriter, op.getLoc(), op.getOperands(), maxNonZeroBits);
313
314 auto zero = hw::ConstantOp::create(rewriter, op.getLoc(),
315 APInt::getZero(inputWidth));
316
317 // Collect newPP results and pad with zeros if needed
318 SmallVector<Value> newResults(newPP.getResults().begin(),
319 newPP.getResults().end());
320
321 newResults.append(op.getNumResults() - newResults.size(), zero);
322
323 rewriter.replaceOp(op, newResults);
324 return success();
325 }
326};
327
// Rewrites a partial product of two sign-extended inputs so the unsigned
// partial-product array operates on the narrower, unextended magnitudes.
struct SignedPartialProducts : public OpRewritePattern<PartialProductOp> {
  using OpRewritePattern::OpRewritePattern;

  // Based on the classical Baugh-Wooley algorithm for signed multiplication.
  // Paper: A Two's Complement Parallel Array Multiplication Algorithm
  //
  // Consider a p-bit by q-bit signed multiplier - producing a (p+q)-bit result:
  // a_sign = a[p-1], a_mag = a[p-2:0],
  // b_sign = b[q-1], b_mag = b[q-2:0]
  // sext(a) * sext(b) = a_mag * b_mag              [unsigned product]
  //                   - 2^(p-1) * a_sign * b_mag   [sign correction]
  //                   - 2^(q-1) * b_sign * a_mag   [sign correction]
  //                   + 2^(p+q-2) * a_sign * b_sign [sign * sign]
  //
  // We implement optimizations to turn the subtractions into bitwise negations
  // with constant corrections that can be folded together.
  LogicalResult matchAndRewrite(PartialProductOp op,
                                PatternRewriter &rewriter) const override {
    auto inputWidth = op.getOperand(0).getType().getIntOrFloatBitWidth();
    // Both operands must be sign-extensions; recover the unextended values.
    auto lhs = isSext(op.getOperand(0));
    auto rhs = isSext(op.getOperand(1));
    if (failed(lhs) || failed(rhs))
      return failure();

    size_t lhsWidth = (*lhs).getType().getIntOrFloatBitWidth();
    size_t rhsWidth = (*rhs).getType().getIntOrFloatBitWidth();
    // Subtract 1 as will handle sign-bit separately
    size_t maxRows = std::max(lhsWidth, rhsWidth) - 1;

    // TODO: add support for different width inputs
    // Need to have a sign bit in both inputs
    if (lhsWidth != rhsWidth || lhsWidth <= 1 || rhsWidth <= 1)
      return failure();

    // No further reduction possible
    if (maxRows >= op.getNumResults())
      return failure();

    // Pull off the sign bits
    auto lhsBaseWidth = lhsWidth - 1;
    auto rhsBaseWidth = rhsWidth - 1;
    auto lhsSignBit =
        comb::ExtractOp::create(rewriter, op.getLoc(), *lhs, lhsBaseWidth, 1);
    auto rhsSignBit =
        comb::ExtractOp::create(rewriter, op.getLoc(), *rhs, rhsBaseWidth, 1);
    auto lhsBase =
        comb::ExtractOp::create(rewriter, op.getLoc(), *lhs, 0, lhsBaseWidth);
    auto rhsBase =
        comb::ExtractOp::create(rewriter, op.getLoc(), *rhs, 0, rhsBaseWidth);

    // Create the unsigned partial product of the unextended inputs
    auto lhsBaseZext =
        comb::createZExt(rewriter, op.getLoc(), lhsBase, inputWidth);
    auto rhsBaseZext =
        comb::createZExt(rewriter, op.getLoc(), rhsBase, inputWidth);
    auto newPP = datapath::PartialProductOp::create(
        rewriter, op.getLoc(), ValueRange{lhsBaseZext, rhsBaseZext}, maxRows);

    // Optimization (similar for second sign correction), ext to (p+q)-bits:
    // -2^(p-1)*sign(lhs)*rhsBase = ~((sign(lhs) * rhsBase) << (p-1)) + 1
    //   = (~(replicate(sign(lhs)) & rhsBase)) << (p-1)
    //     + (-1) << (p+q-2)       [msb correction]
    //     + (1<<(p-1)) - 1 + 1    [lsb correction]

    // Create ~(replicate(sign(lhs)) & rhsBase)
    auto lhsSignReplicate = comb::ReplicateOp::create(rewriter, op.getLoc(),
                                                      lhsSignBit, rhsBaseWidth);
    auto lhsSignAndRhs =
        comb::AndOp::create(rewriter, op.getLoc(), lhsSignReplicate, rhsBase);
    auto lhsSignCorrection =
        comb::createOrFoldNot(op.getLoc(), lhsSignAndRhs, rewriter, true);

    // zext({lhsSignCorrection, lhsBaseWidth{1'b0}})
    auto alignLhsSignCorrection = zeroPad(
        rewriter, op.getLoc(), lhsSignCorrection, inputWidth, lhsBaseWidth);

    // Create ~(replicate(sign(rhs)) & lhsBase)
    auto rhsSignReplicate = comb::ReplicateOp::create(rewriter, op.getLoc(),
                                                      rhsSignBit, lhsBaseWidth);
    auto rhsSignAndLhs =
        comb::AndOp::create(rewriter, op.getLoc(), rhsSignReplicate, lhsBase);
    auto rhsSignCorrection =
        comb::createOrFoldNot(op.getLoc(), rhsSignAndLhs, rewriter, true);

    // zext({rhsSignCorrection, rhsBaseWidth{1'b0}})
    auto alignRhsSignCorrection = zeroPad(
        rewriter, op.getLoc(), rhsSignCorrection, inputWidth, rhsBaseWidth);

    // 2^(p+q-2) * sign(lhs) * sign(rhs) = (sign(lhs) & sign(rhs)) << (p+q-2)
    // Create sign(lhs) & sign(rhs)
    auto signAnd =
        comb::AndOp::create(rewriter, op.getLoc(), lhsSignBit, rhsSignBit);
    // zext({sign(lhs) & sign(rhs), lhsBaseWidth+rhsBaseWidth{1'b0}})
    auto alignSignAndZext = zeroPad(rewriter, op.getLoc(), signAnd, inputWidth,
                                    lhsBaseWidth + rhsBaseWidth);

    // Gather constant corrections together (once for each sign correction):
    // (-1) << (p+q-2) + (1<<(p-1)) - 1 + 1
    auto ones = APInt::getAllOnes(inputWidth);
    auto lowerLhs = APInt::getOneBitSet(inputWidth, lhsBaseWidth);
    auto lowerRhs = APInt::getOneBitSet(inputWidth, rhsBaseWidth);
    // msbCorrection doubled below because the msb term occurs once per sign
    // correction (two corrections in total).
    auto msbCorrection = ones << (lhsBaseWidth + rhsBaseWidth);
    auto correction = lowerLhs + lowerRhs + 2 * msbCorrection;

    auto constantCorrection =
        hw::ConstantOp::create(rewriter, op.getLoc(), correction);

    auto zero = hw::ConstantOp::create(rewriter, op.getLoc(),
                                       APInt::getZero(inputWidth));
    // Collect newPP results and pad with zeros if needed
    // NOTE(review): if maxRows + 4 exceeds getNumResults(), the append count
    // below underflows - verify the op's result-count invariants upstream.
    SmallVector<Value> newResults(newPP.getResults().begin(),
                                  newPP.getResults().end());

    // ~(replicate(sign(lhs)) & rhsBase) * 2^(p-1)
    newResults.push_back(alignLhsSignCorrection);
    // ~(replicate(sign(rhs)) & lhsBase) * 2^(q-1)
    newResults.push_back(alignRhsSignCorrection);
    // sign(lhs)*sign(rhs) * 2^(p+q-2)
    newResults.push_back(alignSignAndZext);
    // Constant correction
    newResults.push_back(constantCorrection);
    // Zero pad if necessary
    newResults.append(op.getNumResults() - newResults.size(), zero);

    rewriter.replaceOp(op, newResults);
    return success();
  }
};
456
457struct PosPartialProducts : public OpRewritePattern<PartialProductOp> {
458 using OpRewritePattern::OpRewritePattern;
459
460 // pp(add(a,b),c) -> pos_pp(a,b,c)
461 LogicalResult matchAndRewrite(PartialProductOp op,
462 PatternRewriter &rewriter) const override {
463 auto width = op.getType(0).getIntOrFloatBitWidth();
464
465 assert(op.getNumOperands() == 2);
466
467 // Detect if any input is an AddOp
468 auto lhsAdder = op.getOperand(0).getDefiningOp<comb::AddOp>();
469 auto rhsAdder = op.getOperand(1).getDefiningOp<comb::AddOp>();
470 if ((lhsAdder && rhsAdder) || !(lhsAdder || rhsAdder))
471 return failure();
472 auto addInput = lhsAdder ? lhsAdder : rhsAdder;
473 auto otherInput = lhsAdder ? op.getOperand(1) : op.getOperand(0);
474
475 if (addInput->getNumOperands() != 2)
476 return failure();
477
478 Value addend0 = addInput->getOperand(0);
479 Value addend1 = addInput->getOperand(1);
480
481 rewriter.replaceOpWithNewOp<PosPartialProductOp>(
482 op, ValueRange{addend0, addend1, otherInput}, width);
483 return success();
484 }
485};
486
487void PartialProductOp::getCanonicalizationPatterns(RewritePatternSet &results,
488 MLIRContext *context) {
489 results
491 context);
492}
493
494//===----------------------------------------------------------------------===//
495// Pos Partial Product Operation
496//===----------------------------------------------------------------------===//
498 : public OpRewritePattern<PosPartialProductOp> {
499 using OpRewritePattern::OpRewritePattern;
500
501 // pos_pp(concat(0,a), concat(0,b), c) -> reduced number of results
502 LogicalResult matchAndRewrite(PosPartialProductOp op,
503 PatternRewriter &rewriter) const override {
504 unsigned inputWidth = op.getAddend0().getType().getIntOrFloatBitWidth();
505 auto addend0NonZero =
506 calculateNonZeroBits(op.getAddend0(), op.getNumResults());
507 auto addend1NonZero =
508 calculateNonZeroBits(op.getAddend1(), op.getNumResults());
509
510 if (failed(addend0NonZero) || failed(addend1NonZero))
511 return failure();
512
513 // Need the +1 for the carry-out
514 size_t maxNonZeroBits = std::max(*addend0NonZero, *addend1NonZero) + 1;
515
516 if (maxNonZeroBits >= op.getNumResults())
517 return failure();
518
519 auto newPP = datapath::PosPartialProductOp::create(
520 rewriter, op.getLoc(), op.getOperands(), maxNonZeroBits);
521
522 auto zero = hw::ConstantOp::create(rewriter, op.getLoc(),
523 APInt::getZero(inputWidth));
524
525 // Collect newPP results and pad with zeros if needed
526 SmallVector<Value> newResults(newPP.getResults().begin(),
527 newPP.getResults().end());
528
529 newResults.append(op.getNumResults() - newResults.size(), zero);
530
531 rewriter.replaceOp(op, newResults);
532 return success();
533 }
534};
535
536void PosPartialProductOp::getCanonicalizationPatterns(
537 RewritePatternSet &results, MLIRContext *context) {
539}
// [extraction artifact] The following lines are Doxygen tooltip text captured
// by the HTML-to-text conversion; they are not part of the original source:
//   assert(baseType &&"element must be base type")
//   static FailureOr< Value > isSext(Value operand)
//   static bool areAllCompressorResultsSummed(ValueRange compressResults, ValueRange operands)
//   static FailureOr< size_t > calculateNonZeroBits(Value operand, size_t numResults)
//   static Value zeroPad(PatternRewriter &rewriter, Location loc, Value input, size_t targetWidth, size_t trailingZeros)
//   static std::unique_ptr< Context > context
//   create(low_bit, result_type, input=None)  [Definition comb.py:187]
//   create(data_type, value)                  [Definition hw.py:433]
//   The InstanceGraph op interface, see InstanceGraphInterface.td for more details.
//   LogicalResult matchAndRewrite(CompressOp op, PatternRewriter &rewriter) const override
//   LogicalResult matchAndRewrite(comb::AddOp addOp, PatternRewriter &rewriter) const override
//   LogicalResult matchAndRewrite(datapath::CompressOp compOp, PatternRewriter &rewriter) const override
//   LogicalResult matchAndRewrite(PartialProductOp op, PatternRewriter &rewriter) const override
//   LogicalResult matchAndRewrite(PosPartialProductOp op, PatternRewriter &rewriter) const override