14#include "mlir/Analysis/TopologicalSortUtils.h"
15#include "mlir/Dialect/Func/IR/FuncOps.h"
16#include "mlir/IR/PatternMatch.h"
17#include "mlir/Pass/Pass.h"
18#include "mlir/Transforms/GreedyPatternRewriteDriver.h"
19#include "llvm/Support/Debug.h"
20#include "llvm/Support/KnownBits.h"
23#define DEBUG_TYPE "datapath-to-comb"
26#define GEN_PASS_DEF_CONVERTDATAPATHTOCOMB
27#include "circt/Conversion/Passes.h.inc"
31using namespace datapath;
// File-local helper: declares a SmallVector<Value> named `bits` and hands it,
// together with `builder` and `val`, to comb::extractBits to be filled.
// NOTE(review): the return statement and closing brace are not visible in
// this excerpt; presumably `bits` is returned -- confirm against the full file.
34static SmallVector<Value>
extractBits(OpBuilder &builder, Value val) {
35 SmallVector<Value> bits;
36 comb::extractBits(builder, val, bits);
// Rewrites a CompressOp into a single comb::AddOp over all of its operands.
// The replacement values are (getNumResults() - 1) copies of `zeroOp`
// followed by the adder result.
// NOTE(review): the enclosing pattern struct, the definition of `zeroOp` and
// the return statement are not visible in this excerpt.
51 matchAndRewrite(CompressOp op,
52 mlir::PatternRewriter &rewriter)
const override {
53 Location loc = op.getLoc();
54 auto inputs = op.getOperands();
// Bit width of the first operand.
// NOTE(review): its use is not visible here; presumably it sizes `zeroOp`.
55 unsigned width = inputs[0].getType().getIntOrFloatBitWidth();
// Sum every operand with one variadic add.
57 auto addOp = comb::AddOp::create(rewriter, loc, inputs,
true);
// All results but the last are `zeroOp`; the last one carries the sum.
60 SmallVector<Value> results(op.getNumResults() - 1, zeroOp);
61 results.push_back(addOp);
62 rewriter.replaceOp(op, results);
// Constructor fragment and rewrite entry point of the timing-aware CompressOp
// conversion pattern.
// NOTE(review): the rest of the constructor, the body of the loop over the
// inputs, the construction of `comp`, and the failure/return paths are not
// visible in this excerpt.
69 DatapathCompressOpConversion(MLIRContext *context,
// Replaces the CompressOp with the values produced by
// comp.compressToHeight(rewriter, targetAddends).
74 matchAndRewrite(CompressOp op,
75 mlir::PatternRewriter &rewriter)
const override {
76 Location loc = op.getLoc();
77 auto inputs = op.getOperands();
// One inner vector per input.
// NOTE(review): the code that fills `addends` is not visible here.
79 SmallVector<SmallVector<Value>> addends;
80 for (
auto input : inputs) {
86 auto width = inputs[0].getType().getIntOrFloatBitWidth();
// The number of results of the op is the height passed to compressToHeight.
87 auto targetAddends = op.getNumResults();
// Supply input delays through a callback that queries
// analysis->getMaxDelay(v, 0) for each value.
92 if (failed(comp.withInputDelays(
93 [&](Value v) { return analysis->getMaxDelay(v, 0); })))
97 rewriter.replaceOp(op, comp.compressToHeight(rewriter, targetAddends));
// Rewrite pattern for PartialProductOp. Its matchAndRewrite dispatches to one
// of three static lowerings visible in this file: lowerSqrAndArray,
// lowerBoothArray or lowerAndArray.
// NOTE(review): several lines (constructor body, guard conditions) are not
// visible in this excerpt.
105struct DatapathPartialProductOpConversion :
OpRewritePattern<PartialProductOp> {
108 DatapathPartialProductOpConversion(MLIRContext *context,
bool forceBooth)
// When set, the Booth lowering is selected regardless of the result count.
111 const bool forceBooth;
113 LogicalResult matchAndRewrite(PartialProductOp op,
114 PatternRewriter &rewriter)
const override {
116 Value a = op.getLhs();
117 Value b = op.getRhs();
118 unsigned width = a.getType().getIntOrFloatBitWidth();
// Replace the op with a constant 0 of the type of result 0.
// NOTE(review): the condition guarding this replacement is not visible.
122 rewriter.replaceOpWithNewOp<
hw::ConstantOp>(op, op.getType(0), 0);
// Squarer lowering; only `a` is forwarded.
// NOTE(review): the guarding condition is not visible; presumably it checks
// that both operands are the same value -- confirm.
139 return lowerSqrAndArray(rewriter, a, op, width);
// Booth lowering for more than 16 results or when forced; otherwise fall
// back to the plain AND-array lowering.
143 if (op.getNumResults() > 16 || forceBooth)
144 return lowerBoothArray(rewriter, a, b, op, width);
146 return lowerAndArray(rewriter, a, b, op, width);
// Lowers a PartialProductOp to one row per result, where each row is `a`
// ANDed with a replicated bit of `b`. The collected rows replace the op.
// NOTE(review): the tail of the signature and several op-creation lines are
// not visible in this excerpt.
150 static LogicalResult lowerAndArray(PatternRewriter &rewriter, Value a,
151 Value b, PartialProductOp op,
154 Location loc = op.getLoc();
156 SmallVector<Value> bBits =
extractBits(rewriter, b);
// Start from the full width and, when more than one leading bit of `a` is
// known to be zero, shrink the row width by that count.
158 auto rowWidth = width;
159 auto knownBitsA = comb::computeKnownBits(a);
160 if (!knownBitsA.Zero.isZero()) {
161 if (knownBitsA.Zero.countLeadingOnes() > 1) {
162 rowWidth -= knownBitsA.Zero.countLeadingOnes();
167 SmallVector<Value> partialProducts;
168 partialProducts.reserve(width);
171 assert(op.getNumResults() <= width &&
172 "Cannot return more results than the operator width");
// Row i: replicate bBits[i] to rowWidth bits and AND it with `a`.
174 for (
unsigned i = 0; i < op.getNumResults(); ++i) {
176 rewriter.createOrFold<comb::ReplicateOp>(loc, bBits[i], rowWidth);
177 auto ppRow = rewriter.createOrFold<
comb::AndOp>(loc, repl, a);
// A narrowed row is combined with `zeroPad` to make up the missing
// (width - rowWidth) bits.
// NOTE(review): the op built from {zeroPad, ppRow} is not visible here.
178 if (rowWidth < width) {
179 auto padding = width - rowWidth;
182 loc, ValueRange{zeroPad, ppRow});
186 partialProducts.push_back(ppRow);
// Combine the row with `shiftBy` and narrow the result with (0, width).
// NOTE(review): the definition of `shiftBy` and the op receiving
// (ppAlign, 0, width) are not visible; presumably an extract of the low
// `width` bits -- confirm.
191 comb::ConcatOp::create(rewriter, loc, ValueRange{ppRow, shiftBy});
193 loc, ppAlign, 0, width);
194 partialProducts.push_back(ppAlignTrunc);
197 rewriter.replaceOp(op, partialProducts);
// Lowers a PartialProductOp that has a single distinct operand `a` by
// assembling each row from individual bits of `a` and concatenating them.
// NOTE(review): several lines (definitions of zeroWidth, zeroFalse, shiftBy,
// loop control statements, and the return) are not visible in this excerpt.
201 static LogicalResult lowerSqrAndArray(PatternRewriter &rewriter, Value a,
202 PartialProductOp op,
unsigned width) {
204 Location loc = op.getLoc();
205 SmallVector<Value> aBits =
extractBits(rewriter, a);
207 SmallVector<Value> partialProducts;
208 partialProducts.reserve(width);
212 assert(op.getNumResults() <= width &&
213 "Cannot return more results than the operator width");
215 for (
unsigned i = 0; i < op.getNumResults(); ++i) {
216 SmallVector<Value> row;
// Once 2 * i reaches the width, `zeroWidth` is pushed as the row.
219 if (2 * i >= width) {
222 partialProducts.push_back(zeroWidth);
// The row starts with `shiftBy` followed by aBits[i].
228 row.push_back(shiftBy);
230 row.push_back(aBits[i]);
// rowWidth starts at 2 * i + 1; a zeroFalse bit is appended while the row
// is still narrower than the width.
233 unsigned rowWidth = 2 * i + 1;
234 if (rowWidth < width) {
235 row.push_back(zeroFalse);
// Remaining entries for j > i: zeroFalse when j is at or beyond the number
// of results, otherwise aBits[i] AND aBits[j].
// NOTE(review): the action taken when rowWidth == width is not visible.
239 for (
unsigned j = i + 1; j < width; ++j) {
241 if (rowWidth == width)
247 if (j >= op.getNumResults()) {
248 row.push_back(zeroFalse);
253 rewriter.createOrFold<
comb::AndOp>(loc, aBits[i], aBits[j]);
254 row.push_back(ppBit);
// The entries are reversed before being concatenated into the row value.
// NOTE(review): presumably because ConcatOp takes the most significant
// operand first -- confirm.
256 std::reverse(row.begin(), row.end());
257 auto ppRow = comb::ConcatOp::create(rewriter, loc, row);
258 partialProducts.push_back(ppRow);
261 rewriter.replaceOp(op, partialProducts);
// Lowers a PartialProductOp using encoded rows: for every second bit position
// of `b` it derives encNeg / encOne / encTwo signals from three neighbouring
// bits, uses them to select `a` and/or `twoA`, XORs the selection with the
// replicated encNeg, and collects one row per step. The row list is padded
// with `zeroWidth` up to the number of results before replacing the op.
// NOTE(review): many lines are missing from this excerpt (constant
// definitions, the names bound to several createOrFold results, branch
// conditions around the row-alignment code, and the return).
265 static LogicalResult lowerBoothArray(PatternRewriter &rewriter, Value a,
266 Value b, PartialProductOp op,
268 Location loc = op.getLoc();
// Shrink the row width by the number of leading known-zero bits of `a`,
// keeping one of them (note the `- 1`).
275 auto rowWidth = width;
276 auto knownBitsA = comb::computeKnownBits(a);
277 if (!knownBitsA.Zero.isZero()) {
278 if (knownBitsA.Zero.countLeadingOnes() > 1) {
281 rowWidth -= knownBitsA.Zero.countLeadingOnes() - 1;
// twoA is `a` shifted left by `oneRowWidth`.
// NOTE(review): the definition of `oneRowWidth` is not visible; presumably a
// constant 1 of the row width.
290 Value twoA = rewriter.createOrFold<
comb::ShlOp>(loc, a, oneRowWidth);
294 SmallVector<Value> bBits =
extractBits(rewriter, b);
// Substitute the zeroFalse constant for every bit of `b` known to be zero.
297 auto knownBitsB = comb::computeKnownBits(b);
298 if (!knownBitsB.Zero.isZero()) {
299 for (
unsigned i = 0; i < width; ++i)
300 if (knownBitsB.Zero[i])
301 bBits[i] = zeroFalse;
304 SmallVector<Value> partialProducts;
305 partialProducts.reserve(width);
// Step over `b` two bits at a time (i may equal width on the last step).
// Each step reads bits i-1, i and i+1, using zeroFalse outside [0, width).
315 for (
unsigned i = 0; i <= width; i += 2) {
317 Value bim1 = (i == 0) ? zeroFalse : bBits[i - 1];
318 Value bi = (i < width) ? bBits[i] : zeroFalse;
319 Value bip1 = (i + 1 < width) ? bBits[i + 1] : zeroFalse;
// encOne = bi XOR bim1.
324 Value encOne = rewriter.createOrFold<
comb::XorOp>(loc, bi, bim1,
true);
// Inverted copies of the three bits, each formed by XOR with constOne.
327 Value biInv = rewriter.createOrFold<
comb::XorOp>(loc, bi, constOne,
true);
329 rewriter.createOrFold<
comb::XorOp>(loc, bip1, constOne,
true);
331 rewriter.createOrFold<
comb::XorOp>(loc, bim1, constOne,
true);
// andLeft  = bip1Inv & bi & bim1
// andRight = bip1 & biInv & bim1Inv
// The two terms are ORed together below.
// NOTE(review): the name bound to the OR is not visible; presumably encTwo.
333 Value andLeft = rewriter.createOrFold<
comb::AndOp>(
334 loc, ValueRange{bip1Inv, bi, bim1},
true);
335 Value andRight = rewriter.createOrFold<
comb::AndOp>(
336 loc, ValueRange{bip1, biInv, bim1Inv},
true);
338 rewriter.createOrFold<
comb::OrOp>(loc, andLeft, andRight,
true);
// Replicate each encoding signal to rowWidth bits.
341 rewriter.createOrFold<comb::ReplicateOp>(loc, encNeg, rowWidth);
343 rewriter.createOrFold<comb::ReplicateOp>(loc, encOne, rowWidth);
345 rewriter.createOrFold<comb::ReplicateOp>(loc, encTwo, rowWidth);
// Mask twoA and a with their replicated selects, OR the two selections,
// then XOR the result with the replicated encNeg.
348 Value selTwoA = rewriter.createOrFold<
comb::AndOp>(loc, encTwoRepl, twoA);
349 Value selOneA = rewriter.createOrFold<
comb::AndOp>(loc, encOneRepl, a);
351 rewriter.createOrFold<
comb::OrOp>(loc, selTwoA, selOneA,
true);
355 rewriter.createOrFold<
comb::XorOp>(loc, magA, encNegRepl,
true);
// Narrowed rows are extended using encNeg / encNegInv (= bip1Inv) / constOne
// in one of the operand lists below.
// NOTE(review): the conditions choosing between the three operand lists are
// not visible in this excerpt.
368 if (rowWidth < width) {
369 auto padding = width - rowWidth;
370 auto encNegInv = bip1Inv;
375 rewriter.createOrFold<comb::ReplicateOp>(loc, encNeg, padding);
377 loc, ValueRange{encNegPad, ppRow});
381 loc, ValueRange{encNegInv, encNeg, encNeg, ppRow});
385 loc, ValueRange{constOne, encNegInv, ppRow});
// Re-read the width from the extended row; if it is still narrower than
// `width`, it is combined with zeroPad.
389 auto rowWidth = ppRow.getType().getIntOrFloatBitWidth();
390 if (rowWidth < width) {
394 loc, ValueRange{zeroPad, ppRow});
400 partialProducts.push_back(ppRow);
// Rows are combined with zeroFalse and encNegPrev (and, in the second form,
// shiftBy), then narrowed with (0, width) before being collected.
// NOTE(review): the conditions selecting each form and the definitions of
// encNegPrev / shiftBy are not visible in this excerpt.
407 loc, ValueRange{ppRow, zeroFalse, encNegPrev});
409 loc, withSignCorrection, 0, width);
410 partialProducts.push_back(ppAlign);
419 loc, ValueRange{ppRow, zeroFalse, encNegPrev, shiftBy});
421 loc, withSignCorrection, 0, width);
423 partialProducts.push_back(ppAlign);
// NOTE(review): the statement guarded by this size check is not visible.
426 if (partialProducts.size() == op.getNumResults())
// Pad with zeroWidth until there is one value per result.
431 while (partialProducts.size() < op.getNumResults())
432 partialProducts.push_back(zeroWidth);
434 assert(partialProducts.size() == op.getNumResults() &&
435 "Expected number of booth partial products to match results");
437 rewriter.replaceOp(op, partialProducts);
// Rewrite pattern for PosPartialProductOp. Its matchAndRewrite reads the two
// addends and the multiplicand and forwards them to lowerAndArray.
// NOTE(review): the base-class clause, the rest of the constructor and the
// condition guarding the constant replacement are not visible in this excerpt.
442struct DatapathPosPartialProductOpConversion
446 DatapathPosPartialProductOpConversion(MLIRContext *context,
bool forceBooth)
448 forceBooth(forceBooth){};
// Stored from the constructor argument; not read in the code visible here.
450 const bool forceBooth;
452 LogicalResult matchAndRewrite(PosPartialProductOp op,
453 PatternRewriter &rewriter)
const override {
455 Value a = op.getAddend0();
456 Value b = op.getAddend1();
457 Value c = op.getMultiplicand();
458 unsigned width = a.getType().getIntOrFloatBitWidth();
// Replace the op with a constant 0 of the type of result 0.
462 rewriter.replaceOpWithNewOp<
hw::ConstantOp>(op, op.getType(0), 0);
467 return lowerAndArray(rewriter, a, b, c, op, width);
// Lowers a PosPartialProductOp: forms carry = a & b and save = a ^ b, then
// builds one row per result from `c` masked by a save bit ORed with `twoC`
// masked by the matching carry bit. The collected rows replace the op.
// NOTE(review): the tail of the signature, the definitions of zero / twoC /
// shiftBy / zeroPad, and several op-creation lines are not visible here.
471 static LogicalResult lowerAndArray(PatternRewriter &rewriter, Value a,
472 Value b, Value c, PosPartialProductOp op,
475 Location loc = op.getLoc();
// Bitwise carry and save terms of the two addends.
478 auto carry = rewriter.createOrFold<
comb::AndOp>(loc, a, b);
479 auto save = rewriter.createOrFold<
comb::XorOp>(loc, a, b);
481 SmallVector<Value> carryBits =
extractBits(rewriter, carry);
482 SmallVector<Value> saveBits =
extractBits(rewriter, save);
// Shrink the row width by the number of leading known-zero bits of `c`,
// keeping one of them (note the `- 1`).
485 auto rowWidth = width;
486 auto knownBitsC = comb::computeKnownBits(c);
487 if (!knownBitsC.Zero.isZero()) {
488 if (knownBitsC.Zero.countLeadingOnes() > 1) {
491 rowWidth -= knownBitsC.Zero.countLeadingOnes() - 1;
// Concatenation of {c, zero}.
// NOTE(review): the name bound to this value is not visible; presumably it
// feeds `twoC` -- confirm.
499 comb::ConcatOp::create(rewriter, loc, ValueRange{c, zero});
504 SmallVector<Value> partialProducts;
505 partialProducts.reserve(width);
507 assert(op.getNumResults() <= width &&
508 "Cannot return more results than the operator width");
// Row i: (replicated saveBits[i] & c) | (replicated carryBits[i] & twoC).
510 for (
unsigned i = 0; i < op.getNumResults(); ++i) {
512 rewriter.createOrFold<comb::ReplicateOp>(loc, saveBits[i], rowWidth);
514 rewriter.createOrFold<comb::ReplicateOp>(loc, carryBits[i], rowWidth);
516 auto ppRowSave = rewriter.createOrFold<
comb::AndOp>(loc, replSave, c);
518 rewriter.createOrFold<
comb::AndOp>(loc, replCarry, twoC);
520 rewriter.createOrFold<
comb::OrOp>(loc, ppRowSave, ppRowCarry);
521 auto ppAlign = ppRow;
// The row is combined with `shiftBy`.
// NOTE(review): the guard around this concat is not visible here.
525 comb::ConcatOp::create(rewriter, loc, ValueRange{ppRow, shiftBy});
// Row plus offset wider than `width`: a truncated value is collected.
529 if (rowWidth + i > width) {
532 partialProducts.push_back(ppAlignTrunc);
// Row plus offset narrower than `width`: combined with zeroPad covering the
// missing (width - rowWidth - i) bits.
536 if (rowWidth + i < width) {
537 auto padding = width - rowWidth - i;
541 loc, ValueRange{zeroPad, ppAlign}));
545 partialProducts.push_back(ppAlign);
548 rewriter.replaceOp(op, partialProducts);
// Pass class derived from the generated impl::ConvertDatapathToCombBase.
// It overrides runOnOperation (defined out of line) and inherits the base
// class constructors through the using-declaration.
// NOTE(review): the closing of the struct is not visible in this excerpt.
560struct ConvertDatapathToCombPass
561 :
public impl::ConvertDatapathToCombBase<ConvertDatapathToCombPass> {
562 void runOnOperation()
override;
563 using ConvertDatapathToCombBase<
564 ConvertDatapathToCombPass>::ConvertDatapathToCombBase;
// Fragment of a helper that runs the greedy pattern driver on `op` with a
// GreedyRewriteConfig limited to 2 iterations, with `analysis` installed as
// the listener and top-down traversal enabled.
// NOTE(review): the start of the signature, the remaining parameters and the
// return paths are not visible in this excerpt.
569 Operation *op, RewritePatternSet &&
patterns,
573 mlir::GreedyRewriteConfig config;
578 config.setMaxIterations(2).setListener(analysis).setUseTopDownTraversal(
true);
// NOTE(review): the statement executed when the driver fails is not visible.
581 if (failed(mlir::applyPatternsGreedily(op, std::move(
patterns), config)))
// Pass entry point: registers the partial-product conversion patterns and a
// compress conversion pattern, applies them to the current operation, and
// then verifies that no Datapath-dialect operation is left.
// NOTE(review): several lines (remaining pattern constructor arguments, the
// branch taken when lowerCompressToAdd is set, the call whose failure is
// checked, and closing braces) are not visible in this excerpt.
587void ConvertDatapathToCombPass::runOnOperation() {
588 RewritePatternSet
patterns(&getContext());
590 patterns.add<DatapathPartialProductOpConversion,
591 DatapathPosPartialProductOpConversion>(
patterns.getContext(),
// Fetch the incremental longest-path analysis used by the patterns below.
595 analysis = &getAnalysis<synth::IncrementalLongestPathAnalysis>();
596 if (lowerCompressToAdd)
601 patterns.add<DatapathCompressOpConversion>(
patterns.getContext(), analysis);
// A failed pattern application fails the pass.
604 getOperation(), std::move(
patterns), analysis)))
605 return signalPassFailure();
// Walk every operation; the first one whose dialect is still the Datapath
// dialect is reported as an error and stops the walk.
610 auto result = getOperation()->walk([&](Operation *op) {
611 if (llvm::isa_and_nonnull<datapath::DatapathDialect>(op->getDialect())) {
612 op->emitError(
"Datapath operation not converted: ") << *op;
613 return WalkResult::interrupt();
615 return WalkResult::advance();
// An interrupted walk means an unconverted op was found: fail the pass.
617 if (result.wasInterrupted())
618 return signalPassFailure();
assert(baseType &&"element must be base type")
static SmallVector< Value > extractBits(OpBuilder &builder, Value val)
static SmallVector< Value > extractBits(OpBuilder &builder, Value val)
static LogicalResult applyPatternsGreedilyWithTimingInfo(Operation *op, RewritePatternSet &&patterns, synth::IncrementalLongestPathAnalysis *analysis)
The InstanceGraph op interface, see InstanceGraphInterface.td for more details.