14#include "mlir/Analysis/TopologicalSortUtils.h"
15#include "mlir/Dialect/Func/IR/FuncOps.h"
16#include "mlir/IR/PatternMatch.h"
17#include "mlir/Pass/Pass.h"
18#include "mlir/Transforms/GreedyPatternRewriteDriver.h"
19#include "llvm/Support/Debug.h"
20#include "llvm/Support/KnownBits.h"
23#define DEBUG_TYPE "datapath-to-comb"
26#define GEN_PASS_DEF_CONVERTDATAPATHTOCOMB
27#include "circt/Conversion/Passes.h.inc"
31using namespace datapath;
// Convenience wrapper around comb::extractBits that gathers the extracted
// bits of `val` in a freshly created vector instead of an out-parameter.
// NOTE(review): the return statement and closing brace are on lines that are
// not part of this excerpt; presumably `bits` is returned - confirm.
34static SmallVector<Value>
extractBits(OpBuilder &builder, Value val) {
35 SmallVector<Value> bits;
// Delegate the actual extraction to the comb dialect helper.
36 comb::extractBits(builder, val, bits);
// Rewrites a CompressOp into a single comb add over all of its operands.
// The sum becomes the last replacement value; every other result of the op
// is replaced by `zeroOp`.
// NOTE(review): `zeroOp` is defined on a line not shown in this excerpt -
// presumably a zero constant of `width` bits; confirm against the full file.
51 matchAndRewrite(CompressOp op,
52 mlir::PatternRewriter &rewriter)
const override {
53 Location loc = op.getLoc();
54 auto inputs = op.getOperands();
// The bit width is read from the type of the first operand.
55 unsigned width = inputs[0].getType().getIntOrFloatBitWidth();
// One add over every operand; the trailing `true` is presumably the
// two-state flag of comb::AddOp - TODO confirm.
57 auto addOp = comb::AddOp::create(rewriter, loc, inputs,
true);
// getNumResults() - 1 copies of zeroOp, followed by the sum.
60 SmallVector<Value> results(op.getNumResults() - 1, zeroOp);
61 results.push_back(addOp);
62 rewriter.replaceOp(op, results);
// Constructor and rewrite entry point of the CompressOp lowering that takes
// value delays from `analysis` into account.
// matchAndRewrite replaces the op with the values returned by
// comp.compressToHeight(rewriter, targetAddends), after handing `comp` a
// callback that reports analysis->getMaxDelay(v, 0) for a value v.
// NOTE(review): several lines of this definition are not part of this excerpt
// (remaining constructor parameters and body, the body of the loop over the
// inputs, the construction of `comp`, and the failure branch) - the comments
// below only describe what is visible.
69 DatapathCompressOpConversion(MLIRContext *context,
74 matchAndRewrite(CompressOp op,
75 mlir::PatternRewriter &rewriter)
const override {
76 Location loc = op.getLoc();
77 auto inputs = op.getOperands();
// One inner vector per entry; presumably filled with the bits of each
// operand in the loop below - confirm against the full file.
79 SmallVector<SmallVector<Value>> addends;
80 for (
auto input : inputs) {
// Width is taken from the first operand's type.
86 auto width = inputs[0].getType().getIntOrFloatBitWidth();
// The target height handed to compressToHeight equals the op's result count.
87 auto targetAddends = op.getNumResults();
// Provide per-value delays; the rewrite takes a failure path (not shown)
// when withInputDelays fails.
92 if (failed(comp.withInputDelays(
93 [&](Value v) { return analysis->getMaxDelay(v, 0); })))
97 rewriter.replaceOp(op, comp.compressToHeight(rewriter, targetAddends));
// Rewrite pattern for PartialProductOp. matchAndRewrite dispatches to one of
// three static lowering helpers: lowerSqrAndArray, lowerBoothArray or
// lowerAndArray.
// NOTE(review): the conditions guarding the constant-zero replacement and the
// lowerSqrAndArray path are on lines not part of this excerpt; presumably they
// are a zero-width check and an lhs == rhs check respectively - confirm.
105struct DatapathPartialProductOpConversion :
OpRewritePattern<PartialProductOp> {
108 DatapathPartialProductOpConversion(MLIRContext *context,
bool forceBooth)
// When true, lowerBoothArray is chosen regardless of the result count (see
// the dispatch at the end of matchAndRewrite).
111 const bool forceBooth;
113 LogicalResult matchAndRewrite(PartialProductOp op,
114 PatternRewriter &rewriter)
const override {
116 Value a = op.getLhs();
117 Value b = op.getRhs();
// Width is taken from the lhs type.
118 unsigned width = a.getType().getIntOrFloatBitWidth();
// Replace the op by a constant 0 of the type of result 0.
122 rewriter.replaceOpWithNewOp<
hw::ConstantOp>(op, op.getType(0), 0);
// Squarer-specific lowering; only `a` is passed on.
139 return lowerSqrAndArray(rewriter, a, op, width);
// Booth lowering for more than 16 results, or when explicitly forced.
143 if (op.getNumResults() > 16 || forceBooth)
144 return lowerBoothArray(rewriter, a, b, op, width);
// Otherwise fall back to the plain AND array.
146 return lowerAndArray(rewriter, a, b, op, width);
// AND-array lowering of PartialProductOp. For result index i, bit i of `b` is
// replicated to `width` bits and ANDed with `a`; the resulting row is then
// concatenated with `shiftBy` and a `width`-wide value starting at bit 0 is
// taken from the concatenation. The op is replaced by the collected rows.
// NOTE(review): `shiftBy`, the targets of the replicate/concat/extract calls
// and the branch that pushes the unshifted `ppRow` are on lines not part of
// this excerpt; presumably the unshifted push is the i == 0 case - confirm.
150 static LogicalResult lowerAndArray(PatternRewriter &rewriter, Value a,
151 Value b, PartialProductOp op,
154 Location loc = op.getLoc();
156 SmallVector<Value> bBits =
extractBits(rewriter, b);
158 SmallVector<Value> partialProducts;
159 partialProducts.reserve(width);
// The loop indexes bBits with every result index, so the result count must
// not exceed the operand width.
162 assert(op.getNumResults() <= width &&
163 "Cannot return more results than the operator width");
// One partial-product row per result.
165 for (
unsigned i = 0; i < op.getNumResults(); ++i) {
167 rewriter.createOrFold<comb::ReplicateOp>(loc, bBits[i], width);
168 auto ppRow = rewriter.createOrFold<
comb::AndOp>(loc, repl, a);
170 partialProducts.push_back(ppRow);
175 comb::ConcatOp::create(rewriter, loc, ValueRange{ppRow, shiftBy});
177 loc, ppAlign, 0, width);
178 partialProducts.push_back(ppAlignTrunc);
181 rewriter.replaceOp(op, partialProducts);
// Lowering of PartialProductOp for the case where only one operand `a` is
// involved (called from the squarer path of matchAndRewrite). Each row is
// assembled element by element in `row`, reversed, and then concatenated into
// a single value; rows with 2 * i >= width are replaced by `zeroWidth`.
// NOTE(review): `zeroWidth`, `zeroFalse`, `shiftBy` and several control-flow
// statements (continue/break, the guard around the shiftBy push) are on lines
// not part of this excerpt - the comments below describe only what is visible.
185 static LogicalResult lowerSqrAndArray(PatternRewriter &rewriter, Value a,
186 PartialProductOp op,
unsigned width) {
188 Location loc = op.getLoc();
189 SmallVector<Value> aBits =
extractBits(rewriter, a);
191 SmallVector<Value> partialProducts;
192 partialProducts.reserve(width);
// aBits is indexed with every result index below.
196 assert(op.getNumResults() <= width &&
197 "Cannot return more results than the operator width");
199 for (
unsigned i = 0; i < op.getNumResults(); ++i) {
200 SmallVector<Value> row;
// Rows whose first element would sit at or beyond bit `width` contribute
// nothing and become zeroWidth.
203 if (2 * i >= width) {
206 partialProducts.push_back(zeroWidth);
212 row.push_back(shiftBy);
// The a_i * a_i term is just a_i.
214 row.push_back(aBits[i]);
// Number of bits accounted for so far in this row.
217 unsigned rowWidth = 2 * i + 1;
218 if (rowWidth < width) {
219 row.push_back(zeroFalse);
// Cross terms a_i & a_j for j > i.
223 for (
unsigned j = i + 1; j < width; ++j) {
225 if (rowWidth == width)
// Columns at or beyond the number of results are filled with zeroFalse.
231 if (j >= op.getNumResults()) {
232 row.push_back(zeroFalse);
237 rewriter.createOrFold<
comb::AndOp>(loc, aBits[i], aBits[j]);
238 row.push_back(ppBit);
// The row was collected in the opposite order to the one passed to
// comb::ConcatOp, hence the reversal.
240 std::reverse(row.begin(), row.end());
241 auto ppRow = comb::ConcatOp::create(rewriter, loc, row);
242 partialProducts.push_back(ppRow);
245 rewriter.replaceOp(op, partialProducts);
// Booth-style lowering of PartialProductOp. The bits of `b` are consumed two
// at a time (the loop advances i by 2) using the window (b[i+1], b[i],
// b[i-1]); from that window the code derives selectors for `a`, for
// `twoA` (a shifted left by oneRowWidth) and a negate signal, builds one row
// per window, and finally pads the row list with `zeroWidth` up to the number
// of results before replacing the op.
// NOTE(review): many lines of this function are not part of this excerpt,
// including the definitions of `zeroFalse`, `constOne`, `oneRowWidth`,
// `encNeg`, `encTwo`, `magA`, `ppRow`, `shiftBy`, `zeroWidth` and the targets
// of several createOrFold/Concat calls. Comments below are limited to what the
// visible lines establish; anything else is marked as an assumption.
249 static LogicalResult lowerBoothArray(PatternRewriter &rewriter, Value a,
250 Value b, PartialProductOp op,
252 Location loc = op.getLoc();
// Rows start out `width` bits wide and are narrowed when more than one
// leading bit of `a` is known to be zero (one such bit is kept).
259 auto rowWidth = width;
260 auto knownBitsA = comb::computeKnownBits(a);
261 if (!knownBitsA.Zero.isZero()) {
262 if (knownBitsA.Zero.countLeadingOnes() > 1) {
265 rowWidth -= knownBitsA.Zero.countLeadingOnes() - 1;
// `a` shifted left by oneRowWidth; presumably 2 * a - confirm oneRowWidth.
274 Value twoA = rewriter.createOrFold<
comb::ShlOp>(loc, a, oneRowWidth);
278 SmallVector<Value> bBits =
extractBits(rewriter, b);
// Substitute zeroFalse for every bit of b that is known to be zero.
281 auto knownBitsB = comb::computeKnownBits(b);
282 if (!knownBitsB.Zero.isZero()) {
283 for (
unsigned i = 0; i < width; ++i)
284 if (knownBitsB.Zero[i])
285 bBits[i] = zeroFalse;
288 SmallVector<Value> partialProducts;
289 partialProducts.reserve(width);
// Walk b in steps of two bits; note the inclusive bound i <= width.
299 for (
unsigned i = 0; i <= width; i += 2) {
// Window bits; positions outside [0, width) read as zeroFalse.
301 Value bim1 = (i == 0) ? zeroFalse : bBits[i - 1];
302 Value bi = (i < width) ? bBits[i] : zeroFalse;
303 Value bip1 = (i + 1 < width) ? bBits[i + 1] : zeroFalse;
// Select 1 * a when the two lower window bits differ.
308 Value encOne = rewriter.createOrFold<
comb::XorOp>(loc, bi, bim1,
true);
// Inverted window bits (XOR with constOne).
311 Value biInv = rewriter.createOrFold<
comb::XorOp>(loc, bi, constOne,
true);
313 rewriter.createOrFold<
comb::XorOp>(loc, bip1, constOne,
true);
315 rewriter.createOrFold<
comb::XorOp>(loc, bim1, constOne,
true);
// Window (b[i+1], b[i], b[i-1]) == 0,1,1.
317 Value andLeft = rewriter.createOrFold<
comb::AndOp>(
318 loc, ValueRange{bip1Inv, bi, bim1},
true);
// Window (b[i+1], b[i], b[i-1]) == 1,0,0.
319 Value andRight = rewriter.createOrFold<
comb::AndOp>(
320 loc, ValueRange{bip1, biInv, bim1Inv},
true);
322 rewriter.createOrFold<
comb::OrOp>(loc, andLeft, andRight,
true);
325 rewriter.createOrFold<comb::ReplicateOp>(loc, encNeg, rowWidth);
327 rewriter.createOrFold<comb::ReplicateOp>(loc, encOne, rowWidth);
329 rewriter.createOrFold<comb::ReplicateOp>(loc, encTwo, rowWidth);
// Mask twoA and a with their replicated selectors.
332 Value selTwoA = rewriter.createOrFold<
comb::AndOp>(loc, encTwoRepl, twoA);
333 Value selOneA = rewriter.createOrFold<
comb::AndOp>(loc, encOneRepl, a);
335 rewriter.createOrFold<
comb::OrOp>(loc, selTwoA, selOneA,
true);
339 rewriter.createOrFold<
comb::XorOp>(loc, magA, encNegRepl,
true);
// Rows narrower than `width` are extended; the visible concat operand lists
// use encNeg, its inverse and constOne (presumably a sign-extension
// scheme - confirm against the full file).
352 if (rowWidth < width) {
353 auto padding = width - rowWidth;
354 auto encNegInv = bip1Inv;
359 rewriter.createOrFold<comb::ReplicateOp>(loc, encNeg, padding);
361 loc, ValueRange{encNegPad, ppRow});
365 loc, ValueRange{encNegInv, encNeg, encNeg, ppRow});
369 loc, ValueRange{constOne, encNegInv, ppRow});
// Re-declares rowWidth from the actual type of ppRow (shadows the earlier
// rowWidth) and pads with zeroPad if the row is still too narrow.
373 auto rowWidth = ppRow.getType().getIntOrFloatBitWidth();
374 if (rowWidth < width) {
378 loc, ValueRange{zeroPad, ppRow});
384 partialProducts.push_back(ppRow);
390 assert(i >= 2 &&
"Expected i to be at least 2 for sign correction");
393 loc, ValueRange{ppRow, zeroFalse, encNegPrev});
395 loc, withSignCorrection, 0, width);
399 rewriter.createOrFold<
comb::ShlOp>(loc, ppAlignPre, shiftBy);
400 partialProducts.push_back(ppAlign);
403 if (partialProducts.size() == op.getNumResults())
// Fill any remaining results with zeroWidth.
408 while (partialProducts.size() < op.getNumResults())
409 partialProducts.push_back(zeroWidth);
411 assert(partialProducts.size() == op.getNumResults() &&
412 "Expected number of booth partial products to match results");
414 rewriter.replaceOp(op, partialProducts);
// Rewrite pattern for PosPartialProductOp, which has two addends and a
// multiplicand. matchAndRewrite either replaces the op with a constant 0 of
// the type of result 0, or forwards to the static lowerAndArray helper.
// NOTE(review): the base-class list, the condition guarding the constant
// replacement and any use of `forceBooth` inside matchAndRewrite are on lines
// not part of this excerpt.
419struct DatapathPosPartialProductOpConversion
423 DatapathPosPartialProductOpConversion(MLIRContext *context,
bool forceBooth)
425 forceBooth(forceBooth){};
// Stored from the constructor argument of the same name.
427 const bool forceBooth;
429 LogicalResult matchAndRewrite(PosPartialProductOp op,
430 PatternRewriter &rewriter)
const override {
432 Value a = op.getAddend0();
433 Value b = op.getAddend1();
434 Value c = op.getMultiplicand();
// Width is taken from the type of the first addend.
435 unsigned width = a.getType().getIntOrFloatBitWidth();
439 rewriter.replaceOpWithNewOp<
hw::ConstantOp>(op, op.getType(0), 0);
444 return lowerAndArray(rewriter, a, b, c, op, width);
// AND-array lowering of PosPartialProductOp. The addends are first split
// bitwise into carry = a & b and save = a ^ b. For result index i the row is
// (save[i] replicated & c) | (carry[i] replicated & twoC), where twoC is built
// from the concatenation {c, zero} truncated to rowWidth bits. Rows are then
// aligned with `shiftBy` and either truncated or zero-padded to `width`.
// NOTE(review): `zero`, `shiftBy`, `zeroPad` and the targets of several calls
// are on lines not part of this excerpt.
// NOTE(review): twoCWider/twoC use rewriter.create<Op>(...) whereas the other
// visible ops use Op::create(rewriter, ...) or createOrFold - consider
// unifying the builder style.
448 static LogicalResult lowerAndArray(PatternRewriter &rewriter, Value a,
449 Value b, Value c, PosPartialProductOp op,
452 Location loc = op.getLoc();
// For any bit position, a & b and a ^ b are never both 1, which is why the
// two masked rows can later be merged with OR.
455 auto carry = rewriter.createOrFold<
comb::AndOp>(loc, a, b);
456 auto save = rewriter.createOrFold<
comb::XorOp>(loc, a, b);
458 SmallVector<Value> carryBits =
extractBits(rewriter, carry);
459 SmallVector<Value> saveBits =
extractBits(rewriter, save);
// Narrow the rows when more than one leading bit of c is known to be zero
// (one such bit is kept).
462 auto rowWidth = width;
463 auto knownBitsC = comb::computeKnownBits(c);
464 if (!knownBitsC.Zero.isZero()) {
465 if (knownBitsC.Zero.countLeadingOnes() > 1) {
468 rowWidth -= knownBitsC.Zero.countLeadingOnes() - 1;
// c with `zero` appended below it, then cut to rowWidth bits starting at
// bit 0; presumably `zero` is one bit wide, making this 2 * c - confirm.
475 Value twoCWider = rewriter.create<
comb::ConcatOp>(loc, ValueRange{c, zero});
476 Value twoC = rewriter.create<
comb::ExtractOp>(loc, twoCWider, 0, rowWidth);
480 SmallVector<Value> partialProducts;
481 partialProducts.reserve(width);
// saveBits/carryBits are indexed with every result index below.
483 assert(op.getNumResults() <= width &&
484 "Cannot return more results than the operator width");
486 for (
unsigned i = 0; i < op.getNumResults(); ++i) {
488 rewriter.createOrFold<comb::ReplicateOp>(loc, saveBits[i], rowWidth);
490 rewriter.createOrFold<comb::ReplicateOp>(loc, carryBits[i], rowWidth);
492 auto ppRowSave = rewriter.createOrFold<
comb::AndOp>(loc, replSave, c);
494 rewriter.createOrFold<
comb::AndOp>(loc, replCarry, twoC);
496 rewriter.createOrFold<
comb::OrOp>(loc, ppRowSave, ppRowCarry);
497 auto ppAlign = ppRow;
501 comb::ConcatOp::create(rewriter, loc, ValueRange{ppRow, shiftBy});
// Shifted row is wider than the result: a truncated value is pushed.
505 if (rowWidth + i > width) {
508 partialProducts.push_back(ppAlignTrunc);
// Shifted row is narrower than the result: pad with zeroPad on top.
512 if (rowWidth + i < width) {
513 auto padding = width - rowWidth - i;
517 loc, ValueRange{zeroPad, ppAlign}));
521 partialProducts.push_back(ppAlign);
524 rewriter.replaceOp(op, partialProducts);
// Pass class for the Datapath-to-Comb conversion. It derives from the
// generated base impl::ConvertDatapathToCombBase, inherits that base's
// constructors, and overrides runOnOperation (defined out of line).
// NOTE(review): the closing of the struct is on a line not part of this
// excerpt.
536struct ConvertDatapathToCombPass
537 :
public impl::ConvertDatapathToCombBase<ConvertDatapathToCombPass> {
538 void runOnOperation()
override;
// Re-export the base-class constructors.
539 using ConvertDatapathToCombBase<
540 ConvertDatapathToCombPass>::ConvertDatapathToCombBase;
// Parameter list and body fragment of the helper that runs the greedy pattern
// driver on `op` with a customised configuration: at most 2 iterations,
// `analysis` installed as the rewrite listener, and top-down traversal
// enabled.
// NOTE(review): the function header, the remaining parameter(s), and the
// success/failure returns are on lines not part of this excerpt.
545 Operation *op, RewritePatternSet &&
patterns,
549 mlir::GreedyRewriteConfig config;
// `analysis` is registered as listener, presumably so it is notified of IR
// changes made by the driver - confirm against the analysis class.
554 config.setMaxIterations(2).setListener(analysis).setUseTopDownTraversal(
true);
// The pattern set is moved into the driver.
557 if (failed(mlir::applyPatternsGreedily(op, std::move(
patterns), config)))
// Pass entry point. Registers the partial-product patterns and a CompressOp
// pattern, applies them, and then walks the operation to verify that no
// operation of the Datapath dialect is left; any leftover op is reported as an
// error and fails the pass.
// NOTE(review): some lines are not part of this excerpt, including the
// remaining arguments of the first patterns.add call, the statement executed
// when `lowerCompressToAdd` is set, and the start of the call whose failure
// leads to the first signalPassFailure (presumably
// applyPatternsGreedilyWithTimingInfo - confirm).
563void ConvertDatapathToCombPass::runOnOperation() {
564 RewritePatternSet
patterns(&getContext());
566 patterns.add<DatapathPartialProductOpConversion,
567 DatapathPosPartialProductOpConversion>(
patterns.getContext(),
// Fetch the longest-path analysis used by the CompressOp lowering and the
// rewrite driver.
571 analysis = &getAnalysis<synth::IncrementalLongestPathAnalysis>();
572 if (lowerCompressToAdd)
577 patterns.add<DatapathCompressOpConversion>(
patterns.getContext(), analysis);
580 getOperation(), std::move(
patterns), analysis)))
581 return signalPassFailure();
// Post-condition check: interrupt the walk at the first operation whose
// dialect is the Datapath dialect.
586 auto result = getOperation()->walk([&](Operation *op) {
587 if (llvm::isa_and_nonnull<datapath::DatapathDialect>(op->getDialect())) {
588 op->emitError(
"Datapath operation not converted: ") << *op;
589 return WalkResult::interrupt();
591 return WalkResult::advance();
593 if (result.wasInterrupted())
594 return signalPassFailure();
assert(baseType &&"element must be base type")
static SmallVector< Value > extractBits(OpBuilder &builder, Value val)
static SmallVector< Value > extractBits(OpBuilder &builder, Value val)
static LogicalResult applyPatternsGreedilyWithTimingInfo(Operation *op, RewritePatternSet &&patterns, synth::IncrementalLongestPathAnalysis *analysis)
The InstanceGraph op interface, see InstanceGraphInterface.td for more details.