24#include "mlir/Conversion/ArithToLLVM/ArithToLLVM.h"
25#include "mlir/Conversion/ControlFlowToLLVM/ControlFlowToLLVM.h"
26#include "mlir/Conversion/FuncToLLVM/ConvertFuncToLLVM.h"
27#include "mlir/Conversion/IndexToLLVM/IndexToLLVM.h"
28#include "mlir/Conversion/LLVMCommon/ConversionTarget.h"
29#include "mlir/Conversion/LLVMCommon/TypeConverter.h"
30#include "mlir/Conversion/SCFToControlFlow/SCFToControlFlow.h"
31#include "mlir/Dialect/ControlFlow/IR/ControlFlowOps.h"
32#include "mlir/Dialect/Func/IR/FuncOps.h"
33#include "mlir/Dialect/Index/IR/IndexOps.h"
34#include "mlir/Dialect/LLVMIR/FunctionCallUtils.h"
35#include "mlir/Dialect/LLVMIR/LLVMAttrs.h"
36#include "mlir/Dialect/LLVMIR/LLVMDialect.h"
37#include "mlir/Dialect/SCF/IR/SCF.h"
38#include "mlir/IR/BuiltinDialect.h"
39#include "mlir/Pass/Pass.h"
40#include "mlir/Transforms/DialectConversion.h"
41#include "llvm/Support/Debug.h"
42#include "llvm/Support/FormatVariadic.h"
46#define DEBUG_TYPE "lower-arc-to-llvm"
49#define GEN_PASS_DEF_LOWERARCTOLLVM
50#include "circt/Conversion/Passes.h.inc"
57using namespace runtime;
64 return modelName +
"_eval";
70 using OpConversionPattern::OpConversionPattern;
72 matchAndRewrite(arc::ModelOp op, OpAdaptor adaptor,
73 ConversionPatternRewriter &rewriter)
const final {
75 IRRewriter::InsertionGuard guard(rewriter);
76 rewriter.setInsertionPointToEnd(&op.getBodyBlock());
77 func::ReturnOp::create(rewriter, op.getLoc());
82 rewriter.getFunctionType(op.getBody().getArgumentTypes(), {});
84 mlir::func::FuncOp::create(rewriter, op.getLoc(), funcName, funcType);
85 rewriter.inlineRegionBefore(op.getRegion(), func.getBody(), func.end());
91struct AllocStorageOpLowering
93 using OpConversionPattern::OpConversionPattern;
95 matchAndRewrite(arc::AllocStorageOp op, OpAdaptor adaptor,
96 ConversionPatternRewriter &rewriter)
const final {
97 auto type = typeConverter->convertType(op.getType());
98 if (!op.getOffset().has_value())
100 rewriter.replaceOpWithNewOp<LLVM::GEPOp>(op, type, rewriter.getI8Type(),
102 LLVM::GEPArg(*op.getOffset()));
107template <
class ConcreteOp>
111 using OpAdaptor =
typename ConcreteOp::Adaptor;
114 matchAndRewrite(ConcreteOp op, OpAdaptor adaptor,
115 ConversionPatternRewriter &rewriter)
const final {
117 auto offsetAttr = op->template getAttrOfType<IntegerAttr>(
"offset");
120 Value ptr = LLVM::GEPOp::create(
121 rewriter, op->getLoc(), adaptor.getStorage().getType(),
122 rewriter.getI8Type(), adaptor.getStorage(),
123 LLVM::GEPArg(offsetAttr.getValue().getZExtValue()));
124 rewriter.replaceOp(op, ptr);
130 using OpConversionPattern::OpConversionPattern;
132 matchAndRewrite(arc::StateReadOp op, OpAdaptor adaptor,
133 ConversionPatternRewriter &rewriter)
const final {
134 auto type = typeConverter->convertType(op.getType());
135 rewriter.replaceOpWithNewOp<LLVM::LoadOp>(op, type, adaptor.getState());
141 using OpConversionPattern::OpConversionPattern;
143 matchAndRewrite(arc::StateWriteOp op, OpAdaptor adaptor,
144 ConversionPatternRewriter &rewriter)
const final {
145 if (adaptor.getCondition()) {
146 rewriter.replaceOpWithNewOp<scf::IfOp>(
147 op, adaptor.getCondition(), [&](
auto &builder,
auto loc) {
148 LLVM::StoreOp::create(builder, loc, adaptor.getValue(),
150 scf::YieldOp::create(builder, loc);
153 rewriter.replaceOpWithNewOp<LLVM::StoreOp>(op, adaptor.getValue(),
161 using OpConversionPattern::OpConversionPattern;
163 matchAndRewrite(arc::AllocMemoryOp op, OpAdaptor adaptor,
164 ConversionPatternRewriter &rewriter)
const final {
165 auto offsetAttr = op->getAttrOfType<IntegerAttr>(
"offset");
168 Value ptr = LLVM::GEPOp::create(
169 rewriter, op.getLoc(), adaptor.getStorage().getType(),
170 rewriter.getI8Type(), adaptor.getStorage(),
171 LLVM::GEPArg(offsetAttr.getValue().getZExtValue()));
173 rewriter.replaceOp(op, ptr);
179 using OpConversionPattern::OpConversionPattern;
181 matchAndRewrite(arc::StorageGetOp op, OpAdaptor adaptor,
182 ConversionPatternRewriter &rewriter)
const final {
183 Value offset = LLVM::ConstantOp::create(
184 rewriter, op.getLoc(), rewriter.getI32Type(), op.getOffsetAttr());
185 Value ptr = LLVM::GEPOp::create(
186 rewriter, op.getLoc(), adaptor.getStorage().getType(),
187 rewriter.getI8Type(), adaptor.getStorage(), offset);
188 rewriter.replaceOp(op, ptr);
198static MemoryAccess prepareMemoryAccess(Location loc, Value memory,
199 Value address, MemoryType type,
200 ConversionPatternRewriter &rewriter) {
201 auto zextAddrType = rewriter.getIntegerType(
202 cast<IntegerType>(address.getType()).getWidth() + 1);
203 Value
addr = LLVM::ZExtOp::create(rewriter, loc, zextAddrType, address);
205 LLVM::ConstantOp::create(rewriter, loc, zextAddrType,
206 rewriter.getI32IntegerAttr(type.getNumWords()));
207 Value withinBounds = LLVM::ICmpOp::create(
208 rewriter, loc, LLVM::ICmpPredicate::ult, addr, addrLimit);
209 Value ptr = LLVM::GEPOp::create(
210 rewriter, loc, LLVM::LLVMPointerType::get(memory.getContext()),
211 rewriter.getIntegerType(type.getStride() * 8), memory, ValueRange{addr});
212 return {ptr, withinBounds};
216 using OpConversionPattern::OpConversionPattern;
218 matchAndRewrite(arc::MemoryReadOp op, OpAdaptor adaptor,
219 ConversionPatternRewriter &rewriter)
const final {
220 auto type = typeConverter->convertType(op.getType());
221 auto memoryType = cast<MemoryType>(op.getMemory().getType());
223 prepareMemoryAccess(op.getLoc(), adaptor.getMemory(),
224 adaptor.getAddress(), memoryType, rewriter);
228 rewriter.replaceOpWithNewOp<scf::IfOp>(
229 op, access.withinBounds,
230 [&](
auto &builder,
auto loc) {
231 Value loadOp = LLVM::LoadOp::create(
232 builder, loc, memoryType.getWordType(), access.ptr);
233 scf::YieldOp::create(builder, loc, loadOp);
235 [&](
auto &builder,
auto loc) {
236 Value zeroValue = LLVM::ConstantOp::create(
237 builder, loc, type, builder.getI64IntegerAttr(0));
238 scf::YieldOp::create(builder, loc, zeroValue);
245 using OpConversionPattern::OpConversionPattern;
247 matchAndRewrite(arc::MemoryWriteOp op, OpAdaptor adaptor,
248 ConversionPatternRewriter &rewriter)
const final {
249 auto access = prepareMemoryAccess(
250 op.getLoc(), adaptor.getMemory(), adaptor.getAddress(),
251 cast<MemoryType>(op.getMemory().getType()), rewriter);
252 auto enable = access.withinBounds;
253 if (adaptor.getEnable())
254 enable = LLVM::AndOp::create(rewriter, op.getLoc(), adaptor.getEnable(),
258 rewriter.replaceOpWithNewOp<scf::IfOp>(
259 op, enable, [&](
auto &builder,
auto loc) {
260 LLVM::StoreOp::create(builder, loc, adaptor.getData(), access.ptr);
261 scf::YieldOp::create(builder, loc);
269 using OpConversionPattern::OpConversionPattern;
271 matchAndRewrite(seq::ClockGateOp op, OpAdaptor adaptor,
272 ConversionPatternRewriter &rewriter)
const final {
273 rewriter.replaceOpWithNewOp<LLVM::AndOp>(op, adaptor.getInput(),
274 adaptor.getEnable());
281 using OpConversionPattern::OpConversionPattern;
283 matchAndRewrite(seq::ClockInverterOp op, OpAdaptor adaptor,
284 ConversionPatternRewriter &rewriter)
const final {
285 auto constTrue = LLVM::ConstantOp::create(rewriter, op->getLoc(),
286 rewriter.getI1Type(), 1);
287 rewriter.replaceOpWithNewOp<LLVM::XOrOp>(op, adaptor.getInput(), constTrue);
293 using OpConversionPattern::OpConversionPattern;
295 matchAndRewrite(arc::ZeroCountOp op, OpAdaptor adaptor,
296 ConversionPatternRewriter &rewriter)
const override {
298 IntegerAttr isZeroPoison = rewriter.getBoolAttr(
true);
300 if (op.getPredicate() == arc::ZeroCountPredicate::leading) {
301 rewriter.replaceOpWithNewOp<LLVM::CountLeadingZerosOp>(
302 op, adaptor.getInput().getType(), adaptor.getInput(), isZeroPoison);
306 rewriter.replaceOpWithNewOp<LLVM::CountTrailingZerosOp>(
307 op, adaptor.getInput().getType(), adaptor.getInput(), isZeroPoison);
313 using OpConversionPattern::OpConversionPattern;
315 matchAndRewrite(seq::ConstClockOp op, OpAdaptor adaptor,
316 ConversionPatternRewriter &rewriter)
const override {
317 rewriter.replaceOpWithNewOp<LLVM::ConstantOp>(
318 op, rewriter.getI1Type(),
static_cast<int64_t
>(op.getValue()));
323template <
typename OpTy>
326 using OpAdaptor =
typename OpTy::Adaptor;
328 matchAndRewrite(OpTy op, OpAdaptor adaptor,
329 ConversionPatternRewriter &rewriter)
const override {
330 rewriter.replaceOp(op, adaptor.getInput());
344 size_t numStateBytes;
345 llvm::DenseMap<StringRef, StateInfo> states;
346 mlir::FlatSymbolRefAttr initialFnSymbol;
347 mlir::FlatSymbolRefAttr finalFnSymbol;
350template <
typename OpTy>
352 ModelAwarePattern(
const TypeConverter &typeConverter, MLIRContext *
context,
353 llvm::DenseMap<StringRef, ModelInfoMap> &modelInfo)
355 modelInfo(modelInfo) {}
358 Value createPtrToPortState(ConversionPatternRewriter &rewriter, Location loc,
359 Value state,
const StateInfo &port)
const {
360 MLIRContext *ctx = rewriter.getContext();
361 return LLVM::GEPOp::create(rewriter, loc, LLVM::LLVMPointerType::get(ctx),
362 IntegerType::get(ctx, 8), state,
363 LLVM::GEPArg(port.offset));
366 llvm::DenseMap<StringRef, ModelInfoMap> &modelInfo;
371struct SimInstantiateOpLowering
372 :
public ModelAwarePattern<arc::SimInstantiateOp> {
373 using ModelAwarePattern::ModelAwarePattern;
376 matchAndRewrite(arc::SimInstantiateOp op, OpAdaptor adaptor,
377 ConversionPatternRewriter &rewriter)
const final {
378 auto modelIt = modelInfo.find(
379 cast<SimModelInstanceType>(op.getBody().getArgument(0).getType())
382 ModelInfoMap &model = modelIt->second;
384 bool useRuntime = op.getRuntimeModel().has_value();
386 ModuleOp moduleOp = op->getParentOfType<ModuleOp>();
390 ConversionPatternRewriter::InsertionGuard guard(rewriter);
394 Type convertedIndex = typeConverter->convertType(rewriter.getIndexType());
395 Location loc = op.getLoc();
400 auto ptrTy = LLVM::LLVMPointerType::get(getContext());
404 if (op.getRuntimeArgs().has_value()) {
405 SmallVector<int8_t> argStringVec(op.getRuntimeArgsAttr().begin(),
406 op.getRuntimeArgsAttr().end());
407 argStringVec.push_back(
'\0');
408 auto strAttr = mlir::DenseElementsAttr::get(
409 mlir::RankedTensorType::get({(int64_t)argStringVec.size()},
410 rewriter.getI8Type()),
411 llvm::ArrayRef(argStringVec));
413 auto arrayCst = LLVM::ConstantOp::create(
415 LLVM::LLVMArrayType::get(rewriter.getI8Type(), argStringVec.size()),
417 auto cst1 = LLVM::ConstantOp::create(rewriter, loc,
418 rewriter.getI32IntegerAttr(1));
419 runtimeArgs = LLVM::AllocaOp::create(rewriter, loc, ptrTy,
420 arrayCst.getType(), cst1);
421 LLVM::LifetimeStartOp::create(rewriter, loc, runtimeArgs);
422 LLVM::StoreOp::create(rewriter, loc, arrayCst, runtimeArgs);
424 runtimeArgs = LLVM::ZeroOp::create(rewriter, loc, ptrTy).getResult();
427 auto rtModelPtr = LLVM::AddressOfOp::create(rewriter, loc, ptrTy,
428 op.getRuntimeModelAttr())
431 LLVM::CallOp::create(rewriter, loc, {ptrTy},
432 runtime::APICallbacks::symNameAllocInstance,
433 {rtModelPtr, runtimeArgs})
436 if (op.getRuntimeArgs().has_value())
437 LLVM::LifetimeEndOp::create(rewriter, loc, runtimeArgs);
441 FailureOr<LLVM::LLVMFuncOp> mallocFunc =
442 LLVM::lookupOrCreateMallocFn(rewriter, moduleOp, convertedIndex);
443 if (failed(mallocFunc))
446 Value numStateBytes = LLVM::ConstantOp::create(
447 rewriter, loc, convertedIndex, model.numStateBytes);
448 allocated = LLVM::CallOp::create(rewriter, loc, mallocFunc.value(),
449 ValueRange{numStateBytes})
452 LLVM::ConstantOp::create(rewriter, loc, rewriter.getI8Type(), 0);
453 LLVM::MemsetOp::create(rewriter, loc, allocated, zero, numStateBytes,
458 if (model.initialFnSymbol) {
459 auto initialFnType = LLVM::LLVMFunctionType::get(
460 LLVM::LLVMVoidType::get(op.getContext()),
461 {LLVM::LLVMPointerType::get(op.getContext())});
462 LLVM::CallOp::create(rewriter, loc, initialFnType, model.initialFnSymbol,
463 ValueRange{allocated});
468 LLVM::CallOp::create(rewriter, loc, TypeRange{},
469 runtime::APICallbacks::symNameOnInitialized,
473 rewriter.inlineBlockBefore(&adaptor.getBody().getBlocks().front(), op,
477 if (model.finalFnSymbol) {
478 auto finalFnType = LLVM::LLVMFunctionType::get(
479 LLVM::LLVMVoidType::get(op.getContext()),
480 {LLVM::LLVMPointerType::get(op.getContext())});
481 LLVM::CallOp::create(rewriter, loc, finalFnType, model.finalFnSymbol,
482 ValueRange{allocated});
486 LLVM::CallOp::create(rewriter, loc, TypeRange{},
487 runtime::APICallbacks::symNameDeleteInstance,
490 FailureOr<LLVM::LLVMFuncOp> freeFunc =
491 LLVM::lookupOrCreateFreeFn(rewriter, moduleOp);
492 if (failed(freeFunc))
495 LLVM::CallOp::create(rewriter, loc, freeFunc.value(),
496 ValueRange{allocated});
499 rewriter.eraseOp(op);
504struct SimSetInputOpLowering :
public ModelAwarePattern<arc::SimSetInputOp> {
505 using ModelAwarePattern::ModelAwarePattern;
508 matchAndRewrite(arc::SimSetInputOp op, OpAdaptor adaptor,
509 ConversionPatternRewriter &rewriter)
const final {
511 modelInfo.find(cast<SimModelInstanceType>(op.getInstance().getType())
514 ModelInfoMap &model = modelIt->second;
516 auto portIt = model.states.find(op.getInput());
517 if (portIt == model.states.end()) {
520 rewriter.eraseOp(op);
524 StateInfo &port = portIt->second;
525 Value statePtr = createPtrToPortState(rewriter, op.getLoc(),
526 adaptor.getInstance(), port);
527 rewriter.replaceOpWithNewOp<LLVM::StoreOp>(op, adaptor.getValue(),
534struct SimGetPortOpLowering :
public ModelAwarePattern<arc::SimGetPortOp> {
535 using ModelAwarePattern::ModelAwarePattern;
538 matchAndRewrite(arc::SimGetPortOp op, OpAdaptor adaptor,
539 ConversionPatternRewriter &rewriter)
const final {
541 modelInfo.find(cast<SimModelInstanceType>(op.getInstance().getType())
544 ModelInfoMap &model = modelIt->second;
546 auto type = typeConverter->convertType(op.getValue().getType());
549 auto portIt = model.states.find(op.getPort());
550 if (portIt == model.states.end()) {
553 rewriter.replaceOpWithNewOp<LLVM::ConstantOp>(op, type, 0);
557 StateInfo &port = portIt->second;
558 Value statePtr = createPtrToPortState(rewriter, op.getLoc(),
559 adaptor.getInstance(), port);
560 rewriter.replaceOpWithNewOp<LLVM::LoadOp>(op, type, statePtr);
566struct SimStepOpLowering :
public ModelAwarePattern<arc::SimStepOp> {
567 using ModelAwarePattern::ModelAwarePattern;
570 matchAndRewrite(arc::SimStepOp op, OpAdaptor adaptor,
571 ConversionPatternRewriter &rewriter)
const final {
572 StringRef modelName = cast<SimModelInstanceType>(op.getInstance().getType())
576 StringAttr evalFunc =
578 rewriter.replaceOpWithNewOp<LLVM::CallOp>(op, mlir::TypeRange(), evalFunc,
579 adaptor.getInstance());
588 Value getOrCreate(OpBuilder &b, StringRef formatStr) {
589 auto it = cache.find(formatStr);
590 if (it != cache.end()) {
591 return LLVM::AddressOfOp::create(b, b.getUnknownLoc(), it->second);
594 Location loc = b.getUnknownLoc();
595 LLVM::GlobalOp global;
597 OpBuilder::InsertionGuard guard(b);
599 b.getInsertionBlock()->getParent()->getParentOfType<ModuleOp>();
600 b.setInsertionPointToStart(m.getBody());
602 SmallVector<char> strVec(formatStr.begin(), formatStr.end());
605 auto name = llvm::formatv(
"_arc_str_{0}", cache.size()).str();
606 auto globalType = LLVM::LLVMArrayType::get(b.getI8Type(), strVec.size());
607 global = LLVM::GlobalOp::create(b, loc, globalType,
true,
608 LLVM::Linkage::Internal,
609 name, b.getStringAttr(strVec),
613 cache[formatStr] = global;
614 return LLVM::AddressOfOp::create(b, loc, global);
618 llvm::StringMap<LLVM::GlobalOp> cache;
621FailureOr<LLVM::CallOp> emitPrintfCall(OpBuilder &builder, Location loc,
622 StringCache &cache, StringRef formatStr,
625 builder.getInsertionBlock()->getParent()->getParentOfType<ModuleOp>();
627 MLIRContext *ctx = builder.getContext();
628 auto printfFunc = LLVM::lookupOrCreateFn(builder, moduleOp,
"printf",
629 LLVM::LLVMPointerType::get(ctx),
630 LLVM::LLVMVoidType::get(ctx),
true);
631 if (failed(printfFunc))
634 Value formatStrPtr = cache.getOrCreate(builder, formatStr);
635 SmallVector<Value> argsVec(1, formatStrPtr);
636 argsVec.append(args.begin(), args.end());
637 return LLVM::CallOp::create(builder, loc, printfFunc.value(), argsVec);
643struct SimEmitValueOpLowering
645 SimEmitValueOpLowering(
const TypeConverter &typeConverter,
646 MLIRContext *
context, StringCache &formatStringCache)
648 formatStringCache(formatStringCache) {}
651 matchAndRewrite(arc::SimEmitValueOp op, OpAdaptor adaptor,
652 ConversionPatternRewriter &rewriter)
const final {
653 auto valueType = dyn_cast<IntegerType>(adaptor.getValue().getType());
657 Location loc = op.getLoc();
659 ModuleOp moduleOp = op->getParentOfType<ModuleOp>();
663 SmallVector<Value> printfVariadicArgs;
664 SmallString<16> printfFormatStr;
665 int remainingBits = valueType.getWidth();
666 Value value = adaptor.getValue();
670 constexpr llvm::StringRef intFormatter =
"llx";
671 auto intType = IntegerType::get(getContext(), 64);
672 Value shiftValue = LLVM::ConstantOp::create(
673 rewriter, loc, rewriter.getIntegerAttr(valueType, intType.getWidth()));
675 if (valueType.getWidth() < intType.getWidth()) {
676 int width = llvm::divideCeil(valueType.getWidth(), 4);
677 printfFormatStr = llvm::formatv(
"%0{0}{1}", width, intFormatter);
678 printfVariadicArgs.push_back(
679 LLVM::ZExtOp::create(rewriter, loc, intType, value));
684 int otherChunkWidth = intType.getWidth() / 4;
685 int firstChunkWidth =
686 llvm::divideCeil(valueType.getWidth() % intType.getWidth(), 4);
687 if (firstChunkWidth == 0) {
688 firstChunkWidth = otherChunkWidth;
691 std::string firstChunkFormat =
692 llvm::formatv(
"%0{0}{1}", firstChunkWidth, intFormatter);
693 std::string otherChunkFormat =
694 llvm::formatv(
"%0{0}{1}", otherChunkWidth, intFormatter);
696 for (
int i = 0; remainingBits > 0; ++i) {
699 printfVariadicArgs.push_back(
700 LLVM::TruncOp::create(rewriter, loc, intType, value));
703 printfFormatStr.append(i == 0 ? firstChunkFormat : otherChunkFormat);
706 LLVM::LShrOp::create(rewriter, loc, value, shiftValue).getResult();
707 remainingBits -= intType.getWidth();
711 std::reverse(printfVariadicArgs.begin(), printfVariadicArgs.end());
713 SmallString<16> formatStr = adaptor.getValueName();
714 formatStr.append(
" = ");
715 formatStr.append(printfFormatStr);
716 formatStr.append(
"\n");
718 auto callOp = emitPrintfCall(rewriter, op->getLoc(), formatStringCache,
719 formatStr, printfVariadicArgs);
722 rewriter.replaceOp(op, *callOp);
727 StringCache &formatStringCache;
736 SmallVector<FmtDescriptor> descriptors;
737 SmallVector<Value> args;
744static Value reg2mem(ConversionPatternRewriter &rewriter, Location loc,
747 int64_t origBitwidth = cast<IntegerType>(value.getType()).getWidth();
748 int64_t bitwidth = llvm::divideCeil(origBitwidth, 64) * 64;
749 int64_t numWords = bitwidth / 64;
752 LLVM::ConstantOp alloca_size =
753 LLVM::ConstantOp::create(rewriter, loc, rewriter.getI32Type(), numWords);
754 auto ptrType = LLVM::LLVMPointerType::get(rewriter.getContext());
755 auto allocaOp = LLVM::AllocaOp::create(rewriter, loc, ptrType,
756 rewriter.getI64Type(), alloca_size);
757 LLVM::LifetimeStartOp::create(rewriter, loc, allocaOp);
761 for (int64_t wordIdx = 0; wordIdx < numWords; ++wordIdx) {
762 Value cst = LLVM::ConstantOp::create(
763 rewriter, loc, rewriter.getIntegerType(origBitwidth), wordIdx * 64);
764 Value v = LLVM::LShrOp::create(rewriter, loc, value, cst);
765 if (origBitwidth > 64) {
766 v = LLVM::TruncOp::create(rewriter, loc, rewriter.getI64Type(), v);
767 }
else if (origBitwidth < 64) {
768 v = LLVM::ZExtOp::create(rewriter, loc, rewriter.getI64Type(), v);
770 Value gep = LLVM::GEPOp::create(rewriter, loc, ptrType,
771 rewriter.getI64Type(), allocaOp, {wordIdx});
772 LLVM::StoreOp::create(rewriter, loc, v, gep);
779static FailureOr<FormatInfo>
780foldFormatString(ConversionPatternRewriter &rewriter, Value fstringValue,
781 StringCache &cache) {
782 Operation *op = fstringValue.getDefiningOp();
783 return llvm::TypeSwitch<Operation *, FailureOr<FormatInfo>>(op)
784 .Case<sim::FormatCharOp>(
785 [&](sim::FormatCharOp op) -> FailureOr<FormatInfo> {
786 FmtDescriptor d = FmtDescriptor::createChar();
787 return FormatInfo{{d}, {op.getValue()}};
789 .Case<sim::FormatDecOp>([&](sim::FormatDecOp op)
790 -> FailureOr<FormatInfo> {
791 FmtDescriptor d = FmtDescriptor::createInt(
792 op.getValue().getType().getWidth(), 10, op.getIsLeftAligned(),
793 op.getSpecifierWidth().value_or(-1),
false, op.getIsSigned());
794 return FormatInfo{{d}, {reg2mem(rewriter, op.getLoc(), op.getValue())}};
796 .Case<sim::FormatHexOp>([&](sim::FormatHexOp op)
797 -> FailureOr<FormatInfo> {
798 FmtDescriptor d = FmtDescriptor::createInt(
799 op.getValue().getType().getWidth(), 16, op.getIsLeftAligned(),
800 op.getSpecifierWidth().value_or(-1), op.getIsHexUppercase(),
false);
801 return FormatInfo{{d}, {reg2mem(rewriter, op.getLoc(), op.getValue())}};
803 .Case<sim::FormatOctOp>([&](sim::FormatOctOp op)
804 -> FailureOr<FormatInfo> {
805 FmtDescriptor d = FmtDescriptor::createInt(
806 op.getValue().getType().getWidth(), 8, op.getIsLeftAligned(),
807 op.getSpecifierWidth().value_or(-1),
false,
false);
808 return FormatInfo{{d}, {reg2mem(rewriter, op.getLoc(), op.getValue())}};
810 .Case<sim::FormatLiteralOp>(
811 [&](sim::FormatLiteralOp op) -> FailureOr<FormatInfo> {
812 if (op.getLiteral().size() < 8 &&
813 op.getLiteral().find(
'\0') == StringRef::npos) {
816 FmtDescriptor::createSmallLiteral(op.getLiteral());
817 return FormatInfo{{d}, {}};
820 FmtDescriptor::createLiteral(op.getLiteral().size());
821 Value value = cache.getOrCreate(rewriter, op.getLiteral());
822 return FormatInfo{{d}, {value}};
824 .Case<sim::FormatStringConcatOp>(
825 [&](sim::FormatStringConcatOp op) -> FailureOr<FormatInfo> {
826 auto fmt = foldFormatString(rewriter, op.getInputs()[0], cache);
829 for (
auto input : op.getInputs().drop_front()) {
830 auto next = foldFormatString(rewriter, input, cache);
833 fmt->descriptors.append(next->descriptors);
834 fmt->args.append(next->args);
839 [](Operation *op) -> FailureOr<FormatInfo> {
return failure(); });
842FailureOr<LLVM::CallOp> emitFmtCall(OpBuilder &builder, Location loc,
843 StringCache &stringCache,
844 ArrayRef<FmtDescriptor> descriptors,
847 builder.getInsertionBlock()->getParent()->getParentOfType<ModuleOp>();
849 MLIRContext *ctx = builder.getContext();
850 auto func = LLVM::lookupOrCreateFn(
851 builder, moduleOp, runtime::APICallbacks::symNameFormat,
852 LLVM::LLVMPointerType::get(ctx), LLVM::LLVMVoidType::get(ctx),
true);
856 StringRef rawDescriptors(
reinterpret_cast<const char *
>(descriptors.data()),
857 descriptors.size() *
sizeof(FmtDescriptor));
858 Value fmtPtr = stringCache.getOrCreate(builder, rawDescriptors);
860 SmallVector<Value> argsVec(1, fmtPtr);
861 argsVec.append(args.begin(), args.end());
862 auto result = LLVM::CallOp::create(builder, loc, func.value(), argsVec);
864 for (Value arg : args) {
865 Operation *definingOp = arg.getDefiningOp();
866 if (
auto alloca = dyn_cast_if_present<LLVM::AllocaOp>(definingOp)) {
867 LLVM::LifetimeEndOp::create(builder, loc, arg);
874struct SimPrintFormattedProcOpLowering
876 SimPrintFormattedProcOpLowering(
const TypeConverter &typeConverter,
878 StringCache &stringCache)
880 stringCache(stringCache) {}
883 matchAndRewrite(sim::PrintFormattedProcOp op, OpAdaptor adaptor,
884 ConversionPatternRewriter &rewriter)
const override {
885 auto formatInfo = foldFormatString(rewriter, op.getInput(), stringCache);
886 if (failed(formatInfo))
887 return rewriter.notifyMatchFailure(op,
"unsupported format string");
890 formatInfo->descriptors.push_back(FmtDescriptor());
892 auto result = emitFmtCall(rewriter, op.getLoc(), stringCache,
893 formatInfo->descriptors, formatInfo->args);
896 rewriter.replaceOp(op, result.value());
901 StringCache &stringCache;
906static LogicalResult
convert(arc::ExecuteOp op, arc::ExecuteOp::Adaptor adaptor,
907 ConversionPatternRewriter &rewriter,
908 const TypeConverter &converter) {
910 if (failed(rewriter.convertRegionTypes(&op.getBody(), converter)))
916 auto *blockBefore = rewriter.getInsertionBlock();
918 rewriter.splitBlock(blockBefore, rewriter.getInsertionPoint());
921 rewriter.setInsertionPointToEnd(blockBefore);
922 mlir::cf::BranchOp::create(rewriter, op.getLoc(), &op.getBody().front(),
923 adaptor.getInputs());
927 for (
auto &block : op.getBody()) {
928 auto outputOp = dyn_cast<arc::OutputOp>(block.getTerminator());
931 rewriter.setInsertionPointToEnd(&block);
932 rewriter.replaceOpWithNewOp<mlir::cf::BranchOp>(outputOp, blockAfter,
933 outputOp.getOperands());
937 rewriter.inlineRegionBefore(op.getBody(), blockAfter);
941 SmallVector<Value> args;
942 args.reserve(op.getNumResults());
943 for (
auto result : op.getResults())
944 args.push_back(blockAfter->addArgument(result.getType(), result.getLoc()));
945 rewriter.replaceOp(op, args);
946 auto conversion = converter.convertBlockSignature(blockAfter);
949 rewriter.applySignatureConversion(blockAfter, *conversion, &converter);
957template <typename T, typename = std::enable_if_t<std::is_integral<T>::value>>
960 SmallVectorImpl<T> &data,
961 unsigned alignment =
alignof(T)) {
962 auto intType = builder.getIntegerType(8 *
sizeof(T));
963 Attribute denseAttr = mlir::DenseElementsAttr::get(
964 mlir::RankedTensorType::get({(int64_t)data.size()}, intType),
965 llvm::ArrayRef(data));
966 auto globalOp = LLVM::GlobalOp::create(
967 builder, loc, LLVM::LLVMArrayType::get(intType, data.size()),
968 true, LLVM::Linkage::Internal,
969 builder.getStringAttr(symName), denseAttr);
970 globalOp.setAlignmentAttr(builder.getI64IntegerAttr(alignment));
979 SmallVectorImpl<T> &array) {
981 static_assert(std::is_standard_layout<T>(),
982 "Runtime struct must have standard layout");
983 int64_t numBytes =
sizeof(T) * array.size();
984 Attribute denseAttr = mlir::DenseElementsAttr::get(
985 mlir::RankedTensorType::get({numBytes}, builder.getI8Type()),
986 llvm::ArrayRef(
reinterpret_cast<uint8_t *
>(array.data()), numBytes));
987 auto globalOp = LLVM::GlobalOp::create(
988 builder, loc, LLVM::LLVMArrayType::get(builder.getI8Type(), numBytes),
989 true, LLVM::Linkage::Internal,
990 builder.getStringAttr(symName), denseAttr,
alignof(T));
996 using OpConversionPattern::OpConversionPattern;
1003 ConversionPatternRewriter &rewriter)
const {
1004 if (!op.getTraceTaps().has_value() || op.getTraceTaps()->empty())
1007 SmallVector<char> namesArray;
1008 SmallVector<ArcTraceTap> tapArray;
1009 tapArray.reserve(op.getTraceTaps()->size());
1010 for (
auto attr : op.getTraceTapsAttr()) {
1011 auto tap = cast<TraceTapAttr>(attr);
1012 assert(!tap.getNames().empty() &&
1013 "Expected trace tap to have at least one name");
1014 for (
auto alias : tap.getNames()) {
1015 auto aliasStr = cast<StringAttr>(alias);
1016 namesArray.append(aliasStr.begin(), aliasStr.end());
1017 namesArray.push_back(
'\0');
1021 tapStruct.
nameOffset = namesArray.size() - 1;
1022 tapStruct.
typeBits = tap.getSigType().getValue().getIntOrFloatBitWidth();
1024 tapArray.emplace_back(tapStruct);
1026 auto ptrTy = LLVM::LLVMPointerType::get(getContext());
1028 rewriter, op.getLoc(),
"_arc_tap_names_" + op.getName(), namesArray);
1030 rewriter, op.getLoc(),
"_arc_trace_taps_" + op.getName(), tapArray);
1040 auto traceInfoStructType = LLVM::LLVMStructType::getLiteral(
1042 {rewriter.getI64Type(), ptrTy, ptrTy, rewriter.getI64Type()});
1044 "Unexpected size of ArcModelTraceInfo struct");
1046 auto globalSymName =
1047 rewriter.getStringAttr(
"_arc_trace_info_" + op.getName());
1048 auto traceInfoGlobalOp = LLVM::GlobalOp::create(
1049 rewriter, op.getLoc(), traceInfoStructType,
1050 false, LLVM::Linkage::Internal, globalSymName,
1052 OpBuilder::InsertionGuard g(rewriter);
1055 Region &initRegion = traceInfoGlobalOp.getInitializerRegion();
1056 Block *initBlock = rewriter.createBlock(&initRegion);
1057 rewriter.setInsertionPointToStart(initBlock);
1059 auto numTraceTapsCst = LLVM::ConstantOp::create(
1060 rewriter, op.getLoc(), rewriter.getI64IntegerAttr(tapArray.size()));
1061 auto traceTapArrayAddr =
1062 LLVM::AddressOfOp::create(rewriter, op.getLoc(), traceTapsArrayGlobal);
1063 auto tapNameArrayAddr =
1064 LLVM::AddressOfOp::create(rewriter, op.getLoc(), namesGlobal);
1065 auto bufferCapacityCst = LLVM::ConstantOp::create(
1066 rewriter, op.getLoc(),
1067 rewriter.getI64IntegerAttr(runtime::defaultTraceBufferCapacity));
1070 LLVM::PoisonOp::create(rewriter, op.getLoc(), traceInfoStructType);
1074 LLVM::InsertValueOp::create(rewriter, op.getLoc(), initStruct,
1075 numTraceTapsCst, ArrayRef<int64_t>{0});
1077 "Unexpected offset of field numTraceTaps");
1080 LLVM::InsertValueOp::create(rewriter, op.getLoc(), initStruct,
1081 traceTapArrayAddr, ArrayRef<int64_t>{1});
1083 "Unexpected offset of field traceTaps");
1086 LLVM::InsertValueOp::create(rewriter, op.getLoc(), initStruct,
1087 tapNameArrayAddr, ArrayRef<int64_t>{2});
1089 "Unexpected offset of field traceTapNames");
1092 LLVM::InsertValueOp::create(rewriter, op.getLoc(), initStruct,
1093 bufferCapacityCst, ArrayRef<int64_t>{3});
1095 "Unexpected offset of field traceBufferCapacity");
1096 LLVM::ReturnOp::create(rewriter, op.getLoc(), initStruct);
1098 return traceInfoGlobalOp;
1104 ConversionPatternRewriter &rewriter)
const final {
1106 auto ptrTy = LLVM::LLVMPointerType::get(getContext());
1107 auto modelInfoStructType = LLVM::LLVMStructType::getLiteral(
1109 {rewriter.getI64Type(), rewriter.getI64Type(), ptrTy, ptrTy});
1111 "Unexpected size of ArcRuntimeModelInfo struct");
1113 rewriter.setInsertionPoint(op);
1117 SmallVector<char, 16> modNameArray(op.getName().begin(),
1118 op.getName().end());
1119 modNameArray.push_back(
'\0');
1120 auto nameGlobalType =
1121 LLVM::LLVMArrayType::get(rewriter.getI8Type(), modNameArray.size());
1122 auto globalSymName =
1123 rewriter.getStringAttr(
"_arc_mod_name_" + op.getName());
1124 auto nameGlobal = LLVM::GlobalOp::create(
1125 rewriter, op.getLoc(), nameGlobalType,
true,
1126 LLVM::Linkage::Internal,
1127 globalSymName, rewriter.getStringAttr(modNameArray),
1134 auto modInfoGlobalOp =
1135 LLVM::GlobalOp::create(rewriter, op.getLoc(), modelInfoStructType,
1136 false, LLVM::Linkage::External,
1137 op.getSymName(), Attribute{});
1140 Region &initRegion = modInfoGlobalOp.getInitializerRegion();
1141 Block *initBlock = rewriter.createBlock(&initRegion);
1142 rewriter.setInsertionPointToStart(initBlock);
1143 auto apiVersionCst = LLVM::ConstantOp::create(
1145 auto numStateBytesCst = LLVM::ConstantOp::create(rewriter, op.getLoc(),
1146 op.getNumStateBytesAttr());
1148 LLVM::AddressOfOp::create(rewriter, op.getLoc(), nameGlobal);
1150 if (traceInfoGlobal)
1152 LLVM::AddressOfOp::create(rewriter, op.getLoc(), traceInfoGlobal);
1154 traceInfoPtr = LLVM::ZeroOp::create(rewriter, op.getLoc(), ptrTy);
1157 LLVM::PoisonOp::create(rewriter, op.getLoc(), modelInfoStructType);
1160 initStruct = LLVM::InsertValueOp::create(
1161 rewriter, op.getLoc(), initStruct, apiVersionCst, ArrayRef<int64_t>{0});
1163 "Unexpected offset of field apiVersion");
1166 LLVM::InsertValueOp::create(rewriter, op.getLoc(), initStruct,
1167 numStateBytesCst, ArrayRef<int64_t>{1});
1169 "Unexpected offset of field numStateBytes");
1171 initStruct = LLVM::InsertValueOp::create(rewriter, op.getLoc(), initStruct,
1172 nameAddr, ArrayRef<int64_t>{2});
1174 "Unexpected offset of field modelName");
1176 initStruct = LLVM::InsertValueOp::create(
1177 rewriter, op.getLoc(), initStruct, traceInfoPtr, ArrayRef<int64_t>{3});
1179 "Unexpected offset of field traceInfo");
1181 LLVM::ReturnOp::create(rewriter, op.getLoc(), initStruct);
1183 rewriter.replaceOp(op, modInfoGlobalOp);
1193struct LowerArcToLLVMPass
1194 :
public circt::impl::LowerArcToLLVMBase<LowerArcToLLVMPass> {
1195 void runOnOperation()
override;
1199void LowerArcToLLVMPass::runOnOperation() {
1203 DenseMap<Region *, hw::ConstantOp> zeros;
1204 getOperation().walk([&](Operation *op) {
1205 if (op->hasTrait<OpTrait::ConstantLike>())
1207 for (
auto result : op->getResults()) {
1208 auto type = dyn_cast<IntegerType>(result.getType());
1209 if (!type || type.getWidth() != 0)
1211 auto *region = op->getParentRegion();
1212 auto &zero = zeros[region];
1214 auto builder = OpBuilder::atBlockBegin(®ion->front());
1218 result.replaceAllUsesWith(zero);
1234 LLVMConversionTarget target(getContext());
1235 target.addLegalOp<mlir::ModuleOp>();
1236 target.addLegalOp<scf::YieldOp>();
1241 target.addLegalOp<sim::FormatLiteralOp, sim::FormatDecOp, sim::FormatHexOp,
1242 sim::FormatBinOp, sim::FormatOctOp, sim::FormatCharOp,
1243 sim::FormatStringConcatOp>();
1246 LLVMTypeConverter converter(&getContext());
1247 converter.addConversion([&](seq::ClockType type) {
1248 return IntegerType::get(type.getContext(), 1);
1250 converter.addConversion([&](StorageType type) {
1251 return LLVM::LLVMPointerType::get(type.getContext());
1253 converter.addConversion([&](MemoryType type) {
1254 return LLVM::LLVMPointerType::get(type.getContext());
1256 converter.addConversion([&](StateType type) {
1257 return LLVM::LLVMPointerType::get(type.getContext());
1259 converter.addConversion([&](SimModelInstanceType type) {
1260 return LLVM::LLVMPointerType::get(type.getContext());
1262 converter.addConversion([&](sim::FormatStringType type) {
1263 return LLVM::LLVMPointerType::get(type.getContext());
1270 populateSCFToControlFlowConversionPatterns(
patterns);
1271 populateFuncToLLVMConversionPatterns(converter,
patterns);
1272 cf::populateControlFlowToLLVMConversionPatterns(converter,
patterns);
1273 arith::populateArithToLLVMConversionPatterns(converter,
patterns);
1274 index::populateIndexToLLVMConversionPatterns(converter,
patterns);
1275 populateAnyFunctionOpInterfaceTypeConversionPattern(
patterns, converter);
1278 DenseMap<std::pair<Type, ArrayAttr>, LLVM::GlobalOp> constAggregateGlobalsMap;
1280 std::optional<HWToLLVMArraySpillCache> spillCacheOpt =
1283 OpBuilder spillBuilder(getOperation());
1284 spillCacheOpt->spillNonHWOps(spillBuilder, converter, getOperation());
1287 constAggregateGlobalsMap, spillCacheOpt);
1295 AllocMemoryOpLowering,
1296 AllocStateLikeOpLowering<arc::AllocStateOp>,
1297 AllocStateLikeOpLowering<arc::RootInputOp>,
1298 AllocStateLikeOpLowering<arc::RootOutputOp>,
1299 AllocStorageOpLowering,
1300 ClockGateOpLowering,
1302 MemoryReadOpLowering,
1303 MemoryWriteOpLowering,
1305 ReplaceOpWithInputPattern<seq::ToClockOp>,
1306 ReplaceOpWithInputPattern<seq::FromClockOp>,
1308 SeqConstClockLowering,
1309 StateReadOpLowering,
1310 StateWriteOpLowering,
1311 StorageGetOpLowering,
1313 >(converter, &getContext());
1317 StringCache stringCache;
1318 patterns.add<SimEmitValueOpLowering, SimPrintFormattedProcOpLowering>(
1319 converter, &getContext(), stringCache);
1321 auto &modelInfo = getAnalysis<ModelInfoAnalysis>();
1322 llvm::DenseMap<StringRef, ModelInfoMap> modelMap(modelInfo.infoMap.size());
1323 for (
auto &[_, modelInfo] : modelInfo.infoMap) {
1324 llvm::DenseMap<StringRef, StateInfo> states(modelInfo.states.size());
1325 for (StateInfo &stateInfo : modelInfo.states)
1326 states.insert({stateInfo.name, stateInfo});
1329 ModelInfoMap{modelInfo.numStateBytes, std::move(states),
1330 modelInfo.initialFnSym, modelInfo.finalFnSym}});
1333 patterns.add<SimInstantiateOpLowering, SimSetInputOpLowering,
1334 SimGetPortOpLowering, SimStepOpLowering>(
1335 converter, &getContext(), modelMap);
1338 ConversionConfig config;
1339 config.allowPatternRollback =
false;
1340 if (failed(applyFullConversion(getOperation(), target, std::move(
patterns),
1342 signalPassFailure();
1346 return std::make_unique<LowerArcToLLVMPass>();
assert(baseType &&"element must be base type")
static std::unique_ptr< Context > context
static LLVM::GlobalOp buildGlobalConstantIntArray(OpBuilder &builder, Location loc, Twine symName, SmallVectorImpl< T > &data, unsigned alignment=alignof(T))
static LLVM::GlobalOp buildGlobalConstantRuntimeStructArray(OpBuilder &builder, Location loc, Twine symName, SmallVectorImpl< T > &array)
static llvm::Twine evalSymbolFromModelName(StringRef modelName)
static LogicalResult convert(arc::ExecuteOp op, arc::ExecuteOp::Adaptor adaptor, ConversionPatternRewriter &rewriter, const TypeConverter &converter)
Extension of RewritePatternSet that allows adding matchAndRewrite functions with op adaptors and Conv...
A namespace that is used to store existing names and generate new names in some scope within the IR.
void add(mlir::ModuleOp module)
void addDefinitions(mlir::Operation *top)
Populate the symbol cache with all symbol-defining operations within the 'top' operation.
Default symbol cache implementation; stores associations between names (StringAttr's) to mlir::Operat...
#define ARC_RUNTIME_API_VERSION
Version of the combined public and internal API.
The InstanceGraph op interface, see InstanceGraphInterface.td for more details.
void populateCombToArithConversionPatterns(TypeConverter &converter, RewritePatternSet &patterns)
void populateCombToLLVMConversionPatterns(mlir::LLVMTypeConverter &converter, RewritePatternSet &patterns)
Get the Comb to LLVM conversion patterns.
void populateHWToLLVMTypeConversions(mlir::LLVMTypeConverter &converter)
Get the HW to LLVM type conversions.
void populateHWToLLVMConversionPatterns(mlir::LLVMTypeConverter &converter, RewritePatternSet &patterns, Namespace &globals, DenseMap< std::pair< Type, ArrayAttr >, mlir::LLVM::GlobalOp > &constAggregateGlobalsMap, std::optional< HWToLLVMArraySpillCache > &spillCacheOpt)
Get the HW to LLVM conversion patterns.
std::unique_ptr< OperationPass< ModuleOp > > createLowerArcToLLVMPass()
Static information for a compiled hardware model, generated by the MLIR lowering.
uint32_t typeBits
Bit width of the traced signal.
uint64_t stateOffset
Byte offset of the traced value within the model state.
uint64_t nameOffset
Byte offset to the null terminator of this signal's last alias in the names array.
uint32_t reserved
Padding and reserved for future use.
LLVM::GlobalOp buildTraceInfoStruct(arc::RuntimeModelOp &op, ConversionPatternRewriter &rewriter) const
static constexpr uint64_t runtimeApiVersion
LogicalResult matchAndRewrite(arc::RuntimeModelOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const final
Helper class mapping array values (HW or LLVM Dialect) to pointers to buffers containing the array va...