CIRCT 23.0.0git
Loading...
Searching...
No Matches
LongestPathAnalysis.cpp
Go to the documentation of this file.
1//===----------------------------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This analysis computes the longest combinational paths through a circuit
10// represented in the AIG (And-Inverter Graph) dialect. The key aspects are:
11//
12// - Each AIG and-inverter operation is considered to have a unit delay of 1
13// - The analysis traverses the circuit graph from inputs/registers to outputs
14// - It handles hierarchical designs by analyzing modules bottom-up
15// - Results include full path information with delays and debug points
16// - Caching is used extensively to improve performance on large designs
17//
18// The core algorithm works as follows:
19// 1. Build an instance graph of the full design hierarchy
20// 2. Analyze modules in post-order (children before parents)
21// 3. For each module:
22// - Trace paths from inputs and registers
23// - Propagate delays through logic and across module boundaries
24// - Record maximum delay and path info for each node
25// 4. Combine results across hierarchy to get full chip critical paths
26//
27// The analysis handles both closed paths (register-to-register) and open
28// paths (input-to-register, register-to-output) across the full hierarchy.
29//===----------------------------------------------------------------------===//
30
40#include "circt/Support/LLVM.h"
41#include "mlir/IR/BuiltinAttributes.h"
42#include "mlir/IR/BuiltinOps.h"
43#include "mlir/IR/Diagnostics.h"
44#include "mlir/IR/Operation.h"
45#include "mlir/IR/Threading.h"
46#include "mlir/IR/Value.h"
47#include "mlir/IR/Visitors.h"
48#include "mlir/Pass/AnalysisManager.h"
49#include "mlir/Pass/PassManager.h"
50#include "mlir/Pass/PassRegistry.h"
51#include "mlir/Support/FileUtilities.h"
52#include "mlir/Support/LLVM.h"
53#include "llvm/ADT//MapVector.h"
54#include "llvm/ADT/ArrayRef.h"
55#include "llvm/ADT/DenseMapInfoVariant.h"
56#include "llvm/ADT/EquivalenceClasses.h"
57#include "llvm/ADT/ImmutableList.h"
58#include "llvm/ADT/MapVector.h"
59#include "llvm/ADT/PostOrderIterator.h"
60#include "llvm/ADT/STLExtras.h"
61#include "llvm/ADT/SmallVector.h"
62#include "llvm/ADT/StringRef.h"
63#include "llvm/Support/Debug.h"
64#include "llvm/Support/ErrorHandling.h"
65#include "llvm/Support/JSON.h"
66#include "llvm/Support/LogicalResult.h"
67#include "llvm/Support/MathExtras.h"
68#include "llvm/Support/Mutex.h"
69#include "llvm/Support/raw_ostream.h"
70#include <condition_variable>
71#include <cstddef>
72#include <cstdint>
73#include <memory>
74#include <mutex>
75
76#define DEBUG_TYPE "aig-longest-path-analysis"
77using namespace circt;
78using namespace synth;
79
80static size_t getBitWidth(Value value) {
81 if (auto vecType = dyn_cast<seq::ClockType>(value.getType()))
82 return 1;
83 if (auto memory = dyn_cast<seq::FirMemType>(value.getType()))
84 return memory.getWidth();
85 return hw::getBitWidth(value.getType());
86}
87
88template <typename T, typename Key>
89static void
90deduplicatePathsImpl(SmallVectorImpl<T> &results, size_t startIndex,
91 llvm::function_ref<Key(const T &)> keyFn,
92 llvm::function_ref<int64_t(const T &)> delayFn) {
93 // Take only maximum for each path destination.
94 DenseMap<Key, size_t> keyToIndex;
95 for (size_t i = startIndex; i < results.size(); ++i) {
96 auto &path = results[i];
97 auto key = keyFn(path);
98 auto delay = delayFn(path);
99 auto it = keyToIndex.find(key);
100 if (it == keyToIndex.end()) {
101 // Insert a new entry.
102 size_t newIndex = keyToIndex.size() + startIndex;
103 keyToIndex[key] = newIndex;
104 results[newIndex] = std::move(results[i]);
105 continue;
106 }
107 if (delay > delayFn(results[it->second]))
108 results[it->second] = std::move(results[i]);
109 }
110
111 results.resize(keyToIndex.size() + startIndex);
112}
113
114// Filter and optimize OpenPaths based on analysis configuration.
115static void filterPaths(SmallVectorImpl<OpenPath> &results,
116 bool keepOnlyMaxDelay, bool isLocalScope) {
117 if (results.empty())
118 return;
119
120 // Fast path for local scope with max-delay filtering:
121 // Simply find and keep only the single longest delay path
122 if (keepOnlyMaxDelay && isLocalScope) {
123 OpenPath maxDelay;
124 maxDelay.delay = -1; // Initialize to invalid delay
125
126 // Find the path with maximum delay
127 for (auto &path : results) {
128 if (path.delay > maxDelay.delay)
129 maxDelay = path;
130 }
131
132 // Replace all paths with just the maximum delay path
133 results.clear();
134 if (maxDelay.delay >= 0) // Only add if we found a valid path
135 results.push_back(maxDelay);
136 return;
137 }
138
139 // Remove paths with identical start point, keeping only the longest delay
140 // path for each unique points.
141 deduplicatePathsImpl<OpenPath, Object>(
142 results, 0, [](const auto &path) { return path.startPoint; },
143 [](const auto &path) { return path.delay; });
144
145 // Global scope max-delay filtering:
146 // Keep all module input ports (BlockArguments) but only the single
147 // longest internal path to preserve boundary information
148 if (keepOnlyMaxDelay) {
149 assert(!isLocalScope);
150 size_t writeIndex = 0;
151 OpenPath maxDelay;
152 maxDelay.delay = -1; // Initialize to invalid delay
153
154 for (size_t i = 0; i < results.size(); ++i) {
155 // Preserve all module input port paths (BlockArguments) since the input
156 // port might be the critical path.
157 if (isa<BlockArgument>(results[i].getStartPoint().value)) {
158 // Keep all module input port paths, as inputs themselves may be
159 // critical
160 results[writeIndex++] = results[i];
161 } else {
162 // For internal paths, track only the maximum delay path
163 if (results[i].delay > maxDelay.delay)
164 maxDelay = results[i];
165 }
166 }
167
168 // Resize to remove processed internal paths, then add the max delay path
169 results.resize(writeIndex);
170 if (maxDelay.delay >= 0) // Only add if we found a valid internal path
171 results.push_back(maxDelay);
172 }
173}
174
175static void filterPaths(SmallVectorImpl<DataflowPath> &results,
176 size_t startIndex = 0) {
178 std::pair<DataflowPath::EndPointType, Object>>(
179 results, startIndex,
180 [](const DataflowPath &path) {
181 return std::pair(path.getEndPoint(), path.getStartPoint());
182 },
183 [](const DataflowPath &path) { return path.getDelay(); });
184}
185
186static llvm::ImmutableList<DebugPoint>
187mapList(llvm::ImmutableListFactory<DebugPoint> *debugPointFactory,
188 llvm::ImmutableList<DebugPoint> list,
189 llvm::function_ref<DebugPoint(DebugPoint)> fn) {
190 if (list.isEmpty())
191 return list;
192 auto &head = list.getHead();
193 return debugPointFactory->add(fn(head),
194 mapList(debugPointFactory, list.getTail(), fn));
195}
196
197static llvm::ImmutableList<DebugPoint>
198concatList(llvm::ImmutableListFactory<DebugPoint> *debugPointFactory,
199 llvm::ImmutableList<DebugPoint> lhs,
200 llvm::ImmutableList<DebugPoint> rhs) {
201 if (lhs.isEmpty())
202 return rhs;
203 return debugPointFactory->add(
204 lhs.getHead(), concatList(debugPointFactory, lhs.getTail(), rhs));
205}
206
207static StringAttr getNameImpl(Value value) {
208 if (auto arg = dyn_cast<BlockArgument>(value)) {
209 auto op = dyn_cast<hw::HWModuleOp>(arg.getParentBlock()->getParentOp());
210 if (!op) {
211 // TODO: Handle other operations.
212 return StringAttr::get(value.getContext(), "<unknown-argument>");
213 }
214 return op.getArgName(arg.getArgNumber());
215 }
216 return TypeSwitch<Operation *, StringAttr>(value.getDefiningOp())
217 .Case<seq::CompRegOp, seq::FirRegOp>(
218 [](auto op) { return op.getNameAttr(); })
219 .Case<hw::InstanceOp>([&](hw::InstanceOp op) {
220 SmallString<16> str;
221 str += op.getInstanceName();
222 str += ".";
223 str += cast<StringAttr>(
224 op.getResultNamesAttr()[cast<OpResult>(value).getResultNumber()]);
225 return StringAttr::get(op.getContext(), str);
226 })
227 .Case<seq::FirMemReadOp>([&](seq::FirMemReadOp op) {
228 llvm::SmallString<16> str;
229 str += op.getMemory().getDefiningOp<seq::FirMemOp>().getNameAttr();
230 str += ".read_port";
231 return StringAttr::get(value.getContext(), str);
232 })
233 .Case<seq::FirMemReadWriteOp>([&](seq::FirMemReadWriteOp op) {
234 llvm::SmallString<16> str;
235 str += op.getMemory().getDefiningOp<seq::FirMemOp>().getNameAttr();
236 str += ".rw_port";
237 return StringAttr::get(value.getContext(), str);
238 })
239 .Case<seq::FirMemOp>([&](seq::FirMemOp op) {
240 llvm::SmallString<16> str;
241 str += op.getMemory().getDefiningOp<seq::FirMemOp>().getNameAttr();
242 str += ".write_port";
243 return StringAttr::get(value.getContext(), str);
244 })
245 .Default([&](auto op) {
246 if (auto name = op->template getAttrOfType<StringAttr>("sv.namehint"))
247 return name;
248 llvm::errs() << "Unknown op: " << *op << "\n";
249 return StringAttr::get(value.getContext(), "");
250 });
251}
252
253static void printObjectImpl(llvm::raw_ostream &os, const Object &object,
254 int64_t delay = -1,
255 llvm::ImmutableList<DebugPoint> history = {},
256 StringRef comment = "") {
257 std::string pathString;
258 llvm::raw_string_ostream osPath(pathString);
259 object.instancePath.print(osPath);
260 os << "Object(" << pathString << "." << object.getName().getValue() << "["
261 << object.bitPos << "]";
262 if (delay != -1)
263 os << ", delay=" << delay;
264 if (!history.isEmpty()) {
265 os << ", history=[";
266 llvm::interleaveComma(history, os, [&](DebugPoint p) { p.print(os); });
267 os << "]";
268 }
269 if (!comment.empty())
270 os << ", comment=\"" << comment << "\"";
271 os << ")";
272}
273
274template <typename T>
275static int64_t getMaxDelayInPaths(ArrayRef<T> paths) {
276 int64_t maxDelay = 0;
277 for (auto &path : paths)
278 maxDelay = std::max(maxDelay, path.getDelay());
279 return maxDelay;
280}
281
282using namespace circt;
283using namespace aig;
284
285//===----------------------------------------------------------------------===//
286// Printing
287//===----------------------------------------------------------------------===//
288
289void OpenPath::print(llvm::raw_ostream &os) const {
290 printObjectImpl(os, startPoint, delay, history);
291}
292
293void DebugPoint::print(llvm::raw_ostream &os) const {
294 printObjectImpl(os, object, delay, {}, comment);
295}
296
297void Object::print(llvm::raw_ostream &os) const { printObjectImpl(os, *this); }
298
299StringAttr Object::getName() const { return getNameImpl(value); }
300
301void DataflowPath::printEndPoint(llvm::raw_ostream &os) {
302 if (auto *object = std::get_if<Object>(&endPoint)) {
303 object->print(os);
304 } else {
305 auto &[module, resultNumber, bitPos] =
306 *std::get_if<DataflowPath::OutputPort>(&endPoint);
307 auto outputPortName = root.getOutputName(resultNumber);
308 os << "Object($root." << outputPortName << "[" << bitPos << "])";
309 }
310}
311
312void DataflowPath::print(llvm::raw_ostream &os) {
313 os << "root=" << root.getModuleName() << ", ";
314 os << "endPoint=";
315 printEndPoint(os);
316 os << ", ";
317 os << "startPoint=";
318 path.print(os);
319}
320
321//===----------------------------------------------------------------------===//
322// OpenPath
323//===----------------------------------------------------------------------===//
324
327 instancePath = cache.concatPath(path, instancePath);
328 return *this;
329}
330
333 llvm::ImmutableListFactory<DebugPoint> *debugPointFactory,
335 startPoint.prependPaths(cache, path);
336 if (debugPointFactory)
337 this->history = mapList(debugPointFactory, this->history,
338 [&](DebugPoint p) -> DebugPoint {
339 p.object.prependPaths(cache, path);
340 return p;
341 });
342 return *this;
343}
344
345//===----------------------------------------------------------------------===//
346// DataflowPath
347//===----------------------------------------------------------------------===//
348
351 llvm::ImmutableListFactory<DebugPoint> *debugPointFactory,
353 this->path.prependPaths(cache, debugPointFactory, path);
354 if (!path.empty()) {
355 auto root = path.top()->getParentOfType<hw::HWModuleOp>();
356 assert(root && "root is not a hw::HWModuleOp");
357 this->root = root;
358 }
359
360 // If the end point is an object, prepend the path.
361 if (auto *object = std::get_if<Object>(&endPoint))
362 object->prependPaths(cache, path);
363
364 return *this;
365}
366
368 // If the end point is an object, return the location of the object.
369 if (auto *object = std::get_if<Object>(&endPoint))
370 return object->value.getLoc();
371
372 // Return output port location.
373 auto &[module, resultNumber, bitPos] =
374 *std::get_if<DataflowPath::OutputPort>(&endPoint);
375 return module.getOutputLoc(resultNumber);
376}
377
378//===----------------------------------------------------------------------===//
379// JSON serialization
380//===----------------------------------------------------------------------===//
381
382static llvm::json::Value toJSON(const circt::igraph::InstancePath &path) {
383 llvm::json::Array result;
384 for (auto op : path) {
385 llvm::json::Object obj;
386 obj["instance_name"] = op.getInstanceName();
387 obj["module_name"] = op.getReferencedModuleNames()[0];
388 result.push_back(std::move(obj));
389 }
390 return result;
391}
392
393static llvm::json::Value toJSON(const circt::synth::Object &object) {
394 return llvm::json::Object{
395 {"instance_path", toJSON(object.instancePath)},
396 {"name", object.getName().getValue()},
397 {"bit_pos", object.bitPos},
398 };
399}
400
401static llvm::json::Value toJSON(const DataflowPath::EndPointType &path,
402 hw::HWModuleOp root) {
403 using namespace llvm::json;
404 if (auto *object = std::get_if<circt::synth::Object>(&path))
405 return toJSON(*object);
406
407 auto &[module, resultNumber, bitPos] =
408 *std::get_if<DataflowPath::OutputPort>(&path);
409 return llvm::json::Object{
410 {"instance_path", {}}, // Instance path is empty for output ports.
411 {"name", root.getOutputName(resultNumber)},
412 {"bit_pos", bitPos},
413 };
414}
415
416static llvm::json::Value toJSON(const DebugPoint &point) {
417 return llvm::json::Object{
418 {"object", toJSON(point.object)},
419 {"delay", point.delay},
420 {"comment", point.comment},
421 };
422}
423
424static llvm::json::Value toJSON(const OpenPath &path) {
425 llvm::json::Array history;
426 for (auto &point : path.history)
427 history.push_back(toJSON(point));
428 return llvm::json::Object{{"start_point", toJSON(path.startPoint)},
429 {"delay", path.delay},
430 {"history", std::move(history)}};
431}
432
433llvm::json::Value circt::synth::toJSON(const DataflowPath &path) {
434 return llvm::json::Object{
435 {"end_point", ::toJSON(path.getEndPoint(), path.getRoot())},
436 {"path", ::toJSON(path.getPath())},
437 {"root", path.getRoot().getModuleName()},
438 };
439}
440
441class LocalVisitor;
442
443//===----------------------------------------------------------------------===//
444// Context
445//===----------------------------------------------------------------------===//
446/// This class provides a thread-safe interface to access the analysis results.
447
448class Context {
449public:
451 const LongestPathAnalysisOptions &option)
452 : instanceGraph(instanceGraph), option(option) {}
453 void notifyStart(StringAttr name) {
454 std::lock_guard<llvm::sys::SmartMutex<true>> lock(mutex);
455 running.insert(name);
456 llvm::dbgs() << "[Timing] " << name << " started. running=[";
457 for (auto &name : running)
458 llvm::dbgs() << name << " ";
459 llvm::dbgs() << "]\n";
460 }
461
462 void notifyEnd(StringAttr name) {
463 std::lock_guard<llvm::sys::SmartMutex<true>> lock(mutex);
464 running.remove(name);
465
466 llvm::dbgs() << "[Timing] " << name << " finished. running=[";
467 for (auto &name : running)
468 llvm::dbgs() << name << " ";
469 llvm::dbgs() << "]\n";
470 }
471
472 // Lookup a local visitor for `name`.
473 const LocalVisitor *getLocalVisitor(StringAttr name) const;
474
475 // Lookup a mutable local visitor for `name`.
476 LocalVisitor *getLocalVisitorMutable(StringAttr name) const;
477
478 // A map from the module name to the local visitor.
480
481 // This is non-null only if `module` is a ModuleOp.
482 circt::igraph::InstanceGraph *instanceGraph = nullptr;
483
484 bool doTraceDebugPoints() const { return option.collectDebugInfo; }
485 bool doLazyComputation() const { return option.lazyComputation; }
486 bool doKeepOnlyMaxDelayPaths() const { return option.keepOnlyMaxDelayPaths; }
487 bool isLocalScope() const { return instanceGraph == nullptr; }
488 StringAttr getTopModuleName() const { return option.topModuleName; }
489
490private:
491 bool isRunningParallel() const { return !doLazyComputation(); }
492 llvm::sys::SmartMutex<true> mutex;
493 llvm::SetVector<StringAttr> running;
494 LongestPathAnalysisOptions option;
495};
496
497//===----------------------------------------------------------------------===//
498// OperationAnalyzer
499//===----------------------------------------------------------------------===//
500
501// OperationAnalyzer handles timing analysis for individual operations that
502// haven't been converted to AIG yet. It creates isolated modules for each
503// unique operation type/signature combination, runs the conversion pipeline
504// (HW -> Comb -> AIG), and analyzes the resulting AIG representation.
505//
506// This is used as a fallback when the main analysis encounters operations
507// that don't have direct AIG equivalents. The analyzer:
508// 1. Creates a wrapper HW module for the operation
509// 2. Runs the standard conversion pipeline to lower it to AIG
510// 3. Analyzes the resulting AIG to compute timing paths
511// 4. Caches results based on operation name and function signature
513public:
514 // Constructor creates a new analyzer with an empty module for building
515 // temporary operation wrappers.
516 // The analyzer needs its own Context separate from the main analysis
517 // to avoid using onlyMaxDelay mode, as we require precise input
518 // dependency information for accurate delay propagation
519 OperationAnalyzer(Location loc)
520 : ctx(nullptr, LongestPathAnalysisOptions(false, true, false)), loc(loc) {
521 mlir::OpBuilder builder(loc->getContext());
522 moduleOp = mlir::ModuleOp::create(builder, loc);
523 emptyName = StringAttr::get(loc->getContext(), "");
524 }
525
526 // Initialize the pass pipeline used to lower operations to AIG.
527 // This sets up the standard conversion sequence: HW -> Comb -> AIG -> cleanup
528 LogicalResult initializePipeline();
529
530 // Analyze timing paths for a specific operation result and bit position.
531 // Creates a wrapper module if needed, runs conversion, and returns timing
532 // information as input dependencies.
533 // Results are tuples of (input operand index, bit position in operand, delay)
534 LogicalResult analyzeOperation(
535 OpResult value, size_t bitPos,
536 SmallVectorImpl<std::tuple<size_t, size_t, int64_t>> &results);
537
538private:
539 // Get or create a LocalVisitor for analyzing the given operation.
540 // Uses caching based on operation name and function signature to avoid
541 // recomputing analysis for identical operations.
542 FailureOr<LocalVisitor *> getOrComputeLocalVisitor(Operation *op);
543
544 // Extract the function signature (input/output types) from an operation.
545 // This is used as part of the cache key to distinguish operations with
546 // different type signatures.
547 static mlir::FunctionType getFunctionTypeForOp(Operation *op);
548
549 // Cache mapping (operation_name, function_type) -> analyzed LocalVisitor
550 // This avoids recomputing analysis for operations with identical signatures
551 llvm::DenseMap<std::pair<mlir::OperationName, mlir::FunctionType>,
552 std::unique_ptr<LocalVisitor>>
554
555 // Standard conversion pipeline: HW -> Comb -> AIG -> cleanup passes
556 // This pipeline is applied to wrapper modules to prepare them for analysis
557 constexpr static StringRef pipelineStr =
558 "hw.module(hw-aggregate-to-comb,convert-comb-to-synth,cse,canonicalize)";
559 std::unique_ptr<mlir::PassManager> passManager;
560
561 // Temporary module used to hold wrapper modules during analysis
562 // Each operation gets its own wrapper module created inside this parent
564
565 Context ctx; // Analysis context and configuration
566 Location loc; // Source location for error reporting
567 StringAttr emptyName;
568};
569
570mlir::FunctionType OperationAnalyzer::getFunctionTypeForOp(Operation *op) {
571 return mlir::FunctionType::get(op->getContext(), op->getOperandTypes(),
572 op->getResultTypes());
573}
574
575// -----------------------------------------------------------------------------
576// LocalVisitor
577// -----------------------------------------------------------------------------
578
580public:
581 LocalVisitor(hw::HWModuleOp module, Context *ctx);
582 LogicalResult initializeAndRun();
583 // Wait until the thread is done.
584 void waitUntilDone() const;
585
586 // Get the longest paths for the given value and bit position.
587 // If the result is not cached, compute it and cache it.
588 FailureOr<ArrayRef<OpenPath>> getOrComputePaths(Value value, size_t bitPos);
589
590 // Get the longest paths for the given value and bit position. This returns
591 // an empty array if not pre-computed.
592 ArrayRef<OpenPath> getCachedPaths(Value value, size_t bitPos) const;
593
594 // A map from the object to the maximum distance and history.
597 std::pair<int64_t, llvm::ImmutableList<DebugPoint>>>;
598
599 void getInternalPaths(SmallVectorImpl<DataflowPath> &results) const;
600 void setTopLevel() { this->topLevel = true; }
601 bool isTopLevel() const { return topLevel; }
602 hw::HWModuleOp getHWModuleOp() const { return module; }
603
604 const auto &getFromInputPortToEndPoint() const {
605 return fromInputPortToEndPoint;
606 }
607 const auto &getFromOutputPortToStartPoint() const {
608 return fromOutputPortToStartPoint;
609 }
610 const auto &getEndPointResults() const { return endPointResults; }
611
613 return instancePathCache.get();
614 }
615
616 llvm::ImmutableListFactory<DebugPoint> *getDebugPointFactory() const {
617 return debugPointFactory.get();
618 }
619
620private:
621 void putUnclosedResult(const Object &object, int64_t delay,
622 llvm::ImmutableList<DebugPoint> history,
623 ObjectToMaxDistance &objectToMaxDistance);
624
625 // A map from the input port to the farthest end point.
628
629 // A map from the output port to the farthest start point.
632
633 LogicalResult initializeAndRun(hw::InstanceOp instance);
634 LogicalResult initializeAndRun(hw::OutputOp output);
635
636 // --------------------------------------------------------------------------
637 // Visitors
638 // --------------------------------------------------------------------------
639 LogicalResult visitValue(Value value, size_t bitPos,
640 SmallVectorImpl<OpenPath> &results);
641 // Module boundary.
642 LogicalResult visit(mlir::BlockArgument argument, size_t bitPos,
643 SmallVectorImpl<OpenPath> &results);
644 LogicalResult visit(hw::InstanceOp op, size_t bitPos, size_t resultNum,
645 SmallVectorImpl<OpenPath> &results);
646
647 // Data-movement ops.
648 LogicalResult visit(hw::WireOp op, size_t bitPos,
649 SmallVectorImpl<OpenPath> &results);
650 LogicalResult visit(comb::ConcatOp op, size_t bitPos,
651 SmallVectorImpl<OpenPath> &results);
652 LogicalResult visit(comb::ExtractOp op, size_t bitPos,
653 SmallVectorImpl<OpenPath> &results);
654 LogicalResult visit(comb::ReplicateOp op, size_t bitPos,
655 SmallVectorImpl<OpenPath> &results);
656 // Track equivalence classes for data movement ops
657 // Treat output as equivalent to input for pure data movement operations
658 llvm::EquivalenceClasses<std::pair<Value, size_t>> ec;
659 DenseMap<std::pair<Value, size_t>, std::pair<Value, size_t>> ecMap;
660 std::pair<Value, size_t> findLeader(Value value, size_t bitpos) const {
661 return ec.getLeaderValue({value, bitpos});
662 }
663 LogicalResult markEquivalent(Value from, size_t fromBitPos, Value to,
664 size_t toBitPos,
665 SmallVectorImpl<OpenPath> &results);
666
667 // Bit-logical ops.
668 LogicalResult visit(BooleanLogicOpInterface op, size_t bitPos,
669 SmallVectorImpl<OpenPath> &results);
670 LogicalResult visit(comb::AndOp op, size_t bitPos,
671 SmallVectorImpl<OpenPath> &results);
672 LogicalResult visit(comb::XorOp op, size_t bitPos,
673 SmallVectorImpl<OpenPath> &results);
674 LogicalResult visit(comb::OrOp op, size_t bitPos,
675 SmallVectorImpl<OpenPath> &results);
676 LogicalResult visit(comb::MuxOp op, size_t bitPos,
677 SmallVectorImpl<OpenPath> &results);
678 LogicalResult addLogicOp(Operation *op, size_t bitPos,
679 SmallVectorImpl<OpenPath> &results);
680 LogicalResult visit(comb::TruthTableOp op, size_t bitPos,
681 SmallVectorImpl<OpenPath> &results);
682
683 // Constants.
684 LogicalResult visit(hw::ConstantOp op, size_t bitPos,
685 SmallVectorImpl<OpenPath> &results) {
686 return success();
687 }
688
689 // Registers are start point.
690 LogicalResult visit(seq::FirRegOp op, size_t bitPos,
691 SmallVectorImpl<OpenPath> &results) {
692 return markStartPoint(op, bitPos, results);
693 }
694
695 LogicalResult visit(seq::CompRegOp op, size_t bitPos,
696 SmallVectorImpl<OpenPath> &results) {
697 return markStartPoint(op, bitPos, results);
698 }
699
700 LogicalResult visit(seq::FirMemReadOp op, size_t bitPos,
701 SmallVectorImpl<OpenPath> &results) {
702 return markStartPoint(op, bitPos, results);
703 }
704
705 LogicalResult visit(seq::FirMemReadWriteOp op, size_t bitPos,
706 SmallVectorImpl<OpenPath> &results) {
707 return markStartPoint(op, bitPos, results);
708 }
709
710 LogicalResult visitDefault(OpResult result, size_t bitPos,
711 SmallVectorImpl<OpenPath> &results);
712
713 // Helper functions.
714 LogicalResult addEdge(Value to, size_t toBitPos, int64_t delay,
715 SmallVectorImpl<OpenPath> &results);
716 LogicalResult markStartPoint(Value value, size_t bitPos,
717 SmallVectorImpl<OpenPath> &results);
718 LogicalResult markRegEndPoint(Value endPoint, Value start, Value reset = {},
719 Value resetValue = {}, Value enable = {});
720
721 // The module we are visiting.
722 hw::HWModuleOp module;
724
725 // Thread-local data structures.
726 std::unique_ptr<circt::igraph::InstancePathCache> instancePathCache;
727 // TODO: Make debug points optional.
728 std::unique_ptr<llvm::ImmutableListFactory<DebugPoint>> debugPointFactory;
729
730 // A map from the value point to the longest paths.
731 DenseMap<std::pair<Value, size_t>, std::unique_ptr<SmallVector<OpenPath>>>
733
734 // A map from the object to the longest paths.
735 DenseMap<Object, SmallVector<OpenPath>> endPointResults;
736
737 // The operation analyzer for comb/hw operations remaining in the circuit.
738 std::unique_ptr<OperationAnalyzer> operationAnalyzer;
739
740 // This is set to true when the thread is done.
741 std::atomic_bool done;
742 mutable std::condition_variable cv;
743 mutable std::mutex mutex;
744
745 // A flag to indicate the module is top-level.
746 bool topLevel = false;
747};
748
750 : module(module), ctx(ctx) {
752 std::make_unique<llvm::ImmutableListFactory<DebugPoint>>();
753 instancePathCache = ctx->instanceGraph
754 ? std::make_unique<circt::igraph::InstancePathCache>(
755 *ctx->instanceGraph)
756 : nullptr;
757 operationAnalyzer = std::make_unique<OperationAnalyzer>(module->getLoc());
758
759 done = false;
760}
761
762ArrayRef<OpenPath> LocalVisitor::getCachedPaths(Value value,
763 size_t bitPos) const {
764 std::pair<Value, size_t> valueAndBitPos(value, bitPos);
765 auto leader = ec.findLeader(valueAndBitPos);
766 if (leader != ec.member_end()) {
767 if (*leader != valueAndBitPos) {
768 // If this is not the leader, then use the leader.
769 return getCachedPaths(leader->first, leader->second);
770 }
771 }
772
773 auto it = cachedResults.find(valueAndBitPos);
774 // If not found, then consider it to be a constant.
775 if (it == cachedResults.end())
776 return {};
777 return *it->second;
778}
779
780void LocalVisitor::putUnclosedResult(const Object &object, int64_t delay,
781 llvm::ImmutableList<DebugPoint> history,
782 ObjectToMaxDistance &objectToMaxDistance) {
783 auto &slot = objectToMaxDistance[object];
784 if (slot.first >= delay && delay != 0)
785 return;
786 slot = {delay, history};
787}
788
790 // Wait for the thread to finish.
791 std::unique_lock<std::mutex> lock(mutex);
792 cv.wait(lock, [this] { return done.load(); });
793}
794
795LogicalResult LocalVisitor::markRegEndPoint(Value endPoint, Value start,
796 Value reset, Value resetValue,
797 Value enable) {
798 auto bitWidth = getBitWidth(endPoint);
799 auto record = [&](size_t endPointBitPos, Value value, size_t bitPos) {
800 auto result = getOrComputePaths(value, bitPos);
801 if (failed(result))
802 return failure();
803 for (auto &path : *result) {
804 if (auto blockArg = dyn_cast<BlockArgument>(path.startPoint.value)) {
805 // Not closed.
807 {{}, endPoint, endPointBitPos}, path.delay, path.history,
808 fromInputPortToEndPoint[{blockArg, path.startPoint.bitPos}]);
809 } else {
810 // If the start point is not a port, record to the results.
811 endPointResults[{{}, endPoint, endPointBitPos}].push_back(path);
812 }
813 }
814 return success();
815 };
816
817 // Get paths for each bit, and record them.
818 for (size_t i = 0, e = bitWidth; i < e; ++i) {
819 // Call getOrComputePaths to make sure the paths are computed for endPoint.
820 // This avoids a race condition.
821 if (failed(getOrComputePaths(endPoint, i)))
822 return failure();
823 if (failed(record(i, start, i)))
824 return failure();
825 }
826
827 // Edge from a reg to reset/resetValue.
828 if (reset)
829 for (size_t i = 0, e = bitWidth; i < e; ++i) {
830 if (failed(record(i, reset, 0)) || failed(record(i, resetValue, i)))
831 return failure();
832 }
833
834 // Edge from a reg to enable signal.
835 if (enable)
836 for (size_t i = 0, e = bitWidth; i < e; ++i) {
837 if (failed(record(i, enable, 0)))
838 return failure();
839 }
840
841 return success();
842}
843
844LogicalResult LocalVisitor::markEquivalent(Value from, size_t fromBitPos,
845 Value to, size_t toBitPos,
846 SmallVectorImpl<OpenPath> &results) {
847 [[maybe_unused]] auto leader = ec.getOrInsertLeaderValue({to, toBitPos});
848 // Merge classes, and visit the leader.
849 [[maybe_unused]] auto newLeader =
850 ec.unionSets({to, toBitPos}, {from, fromBitPos});
851 assert(leader == *newLeader);
852 return visitValue(to, toBitPos, results);
853}
854
855LogicalResult LocalVisitor::addEdge(Value to, size_t bitPos, int64_t delay,
856 SmallVectorImpl<OpenPath> &results) {
857 auto result = getOrComputePaths(to, bitPos);
858 if (failed(result))
859 return failure();
860 for (auto &path : *result) {
861 auto newPath = path;
862 newPath.delay += delay;
863 results.push_back(newPath);
864 }
865 return success();
866}
867
868LogicalResult LocalVisitor::visit(BooleanLogicOpInterface op, size_t bitPos,
869 SmallVectorImpl<OpenPath> &results) {
870 return addLogicOp(op, bitPos, results);
871}
872
873LogicalResult LocalVisitor::visit(comb::AndOp op, size_t bitPos,
874 SmallVectorImpl<OpenPath> &results) {
875 return addLogicOp(op, bitPos, results);
876}
877
878LogicalResult LocalVisitor::visit(comb::OrOp op, size_t bitPos,
879 SmallVectorImpl<OpenPath> &results) {
880 return addLogicOp(op, bitPos, results);
881}
882
883LogicalResult LocalVisitor::visit(comb::XorOp op, size_t bitPos,
884 SmallVectorImpl<OpenPath> &results) {
885 return addLogicOp(op, bitPos, results);
886}
887
888LogicalResult LocalVisitor::visit(comb::MuxOp op, size_t bitPos,
889 SmallVectorImpl<OpenPath> &results) {
890 // Add a cost of 1 for the mux.
891 if (failed(addEdge(op.getCond(), 0, 1, results)) ||
892 failed(addEdge(op.getTrueValue(), bitPos, 1, results)) ||
893 failed(addEdge(op.getFalseValue(), bitPos, 1, results)))
894 return failure();
895 filterPaths(results, ctx->doKeepOnlyMaxDelayPaths(), ctx->isLocalScope());
896 return success();
897}
898
899LogicalResult LocalVisitor::visit(comb::TruthTableOp op, size_t bitPos,
900 SmallVectorImpl<OpenPath> &results) {
901 for (auto input : op.getInputs()) {
902 if (failed(addEdge(input, 0, 1, results)))
903 return failure();
904 }
905 return success();
906}
907
908LogicalResult LocalVisitor::visit(comb::ExtractOp op, size_t bitPos,
909 SmallVectorImpl<OpenPath> &results) {
910 assert(getBitWidth(op.getInput()) > bitPos + op.getLowBit());
911 auto result = markEquivalent(op, bitPos, op.getInput(),
912 bitPos + op.getLowBit(), results);
913 return result;
914}
915
916LogicalResult LocalVisitor::visit(comb::ReplicateOp op, size_t bitPos,
917 SmallVectorImpl<OpenPath> &results) {
918 return markEquivalent(op, bitPos, op.getInput(),
919 bitPos % getBitWidth(op.getInput()), results);
920}
921
922LogicalResult LocalVisitor::markStartPoint(Value value, size_t bitPos,
923 SmallVectorImpl<OpenPath> &results) {
924 results.emplace_back(circt::igraph::InstancePath(), value, bitPos);
925 return success();
926}
927
928LogicalResult LocalVisitor::visit(hw::WireOp op, size_t bitPos,
929 SmallVectorImpl<OpenPath> &results) {
930 return markEquivalent(op, bitPos, op.getInput(), bitPos, results);
931}
932
933LogicalResult LocalVisitor::visit(hw::InstanceOp op, size_t bitPos,
934 size_t resultNum,
935 SmallVectorImpl<OpenPath> &results) {
936 auto moduleName = op.getReferencedModuleNameAttr();
937 auto value = op->getResult(resultNum);
938
939 // If an instance graph is not available, we treat instance results as a
940 // start point.
941 if (!ctx->instanceGraph)
942 return markStartPoint(value, bitPos, results);
943
944 // If an instance graph is available, then we can look up the module.
945 auto *node = ctx->instanceGraph->lookup(moduleName);
946 assert(node && "module not found");
947
948 // Otherwise, if the module is not a HWModuleOp, then we should treat it as a
949 // start point.
950 if (!isa<hw::HWModuleOp>(node->getModule()))
951 return markStartPoint(value, bitPos, results);
952
953 auto *localVisitor = ctx->getLocalVisitorMutable(moduleName);
954
955 auto module = localVisitor->getHWModuleOp();
956 auto operand = module.getBodyBlock()->getTerminator()->getOperand(resultNum);
957 auto result = localVisitor->getOrComputePaths(operand, bitPos);
958 if (failed(result))
959 return failure();
960
961 for (auto &path : *result) {
962 auto delay = path.delay;
963 auto history = path.history;
964 auto newPath =
965 instancePathCache->prependInstance(op, path.startPoint.instancePath);
966 auto startPointPoint = path.startPoint;
967 // If the start point is not a block argument, record it directly.
968 auto arg = dyn_cast<BlockArgument>(startPointPoint.value);
969 if (!arg) {
970 // Update the history to have correct instance path.
971 auto newHistory = debugPointFactory->getEmptyList();
972 if (ctx->doTraceDebugPoints()) {
973 newHistory =
974 mapList(debugPointFactory.get(), history, [&](DebugPoint p) {
975 p.object.instancePath =
976 instancePathCache->prependInstance(op, p.object.instancePath);
977 return p;
978 });
979 newHistory = debugPointFactory->add(
980 DebugPoint({}, value, bitPos, delay, "output port"), newHistory);
981 }
982
983 results.emplace_back(newPath, startPointPoint.value,
984 startPointPoint.bitPos, delay, newHistory);
985 continue;
986 }
987
988 // Otherwise, we need to look up the instance operand.
989 auto result = getOrComputePaths(op->getOperand(arg.getArgNumber()),
990 startPointPoint.bitPos);
991 if (failed(result))
992 return failure();
993 for (auto path : *result) {
994 auto newHistory = debugPointFactory->getEmptyList();
995 if (ctx->doTraceDebugPoints()) {
996 // Update the history to have correct instance path.
997 newHistory =
998 mapList(debugPointFactory.get(), history, [&](DebugPoint p) {
999 p.object.instancePath =
1000 instancePathCache->prependInstance(op, p.object.instancePath);
1001 p.delay += path.delay;
1002 return p;
1003 });
1004 DebugPoint debugPoint({}, value, bitPos, delay + path.delay,
1005 "output port");
1006 newHistory = debugPointFactory->add(debugPoint, newHistory);
1007 }
1008
1009 path.delay += delay;
1010 path.history =
1011 concatList(debugPointFactory.get(), newHistory, path.history);
1012 results.push_back(path);
1013 }
1014 }
1015 return success();
1016}
1017
1018LogicalResult LocalVisitor::visit(comb::ConcatOp op, size_t bitPos,
1019 SmallVectorImpl<OpenPath> &results) {
1020 // Find the exact bit pos in the concat.
1021 size_t newBitPos = bitPos;
1022 for (auto operand : llvm::reverse(op.getInputs())) {
1023 auto size = getBitWidth(operand);
1024 if (newBitPos >= size) {
1025 newBitPos -= size;
1026 continue;
1027 }
1028 return markEquivalent(op, bitPos, operand, newBitPos, results);
1029 }
1030
1031 llvm::report_fatal_error("Should not reach here");
1032 return failure();
1033}
1034
1035LogicalResult LocalVisitor::addLogicOp(Operation *op, size_t bitPos,
1036 SmallVectorImpl<OpenPath> &results) {
1037 auto cost = isa<BooleanLogicOpInterface>(op)
1038 ? cast<BooleanLogicOpInterface>(op).getLogicDepthCost()
1039 : llvm::Log2_64_Ceil(op->getNumOperands());
1040 // Create edges each operand with cost ceil(log(size)).
1041 for (auto operand : op->getOperands())
1042 if (failed(addEdge(operand, bitPos, cost, results)))
1043 return failure();
1044 filterPaths(results, ctx->doKeepOnlyMaxDelayPaths(), ctx->isLocalScope());
1045 return success();
1046}
1047
1048LogicalResult LocalVisitor::visitDefault(OpResult value, size_t bitPos,
1049 SmallVectorImpl<OpenPath> &results) {
1050 if (!isa_and_nonnull<hw::HWDialect, comb::CombDialect>(
1051 value.getDefiningOp()->getDialect()))
1052 return success();
1053 // Query it to an operation analyzer.
1054 LLVM_DEBUG({
1055 llvm::dbgs() << "Visiting default: ";
1056 llvm::dbgs() << " " << value << "[" << bitPos << "]\n";
1057 });
1058 SmallVector<std::tuple<size_t, size_t, int64_t>> oracleResults;
1059 auto paths =
1060 operationAnalyzer->analyzeOperation(value, bitPos, oracleResults);
1061 if (failed(paths)) {
1062 LLVM_DEBUG({
1063 llvm::dbgs() << "Failed to get results for: " << value << "[" << bitPos
1064 << "]\n";
1065 });
1066 return success();
1067 }
1068 auto *op = value.getDefiningOp();
1069 for (auto [inputPortIndex, startPointBitPos, delay] : oracleResults) {
1070 LLVM_DEBUG({
1071 llvm::dbgs() << "Adding edge: " << value << "[" << bitPos << "] -> "
1072 << op->getOperand(inputPortIndex) << "[" << startPointBitPos
1073 << "] with delay " << delay << "\n";
1074 });
1075 if (failed(addEdge(op->getOperand(inputPortIndex), startPointBitPos, delay,
1076 results)))
1077 return failure();
1078 }
1079 return success();
1080}
1081
1082LogicalResult LocalVisitor::visit(mlir::BlockArgument arg, size_t bitPos,
1083 SmallVectorImpl<OpenPath> &results) {
1084 assert(arg.getOwner() == module.getBodyBlock());
1085
1086 // Record a debug point.
1087 auto newHistory = ctx->doTraceDebugPoints()
1088 ? debugPointFactory->add(
1089 DebugPoint({}, arg, bitPos, 0, "input port"), {})
1090 : debugPointFactory->getEmptyList();
1091 OpenPath newPoint({}, arg, bitPos, 0, newHistory);
1092 results.push_back(newPoint);
1093 return success();
1094}
1095
1096FailureOr<ArrayRef<OpenPath>> LocalVisitor::getOrComputePaths(Value value,
1097 size_t bitPos) {
1098 if (auto *op = value.getDefiningOp())
1099 if (op->hasTrait<OpTrait::ConstantLike>())
1100 return ArrayRef<OpenPath>{};
1101
1102 if (ec.contains({value, bitPos})) {
1103 auto leader = ec.findLeader({value, bitPos});
1104 // If this is not the leader, then use the leader.
1105 if (*leader != std::pair(value, bitPos)) {
1106 return getOrComputePaths(leader->first, leader->second);
1107 }
1108 }
1109
1110 auto it = cachedResults.find({value, bitPos});
1111 if (it != cachedResults.end())
1112 return ArrayRef<OpenPath>(*it->second);
1113
1114 auto results = std::make_unique<SmallVector<OpenPath>>();
1115 if (failed(visitValue(value, bitPos, *results)))
1116 return {};
1117
1118 // Unique the results.
1119 filterPaths(*results, ctx->doKeepOnlyMaxDelayPaths(), ctx->isLocalScope());
1120 LLVM_DEBUG({
1121 llvm::dbgs() << value << "[" << bitPos << "] "
1122 << "Found " << results->size() << " paths\n";
1123 llvm::dbgs() << "====Paths:\n";
1124 for (auto &path : *results) {
1125 path.print(llvm::dbgs());
1126 llvm::dbgs() << "\n";
1127 }
1128 llvm::dbgs() << "====\n";
1129 });
1130
1131 auto insertedResult =
1132 cachedResults.try_emplace({value, bitPos}, std::move(results));
1133 assert(insertedResult.second);
1134 return ArrayRef<OpenPath>(*insertedResult.first->second);
1135}
1136
1137LogicalResult LocalVisitor::visitValue(Value value, size_t bitPos,
1138 SmallVectorImpl<OpenPath> &results) {
1139 LLVM_DEBUG({
1140 llvm::dbgs() << "Visiting: ";
1141 llvm::dbgs() << " " << value << "[" << bitPos << "]\n";
1142 });
1143
1144 if (auto blockArg = dyn_cast<mlir::BlockArgument>(value))
1145 return visit(blockArg, bitPos, results);
1146
1147 auto *op = value.getDefiningOp();
1148
1149 if (op->hasTrait<OpTrait::ConstantLike>())
1150 return success();
1151
1152 auto result =
1153 TypeSwitch<Operation *, LogicalResult>(op)
1154 .Case<comb::ConcatOp, comb::ExtractOp, comb::ReplicateOp,
1155 BooleanLogicOpInterface, comb::AndOp, comb::OrOp, comb::MuxOp,
1156 comb::XorOp, comb::TruthTableOp, seq::FirRegOp, seq::CompRegOp,
1157 seq::FirMemReadOp, seq::FirMemReadWriteOp, hw::WireOp>(
1158 [&](auto op) {
1159 size_t idx = results.size();
1160 auto result = visit(op, bitPos, results);
1161 if (ctx->doTraceDebugPoints())
1162 if (auto name = op->template getAttrOfType<StringAttr>(
1163 "sv.namehint")) {
1164
1165 for (auto i = idx, e = results.size(); i < e; ++i) {
1166 DebugPoint debugPoint({}, value, bitPos, results[i].delay,
1167 "namehint");
1168 auto newHistory = debugPointFactory->add(
1169 debugPoint, results[i].history);
1170 results[i].history = newHistory;
1171 }
1172 }
1173 return result;
1174 })
1175 .Case<hw::InstanceOp>([&](hw::InstanceOp op) {
1176 return visit(op, bitPos, cast<OpResult>(value).getResultNumber(),
1177 results);
1178 })
1179 .Default([&](auto op) {
1180 return visitDefault(cast<OpResult>(value), bitPos, results);
1181 });
1182 return result;
1183}
1184
1185LogicalResult LocalVisitor::initializeAndRun(hw::InstanceOp instance) {
1186 const auto *childVisitor =
1187 ctx->getLocalVisitorMutable(instance.getReferencedModuleNameAttr());
1188 // If not found, the module is blackbox so skip it.
1189 if (!childVisitor)
1190 return success();
1191
1192 // Connect dataflow from instance input ports to end point in the child.
1193 for (const auto &[object, openPaths] :
1194 childVisitor->getFromInputPortToEndPoint()) {
1195 auto [arg, argBitPos] = object;
1196 for (auto [point, delayAndHistory] : openPaths) {
1197 auto [instancePath, endPoint, endPointBitPos] = point;
1198 auto [delay, history] = delayAndHistory;
1199 // Prepend the instance path.
1201 auto newPath = instancePathCache->prependInstance(instance, instancePath);
1202 auto computedResults =
1203 getOrComputePaths(instance.getOperand(arg.getArgNumber()), argBitPos);
1204 if (failed(computedResults))
1205 return failure();
1206
1207 for (auto &result : *computedResults) {
1208 // Update debug history for this path segment if tracing is enabled.
1209 auto newHistory = ctx->doTraceDebugPoints()
1210 ? mapList(debugPointFactory.get(), history,
1211 [&](DebugPoint p) {
1212 // Update the instance path to
1213 // prepend the current instance.
1214 p.object.instancePath = newPath;
1215 p.delay += result.delay;
1216 return p;
1217 })
1218 : debugPointFactory->getEmptyList();
1219 Object newEndPoint(newPath, endPoint, endPointBitPos);
1220 // Determine if this path continues upward or terminates here.
1221 // If the start point is a module input port, the path
1222 // continues to the parent module and needs further propagation.
1223 if (auto newPort = dyn_cast<BlockArgument>(result.startPoint.value)) {
1224 // Record as "unclosed" - this path segment crosses module
1225 // boundaries and needs to be combined with paths in the parent.
1227 newEndPoint, result.delay + delay, newHistory,
1228 fromInputPortToEndPoint[{newPort, result.startPoint.bitPos}]);
1229 } else {
1230 // This path originates from an internal sequential element
1231 // in the parent module, so it's a complete register-to-register path
1232 // that can be recorded as closed.
1233 endPointResults[newEndPoint].emplace_back(
1234 result.startPoint, result.delay + delay,
1235 ctx->doTraceDebugPoints() ? concatList(debugPointFactory.get(),
1236 newHistory, result.history)
1237 : debugPointFactory->getEmptyList());
1238 }
1239 }
1240 }
1241 }
1242
1243 // Pre-compute the results for the instance output ports.
1244 for (auto instance : instance->getResults()) {
1245 for (size_t i = 0, e = getBitWidth(instance); i < e; ++i) {
1246 auto computedResults = getOrComputePaths(instance, i);
1247 if (failed(computedResults))
1248 return failure();
1249 }
1250 }
1251 return success();
1252}
1253
1254LogicalResult LocalVisitor::initializeAndRun(hw::OutputOp output) {
1255 for (OpOperand &operand : output->getOpOperands()) {
1256 for (size_t i = 0, e = getBitWidth(operand.get()); i < e; ++i) {
1257 auto &recordOutput =
1258 fromOutputPortToStartPoint[{operand.getOperandNumber(), i}];
1259 auto computedResults = getOrComputePaths(operand.get(), i);
1260 if (failed(computedResults))
1261 return failure();
1262 for (const auto &result : *computedResults) {
1263 putUnclosedResult(result.startPoint, result.delay, result.history,
1264 recordOutput);
1265 }
1266 }
1267 }
1268 return success();
1269}
1270
1272 LLVM_DEBUG({ ctx->notifyStart(module.getModuleNameAttr()); });
1273 if (ctx->doLazyComputation())
1274 return success();
1275
1276 // Initialize the results for the block arguments.
1277 for (auto blockArgument : module.getBodyBlock()->getArguments())
1278 for (size_t i = 0, e = getBitWidth(blockArgument); i < e; ++i)
1279 (void)getOrComputePaths(blockArgument, i);
1280
1281 auto walkResult = module->walk([&](Operation *op) {
1282 auto result =
1283 mlir::TypeSwitch<Operation *, LogicalResult>(op)
1284 .Case<seq::FirRegOp>([&](seq::FirRegOp op) {
1285 return markRegEndPoint(op, op.getNext(), op.getReset(),
1286 op.getResetValue());
1287 })
1288 .Case<seq::CompRegOp>([&](auto op) {
1289 return markRegEndPoint(op, op.getInput(), op.getReset(),
1290 op.getResetValue());
1291 })
1292 .Case<seq::FirMemWriteOp>([&](auto op) {
1293 // TODO: Add address.
1294 return markRegEndPoint(op.getMemory(), op.getData(), {}, {},
1295 op.getEnable());
1296 })
1297 .Case<seq::FirMemReadWriteOp>([&](seq::FirMemReadWriteOp op) {
1298 // TODO: Add address.
1299 return markRegEndPoint(op.getMemory(), op.getWriteData(), {}, {},
1300 op.getEnable());
1301 })
1302 .Case<BooleanLogicOpInterface, comb::AndOp, comb::OrOp, comb::XorOp,
1303 comb::MuxOp, seq::FirMemReadOp>([&](auto op) {
1304 // NOTE: Visiting and-inverter is not necessary but
1305 // useful to reduce recursion depth.
1306 Value result = op->getResult(0);
1307 for (size_t i = 0, e = getBitWidth(result); i < e; ++i)
1308 if (failed(getOrComputePaths(result, i)))
1309 return failure();
1310 return success();
1311 })
1312 .Case<hw::InstanceOp, hw::OutputOp>(
1313 [&](auto op) { return initializeAndRun(op); })
1314 .Default([](auto op) { return success(); });
1315 if (failed(result))
1316 return WalkResult::interrupt();
1317 return WalkResult::advance();
1318 });
1319
1320 {
1321 std::lock_guard<std::mutex> lock(mutex);
1322 done.store(true);
1323 cv.notify_all();
1324 }
1325 LLVM_DEBUG({ ctx->notifyEnd(module.getModuleNameAttr()); });
1326 return failure(walkResult.wasInterrupted());
1327}
1328
1329//===----------------------------------------------------------------------===//
1330// Context
1331//===----------------------------------------------------------------------===//
1332
1333const LocalVisitor *Context::getLocalVisitor(StringAttr name) const {
1334 return getLocalVisitorMutable(name);
1335}
1336
1338 auto *it = localVisitors.find(name);
1339 if (it == localVisitors.end())
1340 return nullptr;
1341
1342 if (isRunningParallel())
1343 it->second->waitUntilDone();
1344
1345 // NOTE: Don't call waitUntilDone here.
1346 return it->second.get();
1347}
1348
1349// ===----------------------------------------------------------------------===//
1350// OperationAnalyzer
1351// ===----------------------------------------------------------------------===//
1352
1353FailureOr<LocalVisitor *>
1355 // Check cache first.
1356 auto opName = op->getName();
1357 auto functionType = getFunctionTypeForOp(op);
1358 auto key = std::make_pair(opName, functionType);
1359 auto it = cache.find(key);
1360 if (it != cache.end())
1361 return it->second.get();
1362
1363 SmallVector<hw::PortInfo> ports;
1364 // Helper to convert types into integer types.
1365 auto getType = [&](Type type) -> Type {
1366 if (type.isInteger())
1367 return type;
1368 auto bitWidth = hw::getBitWidth(type);
1369 if (bitWidth < 0)
1370 return Type(); // Unsupported type
1371 return IntegerType::get(op->getContext(), bitWidth);
1372 };
1373
1374 // Helper to add a port to the module definition
1375 auto addPort = [&](Type type, hw::ModulePort::Direction dir) {
1376 hw::PortInfo portInfo;
1377 portInfo.dir = dir;
1378 portInfo.name = emptyName;
1379 portInfo.type = type;
1380 ports.push_back(portInfo);
1381 };
1382
1383 // Create input ports for each operand
1384 for (auto input : op->getOperands()) {
1385 auto type = getType(input.getType());
1386 if (!type)
1387 return failure(); // Unsupported operand type
1388 addPort(type, hw::ModulePort::Direction::Input);
1389 }
1390
1391 // Create output ports for each result.
1392 SmallVector<Type> resultsTypes;
1393 for (Value result : op->getResults()) {
1394 auto type = getType(result.getType());
1395 if (!type)
1396 return failure(); // Unsupported result type
1397 addPort(type, hw::ModulePort::Direction::Output);
1398 resultsTypes.push_back(type);
1399 }
1400
1401 // Build the wrapper HW module
1402 OpBuilder builder(op->getContext());
1403 builder.setInsertionPointToEnd(moduleOp->getBody());
1404
1405 // Generate unique module name.
1406 auto moduleName = builder.getStringAttr("module_" + Twine(cache.size()));
1407 hw::HWModuleOp hwModule =
1408 hw::HWModuleOp::create(builder, op->getLoc(), moduleName, ports);
1409
1410 // Clone the operation inside the wrapper module
1411 builder.setInsertionPointToStart(hwModule.getBodyBlock());
1412 auto *cloned = builder.clone(*op);
1413
1414 // Connect module inputs to cloned operation operands
1415 // Handle type mismatches with bitcast operations
1416 // Type mismatches can occur when the original operation uses non-integer
1417 // types (e.g., structs, arrays) that get converted to integer types for the
1418 // wrapper module ports. Since we use the same bit width via
1419 // hw::getBitWidth(), bitcast is safe for bit-compatible types.
1420 for (auto arg : hwModule.getBodyBlock()->getArguments()) {
1421 Value input = arg;
1422 auto idx = arg.getArgNumber();
1423
1424 // Insert bitcast if input port type differs from operand type
1425 if (input.getType() != cloned->getOperand(idx).getType())
1426 input = hw::BitcastOp::create(builder, op->getLoc(),
1427 cloned->getOperand(idx).getType(), input);
1428
1429 cloned->setOperand(idx, input);
1430 }
1431
1432 // Connect cloned operation results to module outputs
1433 // Handle type mismatches with bitcast operations
1434 SmallVector<Value> outputs;
1435 for (auto result : cloned->getResults()) {
1436 auto idx = result.getResultNumber();
1437
1438 // Insert bitcast if result type differs from output port type
1439 if (result.getType() != resultsTypes[idx])
1440 result = hw::BitcastOp::create(builder, op->getLoc(), resultsTypes[idx],
1441 result)
1442 ->getResult(0);
1443
1444 outputs.push_back(result);
1445 }
1446
1447 hwModule.getBodyBlock()->getTerminator()->setOperands(outputs);
1448
1449 // Run conversion pipeline (HW -> Comb -> AIG -> cleanup)
1450 if (!passManager && failed(initializePipeline()))
1451 return mlir::emitError(loc)
1452 << "Failed to initialize pipeline, possibly passes used in the "
1453 "analysis are not registered";
1454
1455 if (failed(passManager->run(moduleOp->getOperation())))
1456 return mlir::emitError(loc) << "Failed to run lowering pipeline";
1457
1458 // Create LocalVisitor to analyze the converted AIG module
1459 auto localVisitor = std::make_unique<LocalVisitor>(hwModule, &ctx);
1460 if (failed(localVisitor->initializeAndRun()))
1461 return failure();
1462
1463 // Cache the result and return
1464 auto [iterator, inserted] = cache.insert({key, std::move(localVisitor)});
1465 assert(inserted && "Cache insertion must succeed for new key");
1466 return iterator->second.get();
1467}
1468
1470 OpResult value, size_t bitPos,
1471 SmallVectorImpl<std::tuple<size_t, size_t, int64_t>> &results) {
1472 auto *op = value.getDefiningOp();
1473 auto localVisitorResult = getOrComputeLocalVisitor(op);
1474 if (failed(localVisitorResult))
1475 return failure();
1476
1477 auto *localVisitor = *localVisitorResult;
1478
1479 // Get output.
1480 Value operand =
1481 localVisitor->getHWModuleOp().getBodyBlock()->getTerminator()->getOperand(
1482 value.getResultNumber());
1483 auto openPaths = localVisitor->getOrComputePaths(operand, bitPos);
1484 if (failed(openPaths))
1485 return failure();
1486
1487 results.reserve(openPaths->size() + results.size());
1488 for (auto &path : *openPaths) {
1489 // end point is always a block argument since there is no other value that
1490 // could be a start point.
1491 BlockArgument blockArg = cast<BlockArgument>(path.startPoint.value);
1492 auto inputPortIndex = blockArg.getArgNumber();
1493 results.push_back(
1494 std::make_tuple(inputPortIndex, path.startPoint.bitPos, path.delay));
1495 }
1496
1497 return success();
1498}
1499
1501 passManager = std::make_unique<mlir::PassManager>(loc->getContext());
1502 return parsePassPipeline(pipelineStr, *passManager);
1503}
1504
1505//===----------------------------------------------------------------------===//
1506// LongestPathAnalysis::Impl
1507//===----------------------------------------------------------------------===//
1508
1509/// Internal implementation for LongestPathAnalysis.
1510///
1511/// This class owns per-module LocalVisitors, orchestrates initialization over
1512/// the instance graph, and provides the concrete implementations for the
1513/// public LongestPathAnalysis API.
1515 Impl(Operation *module, mlir::AnalysisManager &am,
1516 const LongestPathAnalysisOptions &option);
1517
1518 /// Initialize and run analysis for a full MLIR module (hierarchical).
1519 LogicalResult initializeAndRun(mlir::ModuleOp module);
1520
1521 /// Initialize and run analysis for a single HW module (local scope).
1522 LogicalResult initializeAndRun(hw::HWModuleOp module);
1523
1524 /// Return true if we have a LocalVisitor for the given HW module.
1525 bool isAnalysisAvailable(StringAttr moduleName) const;
1526
1527 /// Compute hierarchical timing paths to (value, bitPos) and append to
1528 /// results.
1529 LogicalResult computeGlobalPaths(Value value, size_t bitPos,
1530 SmallVectorImpl<DataflowPath> &results);
1531
1532 /// Collect register-to-register (closed) paths within the module. When
1533 /// 'elaborate' is true, paths are elaborated with instance paths from
1534 /// `moduleName`.
1535 template <bool elaborate>
1536 LogicalResult
1537 collectClosedPaths(StringAttr moduleName,
1538 SmallVectorImpl<DataflowPath> &results) const;
1539
1540 /// Collect open paths from module input ports to internal sequential sinks.
1541 LogicalResult
1542 collectInputToInternalPaths(StringAttr moduleName,
1543 SmallVectorImpl<DataflowPath> &results) const;
1544
1545 /// Collect open paths from internal sequential sources to module output
1546 /// ports.
1547 LogicalResult
1548 collectInternalToOutputPaths(StringAttr moduleName,
1549 SmallVectorImpl<DataflowPath> &results) const;
1550
1551 /// Top modules inferred or specified for this analysis run.
1552 llvm::ArrayRef<hw::HWModuleOp> getTopModules() const { return topModules; }
1553
1554 /// Return average of per-bit max delays for a value.
1555 FailureOr<int64_t> getAverageMaxDelay(Value value);
1556
1557 /// Return the max delay for a value.
1558 FailureOr<int64_t> getMaxDelay(Value value, int64_t bitPos);
1559
1560 /// Compute local open paths to (value, bitPos).
1561 FailureOr<ArrayRef<OpenPath>> computeLocalPaths(Value value, size_t bitPos);
1562
1563protected:
1565
1566private:
1567 /// Recursive helper for computeGlobalPaths.
1568 LogicalResult computeGlobalPaths(const Object &originalObject, Value value,
1569 size_t bitPos,
1570 SmallVectorImpl<DataflowPath> &results);
1571
1572 /// Analysis context.
1574 /// Top-level HW modules that seed hierarchical analysis.
1575 SmallVector<hw::HWModuleOp> topModules;
1576};
1577
1579 Value value, size_t bitPos, SmallVectorImpl<DataflowPath> &results) {
1580 return computeGlobalPaths(Object({}, value, bitPos), value, bitPos, results);
1581}
1582
1584 const Object &originalObject, Value value, size_t bitPos,
1585 SmallVectorImpl<DataflowPath> &results) {
1586 auto parentHWModule =
1587 value.getParentRegion()->getParentOfType<hw::HWModuleOp>();
1588 if (!parentHWModule)
1589 return mlir::emitError(value.getLoc())
1590 << "query value is not in a HWModuleOp";
1591 auto *localVisitor =
1592 ctx.getLocalVisitorMutable(parentHWModule.getModuleNameAttr());
1593 if (!localVisitor)
1594 return success();
1595
1596 auto *instancePathCache = localVisitor->getInstancePathCache();
1597 size_t oldIndex = results.size();
1598 auto *node =
1599 ctx.instanceGraph
1600 ? ctx.instanceGraph->lookup(parentHWModule.getModuleNameAttr())
1601 : nullptr;
1602 LLVM_DEBUG({
1603 llvm::dbgs() << "Running " << parentHWModule.getModuleNameAttr() << " "
1604 << value << " " << bitPos << "\n";
1605 });
1606 auto paths = localVisitor->getOrComputePaths(value, bitPos);
1607 if (failed(paths))
1608 return failure();
1609
1610 for (auto &path : *paths) {
1611 auto arg = dyn_cast<BlockArgument>(path.startPoint.value);
1612 if (!arg || localVisitor->isTopLevel()) {
1613 // If the value is not a block argument, then we are done.
1614 results.push_back({originalObject, path, parentHWModule});
1615 continue;
1616 }
1617
1618 auto newObject = originalObject;
1619 assert(node && "If an instance graph is not available, localVisitor must "
1620 "be a toplevel");
1621 for (auto *inst : node->uses()) {
1622 auto startIndex = results.size();
1623 if (instancePathCache)
1624 newObject.instancePath = instancePathCache->appendInstance(
1625 originalObject.instancePath, inst->getInstance());
1626
1627 auto result = computeGlobalPaths(
1628 newObject, inst->getInstance()->getOperand(arg.getArgNumber()),
1629 path.startPoint.bitPos, results);
1630 if (failed(result))
1631 return result;
1632 for (auto i = startIndex, e = results.size(); i < e; ++i)
1633 results[i].setDelay(results[i].getDelay() + path.delay);
1634 }
1635 }
1636
1637 filterPaths(results, oldIndex);
1638 return success();
1639}
1640
1641template <bool elaborate>
1643 StringAttr moduleName, SmallVectorImpl<DataflowPath> &results) const {
1644 auto collectClosedPaths = [&](StringAttr name,
1645 SmallVectorImpl<DataflowPath> &localResults,
1646 igraph::InstanceGraphNode *top = nullptr) {
1647 if (!isAnalysisAvailable(name))
1648 return;
1649 auto *visitor = ctx.getLocalVisitorMutable(name);
1650 for (auto &[point, state] : visitor->getEndPointResults()) {
1651 for (const auto &dataFlow : state) {
1652 if constexpr (elaborate) {
1653 // If elaborate, we need to prepend the path to the root.
1654 auto *instancePathCache = visitor->getInstancePathCache();
1655 auto topToRoot = instancePathCache->getRelativePaths(
1656 visitor->getHWModuleOp(), top);
1657 for (auto &instancePath : topToRoot) {
1658 localResults.emplace_back(point, dataFlow,
1659 top->getModule<hw::HWModuleOp>());
1660 localResults.back().prependPaths(*visitor->getInstancePathCache(),
1661 visitor->getDebugPointFactory(),
1662 instancePath);
1663 }
1664 } else {
1665 localResults.emplace_back(point, dataFlow, visitor->getHWModuleOp());
1666 }
1667 }
1668 }
1669 };
1670
1671 if (ctx.instanceGraph) {
1672 // Accumulate all closed results under the given module.
1673 auto *node = ctx.instanceGraph->lookup(moduleName);
1675 // Prepare the results map for parallel processing.
1676 for (auto *child : llvm::post_order(node))
1677 resultsMap[child->getModule().getModuleNameAttr()] = {};
1678
1679 mlir::parallelForEach(
1680 node->getModule().getContext(), resultsMap,
1681 [&](auto &it) { collectClosedPaths(it.first, it.second, node); });
1682
1683 for (auto &[name, localResults] : resultsMap)
1684 results.append(localResults.begin(), localResults.end());
1685 } else {
1686 collectClosedPaths(moduleName, results);
1687 }
1688
1689 return success();
1690}
1691
1693 StringAttr moduleName, SmallVectorImpl<DataflowPath> &results) const {
1694 auto *visitor = ctx.getLocalVisitor(moduleName);
1695 if (!visitor)
1696 return failure();
1697
1698 for (auto &[key, value] : visitor->getFromInputPortToEndPoint()) {
1699 auto [arg, argBitPos] = key;
1700 for (auto [point, delayAndHistory] : value) {
1701 auto [path, start, startBitPos] = point;
1702 auto [delay, history] = delayAndHistory;
1703 results.emplace_back(Object(path, start, startBitPos),
1704 OpenPath({}, arg, argBitPos, delay, history),
1705 visitor->getHWModuleOp());
1706 }
1707 }
1708
1709 return success();
1710}
1711
1713 StringAttr moduleName, SmallVectorImpl<DataflowPath> &results) const {
1714 auto *visitor = ctx.getLocalVisitor(moduleName);
1715 if (!visitor)
1716 return failure();
1717
1718 for (auto &[key, value] : visitor->getFromOutputPortToStartPoint()) {
1719 auto [resultNum, bitPos] = key;
1720 for (auto [point, delayAndHistory] : value) {
1721 auto [path, start, startBitPos] = point;
1722 auto [delay, history] = delayAndHistory;
1723 results.emplace_back(
1724 std::make_tuple(visitor->getHWModuleOp(), resultNum, bitPos),
1725 OpenPath(path, start, startBitPos, delay, history),
1726 visitor->getHWModuleOp());
1727 }
1728 }
1729
1730 return success();
1731}
1732
1733LongestPathAnalysis::Impl::Impl(Operation *moduleOp, mlir::AnalysisManager &am,
1734 const LongestPathAnalysisOptions &option)
1735 : ctx(isa<mlir::ModuleOp>(moduleOp)
1736 ? &am.getAnalysis<igraph::InstanceGraph>()
1737 : nullptr,
1738 option) {
1739 if (auto module = dyn_cast<mlir::ModuleOp>(moduleOp)) {
1740 if (failed(initializeAndRun(module)))
1741 llvm::report_fatal_error("Failed to run longest path analysis");
1742 } else if (auto hwMod = dyn_cast<hw::HWModuleOp>(moduleOp)) {
1743 if (failed(initializeAndRun(hwMod)))
1744 llvm::report_fatal_error("Failed to run longest path analysis");
1745 } else {
1746 llvm::report_fatal_error("Analysis scheduled on invalid operation");
1747 }
1748}
1749
1750LogicalResult
1752 auto it =
1753 ctx.localVisitors.insert({module.getModuleNameAttr(),
1754 std::make_unique<LocalVisitor>(module, &ctx)});
1755 assert(it.second);
1756 it.first->second->setTopLevel();
1757 return it.first->second->initializeAndRun();
1758}
1759
1760LogicalResult
1762 auto topNameAttr = ctx.getTopModuleName();
1763 topModules.clear();
1764 llvm::SetVector<Operation *> visited;
1765 auto *instanceGraph = ctx.instanceGraph;
1766 if (topNameAttr && topNameAttr.getValue() != "") {
1767 auto *topNode = instanceGraph->lookupOrNull(topNameAttr);
1768 if (!topNode || !topNode->getModule() ||
1769 !isa<hw::HWModuleOp>(topNode->getModule())) {
1770 module.emitError() << "top module not found in instance graph "
1771 << topNameAttr;
1772 return failure();
1773 }
1774 topModules.push_back(topNode->getModule<hw::HWModuleOp>());
1775 } else {
1776 auto inferredResults = instanceGraph->getInferredTopLevelNodes();
1777 if (failed(inferredResults))
1778 return inferredResults;
1779
1780 for (auto *node : *inferredResults) {
1781 if (auto top = dyn_cast<hw::HWModuleOp>(*node->getModule()))
1782 topModules.push_back(top);
1783 }
1784 }
1785
1786 SmallVector<igraph::InstanceGraphNode *> worklist;
1787 for (auto topNode : topModules)
1788 worklist.push_back(instanceGraph->lookup(topNode.getModuleNameAttr()));
1789 // Get a set of design modules that are reachable from the top nodes,
1790 // excluding bound instances.
1791 while (!worklist.empty()) {
1792 auto *node = worklist.pop_back_val();
1793 assert(node && "node should not be null");
1794 auto op = node->getModule();
1795 if (!isa_and_nonnull<hw::HWModuleOp>(op) || !visited.insert(op))
1796 continue;
1797
1798 for (auto *child : *node) {
1799 auto childOp = child->getInstance();
1800 if (!childOp || childOp->hasAttr("doNotPrint"))
1801 continue;
1802
1803 worklist.push_back(child->getTarget());
1804 }
1805 }
1806
1807 // Initialize the local visitors if the module was visited, in the
1808 // post-order of the instance graph.
1809 for (auto module : topModules) {
1810 auto *topNode = instanceGraph->lookup(module.getModuleNameAttr());
1811 for (auto *node : llvm::post_order(topNode))
1812 if (node && node->getModule())
1813 if (auto hwMod = dyn_cast<hw::HWModuleOp>(*node->getModule())) {
1814 if (visited.contains(hwMod))
1815 ctx.localVisitors.insert(
1816 {hwMod.getModuleNameAttr(),
1817 std::make_unique<LocalVisitor>(hwMod, &ctx)});
1818 }
1819
1820 ctx.localVisitors[topNode->getModule().getModuleNameAttr()]->setTopLevel();
1821 }
1822
1823 return mlir::failableParallelForEach(
1824 module.getContext(), ctx.localVisitors,
1825 [&](auto &it) { return it.second->initializeAndRun(); });
1826}
1827
1829 StringAttr moduleName) const {
1830 return ctx.localVisitors.find(moduleName) != ctx.localVisitors.end();
1831}
1832// Return the average of the maximum delays across all bits of the given
1833// value, which is useful approximation for the delay of the value. For each
1834// bit position, finds all paths and takes the maximum delay. Then averages
1835// these maximum delays across all bits of the value.
1836FailureOr<int64_t> LongestPathAnalysis::Impl::getAverageMaxDelay(Value value) {
1837 SmallVector<DataflowPath> results;
1838 size_t bitWidth = getBitWidth(value);
1839 if (bitWidth == 0)
1840 return 0;
1841 int64_t totalDelay = 0;
1842 for (size_t i = 0; i < bitWidth; ++i) {
1843 // Clear results from previous iteration.
1844 results.clear();
1845 auto result = computeGlobalPaths(value, i, results);
1846 if (failed(result))
1847 return failure();
1848
1849 int64_t maxDelay = getMaxDelayInPaths(ArrayRef<DataflowPath>(results));
1850 totalDelay += maxDelay;
1851 }
1852 return llvm::divideCeil(totalDelay, bitWidth);
1853}
1854
1855FailureOr<int64_t> LongestPathAnalysis::Impl::getMaxDelay(Value value,
1856 int64_t bitPos) {
1857 SmallVector<DataflowPath> results;
1858 auto collectAndFindMax = ([&](int64_t bitPos) -> FailureOr<int64_t> {
1859 results.clear();
1860 auto result = computeGlobalPaths(value, bitPos, results);
1861 if (failed(result))
1862 return failure();
1863 return getMaxDelayInPaths(ArrayRef<DataflowPath>(results));
1864 });
1865 if (bitPos >= 0)
1866 return collectAndFindMax(bitPos);
1867
1868 size_t bitWidth = getBitWidth(value);
1869 if (bitWidth == 0)
1870 return 0;
1871
1872 int64_t maxDelay = 0;
1873 for (size_t i = 0; i < bitWidth; ++i) {
1874 auto result = collectAndFindMax(i);
1875 if (failed(result))
1876 return failure();
1877 maxDelay = std::max(maxDelay, *result);
1878 }
1879 return maxDelay;
1880}
1881
1882FailureOr<ArrayRef<OpenPath>>
1884 auto parentHWModule =
1885 value.getParentRegion()->getParentOfType<hw::HWModuleOp>();
1886 if (!parentHWModule)
1887 return mlir::emitError(value.getLoc())
1888 << "query value is not in a HWModuleOp";
1889 assert(ctx.localVisitors.size() == 1 &&
1890 "In incremental mode, there should be only one local visitor");
1891
1892 auto *localVisitor =
1893 ctx.getLocalVisitorMutable(parentHWModule.getModuleNameAttr());
1894 if (!localVisitor)
1895 return mlir::emitError(value.getLoc())
1896 << "the local visitor for the given value does not exist";
1897 return localVisitor->getOrComputePaths(value, bitPos);
1898}
1899
1900//===----------------------------------------------------------------------===//
1901// LongestPathAnalysis
1902//===----------------------------------------------------------------------===//
1903
1904LongestPathAnalysis::~LongestPathAnalysis() { delete impl; }
1905
1906LongestPathAnalysis::LongestPathAnalysis(
1907 Operation *moduleOp, mlir::AnalysisManager &am,
1908 const LongestPathAnalysisOptions &option)
1909 : impl(new Impl(moduleOp, am, option)), ctx(moduleOp->getContext()) {
1910 LLVM_DEBUG({
1911 llvm::dbgs() << "LongestPathAnalysis created\n";
1912 if (option.collectDebugInfo)
1913 llvm::dbgs() << " - Collecting debug info\n";
1914 if (option.lazyComputation)
1915 llvm::dbgs() << " - Lazy computation enabled\n";
1916 if (option.keepOnlyMaxDelayPaths)
1917 llvm::dbgs() << " - Keeping only max delay paths\n";
1918 });
1919}
1920
1921bool LongestPathAnalysis::isAnalysisAvailable(StringAttr moduleName) const {
1922 return impl->isAnalysisAvailable(moduleName);
1923}
1924
1925FailureOr<int64_t> LongestPathAnalysis::getAverageMaxDelay(Value value) {
1926 return impl->getAverageMaxDelay(value);
1927}
1928
1929FailureOr<int64_t> LongestPathAnalysis::getMaxDelay(Value value,
1930 int64_t bitPos) {
1931 return impl->getMaxDelay(value, bitPos);
1932}
1933
1934LogicalResult
1936 SmallVectorImpl<DataflowPath> &results,
1937 bool elaboratePaths) const {
1938 if (!isAnalysisValid)
1939 return failure();
1940 if (elaboratePaths)
1941 return impl->collectClosedPaths<true>(moduleName, results);
1942 return impl->collectClosedPaths<false>(moduleName, results);
1943}
1944
1946 StringAttr moduleName, SmallVectorImpl<DataflowPath> &results) const {
1947 if (!isAnalysisValid)
1948 return failure();
1949
1950 return impl->collectInputToInternalPaths(moduleName, results);
1951}
1952
1954 StringAttr moduleName, SmallVectorImpl<DataflowPath> &results) const {
1955 if (!isAnalysisValid)
1956 return failure();
1957
1958 return impl->collectInternalToOutputPaths(moduleName, results);
1959}
1960
1961LogicalResult
1963 SmallVectorImpl<DataflowPath> &results,
1964 bool elaboratePaths) const {
1965 if (failed(getInternalPaths(moduleName, results, elaboratePaths)))
1966 return failure();
1967 if (failed(getOpenPathsFromInputPortsToInternal(moduleName, results)))
1968 return failure();
1969 if (failed(getOpenPathsFromInternalToOutputPorts(moduleName, results)))
1970 return failure();
1971 return success();
1972}
1973
1974ArrayRef<hw::HWModuleOp> LongestPathAnalysis::getTopModules() const {
1975 return impl->getTopModules();
1976}
1977
1978FailureOr<ArrayRef<OpenPath>>
1979LongestPathAnalysis::computeLocalPaths(Value value, size_t bitPos) {
1980 if (!isAnalysisValid)
1981 return failure();
1982
1983 return impl->computeLocalPaths(value, bitPos);
1984}
1985
1987 Value value, size_t bitPos, SmallVectorImpl<DataflowPath> &results) {
1988 if (!isAnalysisValid)
1989 return mlir::emitError(value.getLoc()) << "analysis has been invalidated";
1990
1991 return impl->computeGlobalPaths(value, bitPos, results);
1992}
1993
1994//===----------------------------------------------------------------------===//
1995// IncrementalLongestPathAnalysis
1996//===----------------------------------------------------------------------===//
1997
1999 Operation *op) const {
2000 if (!isAnalysisValid)
2001 return false;
2002
2003 auto parentHWModule =
2004 op->getParentRegion()->getParentOfType<hw::HWModuleOp>();
2005 if (!parentHWModule)
2006 return true;
2007 auto *localVisitor =
2008 impl->ctx.getLocalVisitor(parentHWModule.getModuleNameAttr());
2009 if (!localVisitor)
2010 return true;
2011
2012 // If all results of the operation have no paths, then it is safe to mutate
2013 // the operation.
2014 return llvm::all_of(op->getResults(), [localVisitor](Value value) {
2015 for (int64_t i = 0, e = getBitWidth(value); i < e; ++i) {
2016 auto path = localVisitor->getCachedPaths(value, i);
2017 if (!path.empty())
2018 return false;
2019 }
2020 return true;
2021 });
2022}
2023
2029 Operation *op, ValueRange replacement) {
2031}
2032
2036
2037// ===----------------------------------------------------------------------===//
2038// LongestPathCollection
2039// ===----------------------------------------------------------------------===//
2040
2042 llvm::stable_sort(paths, [](const DataflowPath &a, const DataflowPath &b) {
2043 return a.getDelay() > b.getDelay();
2044 });
2045}
2046
2048 // Deduplicate paths by start/end-point, keeping only the worst-case delay.
2049 if (perEndPoint) {
2050 llvm::DenseSet<DataflowPath::EndPointType> seen;
2051 for (size_t i = 0; i < paths.size(); ++i) {
2052 if (seen.insert(paths[i].getEndPoint()).second)
2053 paths[seen.size() - 1] = std::move(paths[i]);
2054 }
2055
2056 paths.resize(seen.size());
2057 } else {
2058 llvm::DenseSet<Object> seen;
2059 for (size_t i = 0; i < paths.size(); ++i) {
2060 if (seen.insert(paths[i].getStartPoint()).second)
2061 paths[seen.size() - 1] = std::move(paths[i]);
2062 }
2063 paths.resize(seen.size());
2064 }
2065}
2066
2068 paths.append(other.paths.begin(), other.paths.end());
2070}
assert(baseType &&"element must be base type")
static void printObjectImpl(llvm::raw_ostream &os, const Object &object, int64_t delay=-1, llvm::ImmutableList< DebugPoint > history={}, StringRef comment="")
static llvm::ImmutableList< DebugPoint > mapList(llvm::ImmutableListFactory< DebugPoint > *debugPointFactory, llvm::ImmutableList< DebugPoint > list, llvm::function_ref< DebugPoint(DebugPoint)> fn)
static llvm::ImmutableList< DebugPoint > concatList(llvm::ImmutableListFactory< DebugPoint > *debugPointFactory, llvm::ImmutableList< DebugPoint > lhs, llvm::ImmutableList< DebugPoint > rhs)
static void filterPaths(SmallVectorImpl< OpenPath > &results, bool keepOnlyMaxDelay, bool isLocalScope)
static void deduplicatePathsImpl(SmallVectorImpl< T > &results, size_t startIndex, llvm::function_ref< Key(const T &)> keyFn, llvm::function_ref< int64_t(const T &)> delayFn)
static StringAttr getNameImpl(Value value)
static int64_t getMaxDelayInPaths(ArrayRef< T > paths)
This class provides a thread-safe interface to access the analysis results.
circt::igraph::InstanceGraph * instanceGraph
const LocalVisitor * getLocalVisitor(StringAttr name) const
void notifyEnd(StringAttr name)
bool doTraceDebugPoints() const
llvm::sys::SmartMutex< true > mutex
bool doKeepOnlyMaxDelayPaths() const
LongestPathAnalysisOptions option
llvm::MapVector< StringAttr, std::unique_ptr< LocalVisitor > > localVisitors
bool isRunningParallel() const
LocalVisitor * getLocalVisitorMutable(StringAttr name) const
StringAttr getTopModuleName() const
Context(igraph::InstanceGraph *instanceGraph, const LongestPathAnalysisOptions &option)
llvm::SetVector< StringAttr > running
bool isLocalScope() const
bool doLazyComputation() const
void notifyStart(StringAttr name)
hw::HWModuleOp getHWModuleOp() const
ArrayRef< OpenPath > getCachedPaths(Value value, size_t bitPos) const
LogicalResult addEdge(Value to, size_t toBitPos, int64_t delay, SmallVectorImpl< OpenPath > &results)
LogicalResult visitValue(Value value, size_t bitPos, SmallVectorImpl< OpenPath > &results)
LogicalResult addLogicOp(Operation *op, size_t bitPos, SmallVectorImpl< OpenPath > &results)
std::unique_ptr< llvm::ImmutableListFactory< DebugPoint > > debugPointFactory
DenseMap< std::pair< Value, size_t >, std::pair< Value, size_t > > ecMap
LogicalResult markRegEndPoint(Value endPoint, Value start, Value reset={}, Value resetValue={}, Value enable={})
std::pair< Value, size_t > findLeader(Value value, size_t bitpos) const
LogicalResult visitDefault(OpResult result, size_t bitPos, SmallVectorImpl< OpenPath > &results)
FailureOr< ArrayRef< OpenPath > > getOrComputePaths(Value value, size_t bitPos)
const auto & getFromInputPortToEndPoint() const
llvm::ImmutableListFactory< DebugPoint > * getDebugPointFactory() const
LogicalResult visit(seq::FirMemReadOp op, size_t bitPos, SmallVectorImpl< OpenPath > &results)
LogicalResult markStartPoint(Value value, size_t bitPos, SmallVectorImpl< OpenPath > &results)
LogicalResult markEquivalent(Value from, size_t fromBitPos, Value to, size_t toBitPos, SmallVectorImpl< OpenPath > &results)
const auto & getEndPointResults() const
llvm::MapVector< std::pair< BlockArgument, size_t >, ObjectToMaxDistance > fromInputPortToEndPoint
std::atomic_bool done
DenseMap< std::pair< Value, size_t >, std::unique_ptr< SmallVector< OpenPath > > > cachedResults
hw::HWModuleOp Context * ctx
llvm::MapVector< std::tuple< size_t, size_t >, ObjectToMaxDistance > fromOutputPortToStartPoint
LogicalResult visit(seq::CompRegOp op, size_t bitPos, SmallVectorImpl< OpenPath > &results)
void getInternalPaths(SmallVectorImpl< DataflowPath > &results) const
DenseMap< Object, SmallVector< OpenPath > > endPointResults
LogicalResult visit(seq::FirRegOp op, size_t bitPos, SmallVectorImpl< OpenPath > &results)
LogicalResult initializeAndRun()
llvm::EquivalenceClasses< std::pair< Value, size_t > > ec
bool isTopLevel() const
LogicalResult visit(seq::FirMemReadWriteOp op, size_t bitPos, SmallVectorImpl< OpenPath > &results)
LogicalResult visit(mlir::BlockArgument argument, size_t bitPos, SmallVectorImpl< OpenPath > &results)
std::unique_ptr< OperationAnalyzer > operationAnalyzer
LogicalResult visit(hw::ConstantOp op, size_t bitPos, SmallVectorImpl< OpenPath > &results)
std::condition_variable cv
void putUnclosedResult(const Object &object, int64_t delay, llvm::ImmutableList< DebugPoint > history, ObjectToMaxDistance &objectToMaxDistance)
std::unique_ptr< circt::igraph::InstancePathCache > instancePathCache
circt::igraph::InstancePathCache * getInstancePathCache() const
LocalVisitor(hw::HWModuleOp module, Context *ctx)
const auto & getFromOutputPortToStartPoint() const
void waitUntilDone() const
std::unique_ptr< mlir::PassManager > passManager
static constexpr StringRef pipelineStr
mlir::OwningOpRef< mlir::ModuleOp > moduleOp
FailureOr< LocalVisitor * > getOrComputeLocalVisitor(Operation *op)
llvm::DenseMap< std::pair< mlir::OperationName, mlir::FunctionType >, std::unique_ptr< LocalVisitor > > cache
static mlir::FunctionType getFunctionTypeForOp(Operation *op)
LogicalResult analyzeOperation(OpResult value, size_t bitPos, SmallVectorImpl< std::tuple< size_t, size_t, int64_t > > &results)
LogicalResult initializePipeline()
OperationAnalyzer(Location loc)
HW-specific instance graph with a virtual entry node linking to all publicly visible modules.
This is a Node in the InstanceGraph.
This graph tracks modules and where they are instantiated.
InstanceGraphNode * lookupOrNull(StringAttr name)
Lookup an module by name.
InstanceGraphNode * lookup(ModuleOpInterface op)
Look up an InstanceGraphNode for a module.
An instance path composed of a series of instances.
InstanceOpInterface top() const
std::variant< Object, OutputPort > EndPointType
DataflowPath & prependPaths(circt::igraph::InstancePathCache &cache, llvm::ImmutableListFactory< DebugPoint > *debugPointFactory, circt::igraph::InstancePath path)
const OpenPath & getPath() const
hw::HWModuleOp getRoot() const
void print(llvm::raw_ostream &os)
void printEndPoint(llvm::raw_ostream &os)
const EndPointType & getEndPoint() const
void notifyOperationReplaced(Operation *op, ValueRange replacement) override
FailureOr< int64_t > getAverageMaxDelay(Value value)
LogicalResult computeGlobalPaths(Value value, size_t bitPos, SmallVectorImpl< DataflowPath > &results)
FailureOr< int64_t > getMaxDelay(Value value, int64_t bitPos=-1)
LogicalResult getInternalPaths(StringAttr moduleName, SmallVectorImpl< DataflowPath > &results, bool elaboratePaths=false) const
FailureOr< ArrayRef< OpenPath > > computeLocalPaths(Value value, size_t bitPos)
LogicalResult getAllPaths(StringAttr moduleName, SmallVectorImpl< DataflowPath > &results, bool elaboratePaths=false) const
LogicalResult getOpenPathsFromInternalToOutputPorts(StringAttr moduleName, SmallVectorImpl< DataflowPath > &results) const
llvm::ArrayRef< hw::HWModuleOp > getTopModules() const
bool isAnalysisAvailable(StringAttr moduleName) const
LogicalResult getOpenPathsFromInputPortsToInternal(StringAttr moduleName, SmallVectorImpl< DataflowPath > &results) const
void merge(const LongestPathCollection &other)
llvm::SmallVector< DataflowPath, 64 > paths
void dropNonCriticalPaths(bool perEndPoint=true)
Impl(Context &ctxt, int port)
Start a server on the given port. -1 means to let the OS pick a port.
create(data_type, value)
Definition hw.py:441
str root(self)
Definition synth.py:153
Object object
Definition synth.py:112
Optional[Value] value(self)
Definition synth.py:89
int64_t getBitWidth(mlir::Type type)
Return the hardware bit width of a type.
Definition HWTypes.cpp:110
llvm::json::Value toJSON(const circt::synth::DataflowPath &path)
The InstanceGraph op interface, see InstanceGraphInterface.td for more details.
Definition synth.py:1
Internal implementation for LongestPathAnalysis.
LogicalResult collectInternalToOutputPaths(StringAttr moduleName, SmallVectorImpl< DataflowPath > &results) const
Collect open paths from internal sequential sources to module output ports.
LogicalResult computeGlobalPaths(Value value, size_t bitPos, SmallVectorImpl< DataflowPath > &results)
Compute hierarchical timing paths to (value, bitPos) and append to results.
llvm::ArrayRef< hw::HWModuleOp > getTopModules() const
Top modules inferred or specified for this analysis run.
FailureOr< ArrayRef< OpenPath > > computeLocalPaths(Value value, size_t bitPos)
Compute local open paths to (value, bitPos).
FailureOr< int64_t > getMaxDelay(Value value, int64_t bitPos)
Return the max delay for a value.
LogicalResult collectClosedPaths(StringAttr moduleName, SmallVectorImpl< DataflowPath > &results) const
Collect register-to-register (closed) paths within the module.
bool isAnalysisAvailable(StringAttr moduleName) const
Return true if we have a LocalVisitor for the given HW module.
LogicalResult initializeAndRun(mlir::ModuleOp module)
Initialize and run analysis for a full MLIR module (hierarchical).
FailureOr< int64_t > getAverageMaxDelay(Value value)
Return average of per-bit max delays for a value.
LogicalResult collectInputToInternalPaths(StringAttr moduleName, SmallVectorImpl< DataflowPath > &results) const
Collect open paths from module input ports to internal sequential sinks.
SmallVector< hw::HWModuleOp > topModules
Top-level HW modules that seed hierarchical analysis.
mlir::Type type
Definition HWTypes.h:31
mlir::StringAttr name
Definition HWTypes.h:30
This holds the name, type, direction of a module's ports.
A data structure that caches and provides paths to module instances in the IR.
ArrayRef< InstancePath > getRelativePaths(ModuleOpInterface op, InstanceGraphNode *node)
InstancePath concatPath(InstancePath path1, InstancePath path2)
Concatenate two paths.
void print(llvm::raw_ostream &os) const
Configuration options for the longest path analysis.
bool collectDebugInfo
Enable collection of debug points along timing paths.
bool lazyComputation
Enable lazy computation mode for on-demand analysis.
bool keepOnlyMaxDelayPaths
Keep only the maximum delay path per end point.
Object & prependPaths(circt::igraph::InstancePathCache &cache, circt::igraph::InstancePath path)
void print(llvm::raw_ostream &os) const
OpenPath & prependPaths(circt::igraph::InstancePathCache &cache, llvm::ImmutableListFactory< DebugPoint > *debugPointFactory, circt::igraph::InstancePath path)