CIRCT 22.0.0git
Loading...
Searching...
No Matches
FormatStrings.cpp
Go to the documentation of this file.
1//===- FormatStrings.cpp - Verilog format string conversion ---------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
10#include "slang/ast/SFormat.h"
11
12using namespace mlir;
13using namespace circt;
14using namespace ImportVerilog;
15using moore::IntAlign;
16using moore::IntFormat;
17using moore::IntPadding;
18using moore::RealFormat;
19using slang::ast::SFormat::FormatOptions;
20
21namespace {
22struct FormatStringParser {
23 Context &context;
24 OpBuilder &builder;
25 /// The remaining arguments to be parsed.
26 ArrayRef<const slang::ast::Expression *> arguments;
27 /// The current location to use for ops and diagnostics.
28 Location loc;
29 /// The default format for integer arguments not covered by a format string
30 /// literal.
31 IntFormat defaultFormat;
32 /// The interpolated string fragments that will be concatenated using a
33 /// `moore.fmt.concat` op.
34 SmallVector<Value> fragments;
35
36 FormatStringParser(Context &context,
37 ArrayRef<const slang::ast::Expression *> arguments,
38 Location loc, IntFormat defaultFormat)
39 : context(context), builder(context.builder), arguments(arguments),
40 loc(loc), defaultFormat(defaultFormat) {}
41
42 /// Entry point to the format string parser.
43 FailureOr<Value> parse(bool appendNewline) {
44 while (!arguments.empty()) {
45 const auto &arg = *arguments[0];
46 arguments = arguments.drop_front();
47 if (arg.kind == slang::ast::ExpressionKind::EmptyArgument)
48 continue;
49 loc = context.convertLocation(arg.sourceRange);
50 if (auto *lit = arg.as_if<slang::ast::StringLiteral>()) {
51 if (failed(parseFormat(lit->getValue())))
52 return failure();
53 } else {
54 if (failed(emitDefault(arg)))
55 return failure();
56 }
57 }
58
59 // Append the optional newline.
60 if (appendNewline)
61 emitLiteral("\n");
62
63 // Concatenate all string fragments into one formatted string, or return an
64 // empty literal if no fragments were generated.
65 if (fragments.empty())
66 return Value{};
67 if (fragments.size() == 1)
68 return fragments[0];
69 return moore::FormatConcatOp::create(builder, loc, fragments).getResult();
70 }
71
72 /// Parse a format string literal and consume and format the arguments
73 /// corresponding to the format specifiers it contains.
74 LogicalResult parseFormat(StringRef format) {
75 bool anyFailure = false;
76 auto onText = [&](auto text) {
77 if (anyFailure)
78 return;
79 emitLiteral(text);
80 };
81 auto onArg = [&](auto specifier, auto offset, auto len,
82 const auto &options) {
83 if (anyFailure)
84 return;
85 if (failed(emitArgument(specifier, format.substr(offset, len), options)))
86 anyFailure = true;
87 };
88 auto onError = [&](auto, auto, auto, auto) {
89 assert(false && "Slang should have already reported all errors");
90 };
91 slang::ast::SFormat::parse(format, onText, onArg, onError);
92 return failure(anyFailure);
93 }
94
95 /// Emit a string literal that requires no additional formatting.
96 void emitLiteral(StringRef literal) {
97 fragments.push_back(moore::FormatLiteralOp::create(builder, loc, literal));
98 }
99
100 /// Consume the next argument from the list and emit it according to the given
101 /// format specifier.
102 LogicalResult emitArgument(char specifier, StringRef fullSpecifier,
103 const FormatOptions &options) {
104 auto specifierLower = std::tolower(specifier);
105
106 // Special handling for format specifiers that consume no argument.
107 if (specifierLower == 'm' || specifierLower == 'l')
108 return mlir::emitError(loc)
109 << "unsupported format specifier `" << fullSpecifier << "`";
110
111 // Consume the next argument, which will provide the value to be
112 // formatted.
113 assert(!arguments.empty() && "Slang guarantees correct arg count");
114 const auto &arg = *arguments[0];
115 arguments = arguments.drop_front();
116
117 // Handle the different formatting options.
118 // See IEEE 1800-2017 § 21.2.1.2 "Format specifications".
119 switch (specifierLower) {
120 case 'b':
121 return emitInteger(arg, options, IntFormat::Binary);
122 case 'o':
123 return emitInteger(arg, options, IntFormat::Octal);
124 case 'd':
125 return emitInteger(arg, options, IntFormat::Decimal);
126 case 'h':
127 case 'x':
128 return emitInteger(arg, options,
129 std::isupper(specifier) ? IntFormat::HexUpper
130 : IntFormat::HexLower);
131
132 case 'e':
133 case 'g':
134 case 'f':
135 return emitReal(arg, options, RealFormat::Float);
136
137 case 't':
138 return emitTime(arg, options);
139
140 case 's':
141 return emitString(arg, options);
142
143 default:
144 return mlir::emitError(loc)
145 << "unsupported format specifier `" << fullSpecifier << "`";
146 }
147 }
148
149 /// Emit an integer value with the given format.
150 LogicalResult emitInteger(const slang::ast::Expression &arg,
151 const FormatOptions &options, IntFormat format) {
152
153 Type intTy = {};
154 Value val;
155 auto rVal = context.convertRvalueExpression(arg);
156 if (!rVal)
157 return failure();
158
159 // An IEEE 754 float number is represented using a sign bit s, n mantissa,
160 // and m exponent bits, representing (-1)**s * 1.fraction * 2**(E-bias).
161 // This means that the largest finite value is (2-2**(-n) * 2**(2**m-1)),
162 // just slightly less than ((2**(2**(m)))-1).
163 // Since we need signed value representation, we need integers that can
164 // represent values between [-(2**(2**(m))) ... (2**(2**(m)))-1], which
165 // requires an m+1 bit signed integer.
166 if (auto realTy = dyn_cast<moore::RealType>(rVal.getType())) {
167 if (realTy.getWidth() == moore::RealWidth::f32) {
168 // A 32 Bit IEEE 754 float number needs at most 129 integer bits
169 // (signed).
170 intTy = moore::IntType::getInt(context.getContext(), 129);
171 } else if (realTy.getWidth() == moore::RealWidth::f64) {
172 // A 64 Bit IEEE 754 float number needs at most 1025 integer bits
173 // (signed).
174 intTy = moore::IntType::getInt(context.getContext(), 1025);
175 } else
176 return failure();
177
178 val = moore::RealToIntOp::create(builder, loc, intTy, rVal);
179 } else {
180 val = rVal;
181 }
182
183 auto value = context.convertToSimpleBitVector(val);
184 if (!value)
185 return failure();
186
187 // Determine the width to which the formatted integer should be padded.
188 unsigned width;
189 if (options.width) {
190 width = *options.width;
191 } else {
192 width = cast<moore::IntType>(value.getType()).getWidth();
193 if (format == IntFormat::Octal)
194 // 3 bits per octal digit
195 width = (width + 2) / 3;
196 else if (format == IntFormat::HexLower || format == IntFormat::HexUpper)
197 // 4 bits per hex digit
198 width = (width + 3) / 4;
199 else if (format == IntFormat::Decimal)
200 // ca. 3.322 bits per decimal digit (ln(10)/ln(2))
201 width = std::ceil(width * std::log(2) / std::log(10));
202 }
203
204 // Determine the alignment and padding.
205 auto alignment = options.leftJustify ? IntAlign::Left : IntAlign::Right;
206 auto padding =
207 format == IntFormat::Decimal ? IntPadding::Space : IntPadding::Zero;
208
209 fragments.push_back(moore::FormatIntOp::create(builder, loc, value, format,
210 width, alignment, padding));
211 return success();
212 }
213
214 LogicalResult emitReal(const slang::ast::Expression &arg,
215 const FormatOptions &options, RealFormat format) {
216
217 // Ensures that the given value is moore.real
218 // i.e. $display("%f", 4) -> 4.000000, but 4 is not necessarily of real type
219 auto value = context.convertRvalueExpression(
220 arg, moore::RealType::get(context.getContext(), moore::RealWidth::f64));
221
222 if (!value)
223 return failure();
224
225 // TODO add support for specifics such as width etc
226
227 fragments.push_back(
228 moore::FormatRealOp::create(builder, loc, value, format));
229
230 return success();
231 }
232
233 // Format an integer with the %t specifier according to IEEE 1800-2023
234 // § 20.4.3 "$timeformat"
235 LogicalResult emitTime(const slang::ast::Expression &arg,
236 const FormatOptions &options) {
237
238 // Only handle `TimeType` values.
239 auto value = context.convertRvalueExpression(
240 arg, moore::TimeType::get(context.getContext()));
241 if (!value)
242 return failure();
243
244 mlir::IntegerAttr width = nullptr;
245 if (options.width) {
246 mlir::Type i32Ty =
247 mlir::IntegerType::get(context.getContext(), /*width=*/32);
248 width = mlir::IntegerAttr::get(i32Ty, options.width.value());
249 }
250
251 // Delegate actual formatting to `moore.fmt.time`, annotate width if
252 // provided
253 if (width) {
254 fragments.push_back(
255 moore::FormatTimeOp::create(builder, loc, value, width));
256 } else {
257 fragments.push_back(moore::FormatTimeOp::create(builder, loc, value));
258 }
259
260 return success();
261 }
262
263 LogicalResult emitString(const slang::ast::Expression &arg,
264 const FormatOptions &options) {
265 if (options.width)
266 return mlir::emitError(loc)
267 << "string format specifier with width not supported";
268
269 // Simplified handling for literals.
270 if (auto *lit = arg.as_if<slang::ast::StringLiteral>()) {
271 emitLiteral(lit->getValue());
272 return success();
273 }
274
275 // Handle expressions
276 if (auto value = context.convertRvalueExpression(
277 arg, builder.getType<moore::FormatStringType>())) {
278 fragments.push_back(value);
279 return success();
280 }
281
282 return mlir::emitError(context.convertLocation(arg.sourceRange))
283 << "expression cannot be formatted as string";
284 }
285
286 /// Emit an expression argument with the appropriate default formatting.
287 LogicalResult emitDefault(const slang::ast::Expression &expr) {
288 FormatOptions options;
289 return emitInteger(expr, options, defaultFormat);
290 }
291};
292} // namespace
293
294FailureOr<Value> Context::convertFormatString(
295 std::span<const slang::ast::Expression *const> arguments, Location loc,
296 IntFormat defaultFormat, bool appendNewline) {
297 FormatStringParser parser(*this, ArrayRef(arguments.data(), arguments.size()),
298 loc, defaultFormat);
299 return parser.parse(appendNewline);
300}
assert(baseType &&"element must be base type")
The InstanceGraph op interface, see InstanceGraphInterface.td for more details.
A helper class to facilitate the conversion from a Slang AST to MLIR operations.
Value convertRvalueExpression(const slang::ast::Expression &expr, Type requiredType={})
Value convertToSimpleBitVector(Value value)
Helper function to convert a value to its simple bit vector representation, if it has one.
MLIRContext * getContext()
Return the MLIR context.
Location convertLocation(slang::SourceLocation loc)
Convert a slang SourceLocation into an MLIR Location.