CIRCT 22.0.0git
Loading...
Searching...
No Matches
FormatStrings.cpp
Go to the documentation of this file.
1//===- FormatStrings.cpp - Verilog format string conversion ---------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
10#include "slang/ast/SFormat.h"
11
12using namespace mlir;
13using namespace circt;
14using namespace ImportVerilog;
15using moore::IntAlign;
16using moore::IntFormat;
17using moore::IntPadding;
18using moore::RealFormat;
19using slang::ast::SFormat::FormatOptions;
20
21namespace {
22struct FormatStringParser {
23 Context &context;
24 OpBuilder &builder;
25 /// The remaining arguments to be parsed.
26 ArrayRef<const slang::ast::Expression *> arguments;
27 /// The current location to use for ops and diagnostics.
28 Location loc;
29 /// The default format for integer arguments not covered by a format string
30 /// literal.
31 IntFormat defaultFormat;
32 /// The interpolated string fragments that will be concatenated using a
33 /// `moore.fmt.concat` op.
34 SmallVector<Value> fragments;
35
36 FormatStringParser(Context &context,
37 ArrayRef<const slang::ast::Expression *> arguments,
38 Location loc, IntFormat defaultFormat)
39 : context(context), builder(context.builder), arguments(arguments),
40 loc(loc), defaultFormat(defaultFormat) {}
41
42 /// Entry point to the format string parser.
43 FailureOr<Value> parse(bool appendNewline) {
44 while (!arguments.empty()) {
45 const auto &arg = *arguments[0];
46 arguments = arguments.drop_front();
47 if (arg.kind == slang::ast::ExpressionKind::EmptyArgument)
48 continue;
49 loc = context.convertLocation(arg.sourceRange);
50 if (auto *lit = arg.as_if<slang::ast::StringLiteral>()) {
51 if (failed(parseFormat(lit->getValue())))
52 return failure();
53 } else {
54 if (failed(emitDefault(arg)))
55 return failure();
56 }
57 }
58
59 // Append the optional newline.
60 if (appendNewline)
61 emitLiteral("\n");
62
63 // Concatenate all string fragments into one formatted string, or return an
64 // empty literal if no fragments were generated.
65 if (fragments.empty())
66 return Value{};
67 if (fragments.size() == 1)
68 return fragments[0];
69 return moore::FormatConcatOp::create(builder, loc, fragments).getResult();
70 }
71
72 /// Parse a format string literal and consume and format the arguments
73 /// corresponding to the format specifiers it contains.
74 LogicalResult parseFormat(StringRef format) {
75 bool anyFailure = false;
76 auto onText = [&](auto text) {
77 if (anyFailure)
78 return;
79 emitLiteral(text);
80 };
81 auto onArg = [&](auto specifier, auto offset, auto len,
82 const auto &options) {
83 if (anyFailure)
84 return;
85 if (failed(emitArgument(specifier, format.substr(offset, len), options)))
86 anyFailure = true;
87 };
88 auto onError = [&](auto, auto, auto, auto) {
89 assert(false && "Slang should have already reported all errors");
90 };
91 slang::ast::SFormat::parse(format, onText, onArg, onError);
92 return failure(anyFailure);
93 }
94
95 /// Emit a string literal that requires no additional formatting.
96 void emitLiteral(StringRef literal) {
97 fragments.push_back(moore::FormatLiteralOp::create(builder, loc, literal));
98 }
99
100 /// Consume the next argument from the list and emit it according to the given
101 /// format specifier.
102 LogicalResult emitArgument(char specifier, StringRef fullSpecifier,
103 const FormatOptions &options) {
104 auto specifierLower = std::tolower(specifier);
105
106 // Special handling for format specifiers that consume no argument.
107 if (specifierLower == 'm' || specifierLower == 'l')
108 return mlir::emitError(loc)
109 << "unsupported format specifier `" << fullSpecifier << "`";
110
111 // Consume the next argument, which will provide the value to be
112 // formatted.
113 assert(!arguments.empty() && "Slang guarantees correct arg count");
114 const auto &arg = *arguments[0];
115 arguments = arguments.drop_front();
116
117 // Handle the different formatting options.
118 // See IEEE 1800-2017 § 21.2.1.2 "Format specifications".
119 switch (specifierLower) {
120 case 'b':
121 return emitInteger(arg, options, IntFormat::Binary);
122 case 'o':
123 return emitInteger(arg, options, IntFormat::Octal);
124 case 'd':
125 return emitInteger(arg, options, IntFormat::Decimal);
126 case 'h':
127 case 'x':
128 return emitInteger(arg, options,
129 std::isupper(specifier) ? IntFormat::HexUpper
130 : IntFormat::HexLower);
131
132 case 'e':
133 case 'g':
134 case 'f':
135 return emitReal(arg, options, RealFormat::Float);
136
137 case 't':
138 return emitTime(arg, options);
139
140 case 's':
141 return emitString(arg, options);
142
143 default:
144 return mlir::emitError(loc)
145 << "unsupported format specifier `" << fullSpecifier << "`";
146 }
147 }
148
149 /// Emit an integer value with the given format.
150 LogicalResult emitInteger(const slang::ast::Expression &arg,
151 const FormatOptions &options, IntFormat format) {
152
153 Type intTy = {};
154 Value val;
155 auto rVal = context.convertRvalueExpression(arg);
156
157 // An IEEE 754 float number is represented using a sign bit s, n mantissa,
158 // and m exponent bits, representing (-1)**s * 1.fraction * 2**(E-bias).
159 // This means that the largest finite value is (2-2**(-n) * 2**(2**m-1)),
160 // just slightly less than ((2**(2**(m)))-1).
161 // Since we need signed value representation, we need integers that can
162 // represent values between [-(2**(2**(m))) ... (2**(2**(m)))-1], which
163 // requires an m+1 bit signed integer.
164 if (auto realTy = dyn_cast<moore::RealType>(rVal.getType())) {
165 if (realTy.getWidth() == moore::RealWidth::f32) {
166 // A 32 Bit IEEE 754 float number needs at most 129 integer bits
167 // (signed).
168 intTy = moore::IntType::getInt(context.getContext(), 129);
169 } else if (realTy.getWidth() == moore::RealWidth::f64) {
170 // A 64 Bit IEEE 754 float number needs at most 1025 integer bits
171 // (signed).
172 intTy = moore::IntType::getInt(context.getContext(), 1025);
173 } else
174 return failure();
175
176 val = moore::RealToIntOp::create(builder, loc, intTy, rVal);
177 } else {
178 val = rVal;
179 }
180
181 auto value = context.convertToSimpleBitVector(val);
182 if (!value)
183 return failure();
184
185 // Determine the width to which the formatted integer should be padded.
186 unsigned width;
187 if (options.width) {
188 width = *options.width;
189 } else {
190 width = cast<moore::IntType>(value.getType()).getWidth();
191 if (format == IntFormat::Octal)
192 // 3 bits per octal digit
193 width = (width + 2) / 3;
194 else if (format == IntFormat::HexLower || format == IntFormat::HexUpper)
195 // 4 bits per hex digit
196 width = (width + 3) / 4;
197 else if (format == IntFormat::Decimal)
198 // ca. 3.322 bits per decimal digit (ln(10)/ln(2))
199 width = std::ceil(width * std::log(2) / std::log(10));
200 }
201
202 // Determine the alignment and padding.
203 auto alignment = options.leftJustify ? IntAlign::Left : IntAlign::Right;
204 auto padding =
205 format == IntFormat::Decimal ? IntPadding::Space : IntPadding::Zero;
206
207 fragments.push_back(moore::FormatIntOp::create(builder, loc, value, format,
208 width, alignment, padding));
209 return success();
210 }
211
212 LogicalResult emitReal(const slang::ast::Expression &arg,
213 const FormatOptions &options, RealFormat format) {
214
215 // Ensures that the given value is moore.real
216 // i.e. $display("%f", 4) -> 4.000000, but 4 is not necessarily of real type
217 auto value = context.convertRvalueExpression(
218 arg, moore::RealType::get(context.getContext(), moore::RealWidth::f64));
219
220 if (!value)
221 return failure();
222
223 // TODO add support for specifics such as width etc
224
225 fragments.push_back(
226 moore::FormatRealOp::create(builder, loc, value, format));
227
228 return success();
229 }
230
231 // Format an integer with the %t specifier according to IEEE 1800-2023
232 // § 20.4.3 "$timeformat"
233 LogicalResult emitTime(const slang::ast::Expression &arg,
234 const FormatOptions &options) {
235
236 // Only handle `TimeType` values.
237 auto value = context.convertRvalueExpression(
238 arg, moore::TimeType::get(context.getContext()));
239 if (!value)
240 return failure();
241
242 mlir::IntegerAttr width = nullptr;
243 if (options.width) {
244 mlir::Type i32Ty =
245 mlir::IntegerType::get(context.getContext(), /*width=*/32);
246 width = mlir::IntegerAttr::get(i32Ty, options.width.value());
247 }
248
249 // Delegate actual formatting to `moore.fmt.time`, annotate width if
250 // provided
251 if (width) {
252 fragments.push_back(
253 moore::FormatTimeOp::create(builder, loc, value, width));
254 } else {
255 fragments.push_back(moore::FormatTimeOp::create(builder, loc, value));
256 }
257
258 return success();
259 }
260
261 LogicalResult emitString(const slang::ast::Expression &arg,
262 const FormatOptions &options) {
263 if (options.width)
264 return mlir::emitError(loc)
265 << "string format specifier with width not supported";
266
267 // Simplified handling for literals.
268 if (auto *lit = arg.as_if<slang::ast::StringLiteral>()) {
269 emitLiteral(lit->getValue());
270 return success();
271 }
272
273 // Handle expressions
274 if (auto value = context.convertRvalueExpression(
275 arg, builder.getType<moore::FormatStringType>())) {
276 fragments.push_back(value);
277 return success();
278 }
279
280 return mlir::emitError(context.convertLocation(arg.sourceRange))
281 << "expression cannot be formatted as string";
282 }
283
284 /// Emit an expression argument with the appropriate default formatting.
285 LogicalResult emitDefault(const slang::ast::Expression &expr) {
286 FormatOptions options;
287 return emitInteger(expr, options, defaultFormat);
288 }
289};
290} // namespace
291
292FailureOr<Value> Context::convertFormatString(
293 std::span<const slang::ast::Expression *const> arguments, Location loc,
294 IntFormat defaultFormat, bool appendNewline) {
295 FormatStringParser parser(*this, ArrayRef(arguments.data(), arguments.size()),
296 loc, defaultFormat);
297 return parser.parse(appendNewline);
298}
assert(baseType &&"element must be base type")
The InstanceGraph op interface, see InstanceGraphInterface.td for more details.
A helper class to facilitate the conversion from a Slang AST to MLIR operations.
Value convertRvalueExpression(const slang::ast::Expression &expr, Type requiredType={})
Value convertToSimpleBitVector(Value value)
Helper function to convert a value to its simple bit vector representation, if it has one.
MLIRContext * getContext()
Return the MLIR context.
Location convertLocation(slang::SourceLocation loc)
Convert a slang SourceLocation into an MLIR Location.