# # # Nim's Runtime Library # (c) Copyright 2017 Nim contributors # # See the file "copying.txt", included in this # distribution, for details about the copyright. # ##[ String `interpolation`:idx: / `format`:idx: inspired by Python's ``f``-strings. ``fmt`` vs. ``&`` ================= You can use either ``fmt`` or the unary ``&`` operator for formatting. The difference between them is subtle but important. The ``fmt"{expr}"`` syntax is more aesthetically pleasing, but it hides a small gotcha. The string is a `generalized raw string literal `_. This has some surprising effects: .. code-block:: nim import strformat let msg = "hello" doAssert fmt"{msg}\n" == "hello\\n" Because the literal is a raw string literal, the ``\n`` is not interpreted as an escape sequence. There are multiple ways to get around this, including the use of the ``&`` operator: .. code-block:: nim import strformat let msg = "hello" doAssert &"{msg}\n" == "hello\n" doAssert fmt"{msg}{'\n'}" == "hello\n" doAssert fmt("{msg}\n") == "hello\n" doAssert "{msg}\n".fmt == "hello\n" The choice of style is up to you. Formatting strings ================== .. code-block:: nim import strformat doAssert &"""{"abc":>4}""" == " abc" doAssert &"""{"abc":<4}""" == "abc " Formatting floats ================= .. code-block:: nim import strformat doAssert fmt"{-12345:08}" == "-0012345" doAssert fmt"{-1:3}" == " -1" doAssert fmt"{-1:03}" == "-01" doAssert fmt"{16:#X}" == "0x10" doAssert fmt"{123.456}" == "123.456" doAssert fmt"{123.456:>9.3f}" == " 123.456" doAssert fmt"{123.456:9.3f}" == " 123.456" doAssert fmt"{123.456:9.4f}" == " 123.4560" doAssert fmt"{123.456:>9.0f}" == " 123." doAssert fmt"{123.456:<9.4f}" == "123.4560 " doAssert fmt"{123.456:e}" == "1.234560e+02" doAssert fmt"{123.456:>13e}" == " 1.234560e+02" doAssert fmt"{123.456:13e}" == " 1.234560e+02" Implementation details ====================== An expression like ``&"{key} is {value:arg} {{z}}"`` is transformed into: .. code-block:: nim var temp = newStringOfCap(educatedCapGuess) temp.formatValue key, "" temp.add " is " temp.formatValue value, arg temp.add " {z}" temp Parts of the string that are enclosed in the curly braces are interpreted as Nim code, to escape an ``{`` or ``}`` double it. ``&`` delegates most of the work to an open overloaded set of ``formatValue`` procs. The required signature for a type ``T`` that supports formatting is usually ``proc formatValue(result: var string; x: T; specifier: string)``. The subexpression after the colon (``arg`` in ``&"{key} is {value:arg} {{z}}"``) is optional. It will be passed as the last argument to ``formatValue``. When the colon with the subexpression it is left out, an empty string will be taken instead. For strings and numeric types the optional argument is a so-called "standard format specifier". Standard format specifier for strings, integers and floats ========================================================== The general form of a standard format specifier is:: [[fill]align][sign][#][0][minimumwidth][.precision][type] The square brackets ``[]`` indicate an optional element. The optional align flag can be one of the following: '<' Forces the field to be left-aligned within the available space. (This is the default for strings.) '>' Forces the field to be right-aligned within the available space. (This is the default for numbers.) '^' Forces the field to be centered within the available space. Note that unless a minimum field width is defined, the field width will always be the same size as the data to fill it, so that the alignment option has no meaning in this case. The optional 'fill' character defines the character to be used to pad the field to the minimum width. The fill character, if present, must be followed by an alignment flag. The 'sign' option is only valid for numeric types, and can be one of the following: =================
{.used.} # ideally, would not be needed

var fun0 {.exportc.} = 10
proc fun1() {.exportc.} = discard
proc fun2() {.exportc: "$1".} = discard
proc fun3() {.exportc: "fun3Bis".} = discard

when defined cpp:
  proc funx1() {.exportcpp.} = discard
pec: StandardFormatSpecifier): string = ## Converts ``n`` to string. If ``n`` is `SomeFloat`, it casts to `int64`. ## Conversion is done using ``radix``. If result's length is lesser than ## ``minimumWidth``, it aligns result to the right or left (depending on ``a``) ## with ``fill`` char. when n is SomeUnsignedInt: var v = n.uint64 let negative = false else: var v = n.int64 let negative = v.int64 < 0 if negative: # FIXME: overflow error for low(int64) v = v * -1 var xx = "" if spec.alternateForm: case spec.typ of 'X': xx = "0x" of 'x': xx = "0x" of 'b': xx = "0b" of 'o': xx = "0o" else: discard if v == 0: result = "0" else: result = "" while v > type(v)(0): let d = v mod type(v)(radix) v = v div type(v)(radix) result.add(mkDigit(d.int, spec.typ)) for idx in 0..<(result.len div 2): swap result[idx], result[result.len - idx - 1] if spec.padWithZero: let sign = negative or spec.sign != '-' let toFill = spec.minimumWidth - result.len - xx.len - ord(sign) if toFill > 0: result = repeat('0', toFill) & result if negative: result = "-" & xx & result elif spec.sign != '-': result = spec.sign & xx & result else: result = xx & result if spec.align == '<': for i in result.len.. 0: result = repeat(spec.fill, toFill) & result proc parseStandardFormatSpecifier*(s: string; start = 0; ignoreUnknownSuffix = false): StandardFormatSpecifier = ## An exported helper proc that parses the "standard format specifiers", ## as specified by the grammar:: ## ## [[fill]align][sign][#][0][minimumwidth][.precision][type] ## ## This is only of interest if you want to write a custom ``format`` proc that ## should support the standard format specifiers. If ``ignoreUnknownSuffix`` is true, ## an unknown suffix after the ``type`` field is not an error. const alignChars = {'<', '>', '^'} result.fill = ' ' result.align = '\0' result.sign = '-' var i = start if i + 1 < s.len and s[i+1] in alignChars: result.fill = s[i] result.align = s[i+1] inc i, 2 elif i < s.len and s[i] in alignChars: result.align = s[i] inc i if i < s.len and s[i] in {'-', '+', ' '}: result.sign = s[i] inc i if i < s.len and s[i] == '#': result.alternateForm = true inc i if i+1 < s.len and s[i] == '0' and s[i+1] in {'0'..'9'}: result.padWithZero = true inc i let parsedLength = parseSaturatedNatural(s, result.minimumWidth, i) inc i, parsedLength if i < s.len and s[i] == '.': inc i let parsedLengthB = parseSaturatedNatural(s, result.precision, i) inc i, parsedLengthB else: result.precision = -1 if i < s.len and s[i] in {'A'..'Z', 'a'..'z'}: result.typ = s[i] inc i result.endPosition = i if i != s.len and not ignoreUnknownSuffix: raise newException(ValueError, "invalid format string, cannot parse: " & s[i..^1]) proc formatValue*[T: SomeInteger](result: var string; value: T; specifier: string) = ## Standard format implementation for ``SomeInteger``. It makes little ## sense to call this directly, but it is required to exist ## by the ``&`` macro. if specifier.len == 0: result.add $value return let spec = parseStandardFormatSpecifier(specifier) var radix = 10 case spec.typ of 'x', 'X': radix = 16 of 'd', '\0': discard of 'b': radix = 2 of 'o': radix = 8 else: raise newException(ValueError, "invalid type in format string for number, expected one " & " of 'x', 'X', 'b', 'd', 'o' but got: " & spec.typ) result.add formatInt(value, radix, spec) proc formatValue*(result: var string; value: SomeFloat; specifier: string) = ## Standard format implementation for ``SomeFloat``. It makes little ## sense to call this directly, but it is required to exist ## by the ``&`` macro. if specifier.len == 0: result.add $value return let spec = parseStandardFormatSpecifier(specifier) var fmode = ffDefault case spec.typ of 'e', 'E': fmode = ffScientific of 'f', 'F': fmode = ffDecimal of 'g', 'G': fmode = ffDefault of '\0': discard else: raise newException(ValueError, "invalid type in format string for number, expected one " & " of 'e', 'E', 'f', 'F', 'g', 'G' but got: " & spec.typ) var f = formatBiggestFloat(value, fmode, spec.precision) var sign = false if value >= 0.0: if spec.sign != '-': sign = true if value == 0.0: if 1.0 / value == Inf: # only insert the sign if value != negZero f.insert($spec.sign, 0) else: f.insert($spec.sign, 0) else: sign = true if spec.padWithZero: var signStr = "" if sign: signStr = $f[0] f = f[1..^1] let toFill = spec.minimumWidth - f.len - ord(sign) if toFill > 0: f = repeat('0', toFill) & f if sign: f = signStr & f # the default for numbers is right-alignment: let align = if spec.align == '\0': '>' else: spec.align let res = alignString(f, spec.minimumWidth, align, spec.fill) if spec.typ in {'A'..'Z'}: result.add toUpperAscii(res) else: result.add res proc formatValue*(result: var string; value: string; specifier: string) = ## Standard format implementation for ``string``. It makes little ## sense to call this directly, but it is required to exist ## by the ``&`` macro. let spec = parseStandardFormatSpecifier(specifier) var value = value case spec.typ of 's', '\0': discard else: raise newException(ValueError, "invalid type in format string for string, expected 's', but got " & spec.typ) if spec.precision != -1: if spec.precision < runeLen(value): setLen(value, runeOffset(value, spec.precision)) result.add alignString(value, spec.minimumWidth, spec.align, spec.fill) proc formatValue[T: not SomeInteger](result: var string; value: T; specifier: string) = mixin `$` formatValue(result, $value, specifier) template formatValue(result: var string; value: char; specifier: string) = result.add value template formatValue(result: var string; value: cstring; specifier: string) = result.add value proc strformatImpl(pattern: NimNode; openChar, closeChar: char): NimNode = if pattern.kind notin {nnkStrLit..nnkTripleStrLit}: error "string formatting (fmt(), &) only works with string literals", pattern if openChar == ':' or closeChar == ':': error "openChar and closeChar must not be ':'" let f = pattern.strVal var i = 0 let res = genSym(nskVar, "fmtRes") result = newNimNode(nnkStmtListExpr, lineInfoFrom = pattern) # XXX: https://github.com/nim-lang/Nim/issues/8405 # When compiling with -d:useNimRtl, certain procs such as `count` from the strutils # module are not accessible at compile-time: let expectedGrowth = when defined(useNimRtl): 0 else: count(f, '{') * 10 result.add newVarStmt(res, newCall(bindSym"newStringOfCap", newLit(f.len + expectedGrowth))) var strlit = "" while i < f.len: if f[i] == openChar: inc i if f[i] == openChar: inc i strlit.add openChar else: if strlit.len > 0: result.add newCall(bindSym"add", res, newLit(strlit)) strlit = "" var subexpr = "" while i < f.len and f[i] != closeChar and f[i] != ':': subexpr.add f[i] inc i var x: NimNode try: x = parseExpr(subexpr) except ValueError: when declared(getCurrentExceptionMsg): let msg = getCurrentExceptionMsg() error("could not parse `" & subexpr & "`.\n" & msg, pattern) else: error("could not parse `" & subexpr & "`.\n", pattern) let formatSym = bindSym("formatValue", brOpen) var options = "" if f[i] == ':': inc i while i < f.len and f[i] != closeChar: options.add f[i] inc i if f[i] == closeChar: inc i else: doAssert false, "invalid format string: missing '}'" result.add newCall(formatSym, res, x, newLit(options)) elif f[i] == closeChar: if f[i+1] == closeChar: strlit.add closeChar inc i, 2 else: doAssert false, "invalid format string: '}' instead of '}}'" inc i else: strlit.add f[i] inc i if strlit.len > 0: result.add newCall(bindSym"add", res, newLit(strlit)) result.add res when defined(debugFmtDsl): echo repr result macro `&`*(pattern: string): untyped = strformatImpl(pattern, '{', '}') ## For a specification of the ``&`` macro, see the module level documentation. macro fmt*(pattern: string): untyped = strformatImpl(pattern, '{', '}') ## An alias for ``&``. macro fmt*(pattern: string; openChar, closeChar: char): untyped = ## Use ``openChar`` instead of '{' and ``closeChar`` instead of '}' runnableExamples: let testInt = 123 doAssert "".fmt('<', '>') == "123" doAssert """(()"foo" & "bar"())""".fmt(')', '(') == "(foobar)" doAssert """ ""{"123+123"}"" """.fmt('"', '"') == " \"{246}\" " strformatImpl(pattern, openChar.intVal.char, closeChar.intVal.char) when isMainModule: template check(actual, expected: string) = doAssert actual == expected from strutils import toUpperAscii, repeat # Basic tests let s = "string" check &"{0} {s}", "0 string" check &"{s[0..2].toUpperAscii}", "STR" check &"{-10:04}", "-010" check &"{-10:<04}", "-010" check &"{-10:>04}", "-010" check &"0x{10:02X}", "0x0A" check &"{10:#04X}", "0x0A" check &"""{"test":#>5}""", "#test" check &"""{"test":>5}""", " test" check &"""{"test":#^7}""", "#test##" check &"""{"test": <5}""", "test " check &"""{"test":<5}""", "test " check &"{1f:.3f}", "1.000" check &"Hello, {s}!", "Hello, string!" # Tests for identifiers without parenthesis check &"{s} works{s}", "string worksstring" check &"{s:>7}", " string" doAssert(not compiles(&"{s_works}")) # parsed as identifier `s_works` # Misc general tests check &"{{}}", "{}" check &"{0}%", "0%" check &"{0}%asdf", "0%asdf" check &("\n{\"\\n\"}\n"), "\n\n\n" check &"""{"abc"}s""", "abcs" # String tests check &"""{"abc"}""", "abc" check &"""{"abc":>4}""", " abc" check &"""{"abc":<4}""", "abc " check &"""{"":>4}""", " " check &"""{"":<4}""", " " # Int tests check &"{12345}", "12345" check &"{ - 12345}", "-12345" check &"{12345:6}", " 12345" check &"{12345:>6}", " 12345" check &"{12345:4}", "12345" check &"{12345:08}", "00012345" check &"{-12345:08}", "-0012345" check &"{0:0}", "0" check &"{0:02}", "00" check &"{-1:3}", " -1" check &"{-1:03}", "-01" check &"{10}", "10" check &"{16:#X}", "0x10" check &"{16:^#7X}", " 0x10 " check &"{16:^+#7X}", " +0x10 " # Hex tests check &"{0:x}", "0" check &"{-0:x}", "0" check &"{255:x}", "ff" check &"{255:X}", "FF" check &"{-255:x}", "-ff" check &"{-255:X}", "-FF" check &"{255:x} uNaffeCteD CaSe", "ff uNaffeCteD CaSe" check &"{255:X} uNaffeCteD CaSe", "FF uNaffeCteD CaSe" check &"{255:4x}", " ff" check &"{255:04x}", "00ff" check &"{-255:4x}", " -ff" check &"{-255:04x}", "-0ff" # Float tests check &"{123.456}", "123.456" check &"{-123.456}", "-123.456" check &"{123.456:.3f}", "123.456" check &"{123.456:+.3f}", "+123.456" check &"{-123.456:+.3f}", "-123.456" check &"{-123.456:.3f}", "-123.456" check &"{123.456:1g}", "123.456" check &"{123.456:.1f}", "123.5" check &"{123.456:.0f}", "123" check &"{123.456:>9.3f}", " 123.456" check &"{123.456:9.3f}", " 123.456" check &"{123.456:>9.4f}", " 123.4560" check &"{123.456:>9.0f}", " 123" check &"{123.456:<9.4f}", "123.4560 " # Float (scientific) tests check &"{123.456:e}", "1.234560e+02" check &"{123.456:>13e}", " 1.234560e+02" check &"{123.456:<13e}", "1.234560e+02 " check &"{123.456:.1e}", "1.2e+02" check &"{123.456:.2e}", "1.23e+02" check &"{123.456:.3e}", "1.235e+02" # Note: times.format adheres to the format protocol. Test that this # works: import times var dt = initDateTime(01, mJan, 2000, 00, 00, 00) check &"{dt:yyyy-MM-dd}", "2000-01-01" var tm = fromUnix(0) discard &"{tm}" # Unicode string tests check &"""{"αβγ"}""", "αβγ" check &"""{"αβγ":>5}""", " αβγ" check &"""{"αβγ":<5}""", "αβγ " check &"""a{"a"}α{"α"}€{"€"}𐍈{"𐍈"}""", "aaαα€€𐍈𐍈" check &"""a{"a":2}α{"α":2}€{"€":2}𐍈{"𐍈":2}""", "aa αα €€ 𐍈𐍈 " # Invalid unicode sequences should be handled as plain strings. # Invalid examples taken from: https://stackoverflow.com/a/3886015/1804173 let invalidUtf8 = [ "\xc3\x28", "\xa0\xa1", "\xe2\x28\xa1", "\xe2\x82\x28", "\xf0\x28\x8c\xbc", "\xf0\x90\x28\xbc", "\xf0\x28\x8c\x28" ] for s in invalidUtf8: check &"{s:>5}", repeat(" ", 5-s.len) & s # bug #11089 let flfoo: float = 1.0 check &"{flfoo}", "1.0" # bug #11092 check &"{high(int64)}", "9223372036854775807" check &"{low(int64)}", "-9223372036854775808" import json doAssert fmt"{'a'} {'b'}" == "a b" echo("All tests ok")