Jump to content

Category talk:Wren-fmt: Difference between revisions

→‎Source code: Several improvements, notably the addition of (s)printf style methods.
(Minor bug-fix.)
(→‎Source code: Several improvements, notably the addition of (s)printf style methods.)
Line 1:
===Source code===
<lang ecmascript>/* Module "fmt.wren" */
 
/* Conv contains routines which do conversions between types. */
class Conv {
Line 9:
// All possible digits (upper case).
static upperDigits {
    return "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ"
}

// Largest integer that can be represented exactly: 2^53 - 1.
static maxSafeInt {
    return 9007199254740991
}

// Maps each integer format letter to the prefix identifying its base.
static prefixes {
    return { "b": "0b", "t": "0t", "o": "0o", "d": "0d", "x": "0x", "X": "0X" }
}
 
// Converts an integer to a numeric ASCII string with a base between 2 and 36.
static itoa(n, b) {
Line 27 ⟶ 30:
return ((neg) ? "-" : "") + res[-1..0]
}
 
// Private helper function. Returns a copy of 's' in which the ASCII letters a-z
// have been replaced by A-Z; every other byte is passed through unchanged.
static upper_(s) {
    var out = ""
    for (byte in s.bytes) {
        // 97..122 are the byte values of 'a'..'z'; subtracting 32 gives 'A'..'Z'.
        var isLower = byte >= 97 && byte <= 122
        out = out + String.fromByte(isLower ? byte - 32 : byte)
    }
    return out
}
 
// Like itoa(n, b), except that any letter digits in the result are upper case.
static Itoa(n, b) {
    // Bases below 11 are returned as-is, without the upper-casing pass.
    if (b < 11) return itoa(n, b)
    return upper_(itoa(n, b))
}
 
// Converts a numeric ASCII string with a base between 2 and 36 to an integer.
static atoi(s, b) {
Line 49 ⟶ 52:
if (s == "") Fiber.abort("String must contain some digits.")
s = upper_(s)
if ((s.startsWith("0B") && b != 2) || (s.startsWith("0T") && b != 3) ||
(s.startsWith("0O") && b != 8) || (s.startsWith("0X") && b != 16)) {
Fiber.abort("Inconsistent base specifier.")
}
if (s.startsWith("0B") || s.startsWith("0T") || s.startsWith("0O") || s.startsWith("0X")) {
s = s[2..-1]
if (s == "") Fiber.abort("String after base specifier must contain some digits.")
Line 65 ⟶ 69:
return (neg) ? -res : res
}
 
// Base 10 shorthands for itoa(n, b) and atoi(s, b).
static itoa(s) {
    return itoa(s, 10)
}
static atoi(s) {
    return atoi(s, 10)
}
 
// Integer/bool conversion routines. Both return null when the argument has the wrong type.
// itob: zero maps to false, any other integer to true.
static itob(i) {
    if (!(i is Num && i.isInteger)) return null
    return i != 0
}
// btoi: true maps to 1, false to 0.
static btoi(b) {
    if (!(b is Bool)) return null
    return b ? 1 : 0
}
 
// Integer/character conversion routines. Both return null for unsuitable arguments.
// itoc: accepts an integer codepoint in the range 0..0x10ffff.
static itoc(i) {
    var valid = i is Num && i.isInteger && i >= 0 && i <= 0x10ffff
    return valid ? String.fromCodePoint(i) : null
}
// ctoi: accepts a string whose count is exactly one and returns its first codepoint.
static ctoi(c) {
    if (c is String && c.count == 1) return c.codePoints[0]
    return null
}
 
// Converts an integer to binary.
static bin(n) {
    return itoa(n, 2)
}
// Converts an integer to ternary.
static ter(n) {
    return itoa(n, 3)
}
// Converts an integer to octal.
static oct(n) {
    return itoa(n, 8)
}
// Ensures safe decimal integers printed as such.
static dec(n) {
    return itoa(n, 10)
}
// Converts an integer to hex.
static hex(n) {
    return itoa(n, 16)
}
// Converts an integer to hex (upper case digits).
static Hex(n) {
    return Conv.Itoa(n, 16)
}
 
// Decimal string with an explicit '+' in front of non-negative integers.
static pdec(n) {
    var lead = (n >= 0) ? "+" : ""
    return lead + dec(n)
}
// Decimal string with a space where the '+' would go; negatives keep their '-'.
static mdec(n) {
    var lead = (n >= 0) ? " " : ""
    return lead + dec(n)
}
 
// Converts a non-negative integer to its ordinal equivalent.
static ord(n) {
if (!(n is Num && n.isInteger && n >= 0)) Fiber.abort("Argument must be a non-negative integer.")
Line 104 ⟶ 109:
}
}
 
/* Fmt contains routines which format numbers or strings in various ways. */
class Fmt {
Line 115 ⟶ 120:
return (w > c) ? s + p * (w - c) : s
}
 
// Right justifies 's' in a field of minimum width 'w' using the pad character 'p'.
static rjust(w, s, p) {
Line 124 ⟶ 129:
return (w > c) ? p * (w - c) + s : s
}
 
// Centers 's' in a field of minimum width 'w' using the pad character 'p'.
static cjust(w, s, p) {
Line 135 ⟶ 140:
return p * l + s + p * (w - c - l)
}
 
// Two-argument forms of the justification methods; the pad character is a space.
static ljust(w, s) {
    return ljust(w, s, " ")
}
static rjust(w, s) {
    return rjust(w, s, " ")
}
static cjust(w, s) {
    return cjust(w, s, " ")
}
 
// Right justifies 's' in a field of minimum width 'w' using the pad character '0'.
// Unlike rjust, any sign or elided sign (i.e. space) will be placed before the padding.
Line 153 ⟶ 158:
return sign + "0" * (w - c) + s[1..-1]
}
 
// Private helper method for 'commatize' method.
// Checks whether argument is a numeric decimal string.
Line 164 ⟶ 169:
return n.all { |c| "0123456789".contains(c) }
}
 
// Adds 'thousand separators' to a decimal integer or string.
static commatize(n, c) {
Line 187 ⟶ 192:
return (signed) ? sign + n : n
}
 
// One-argument form of commatize(n, c) with a comma as the separator.
static commatize(n) {
    return commatize(n, ",")
}
 
// Commatizes 'n' (comma separator) and appends the last two characters
// of Conv.ord(n), i.e. its ordinal suffix.
static ordinalize(n) {
    var grouped = commatize(n)
    return grouped + Conv.ord(n)[-2..-1]
}
 
// Private helper method for 'abbreviate' method.
// Converts 's' to a list, takes the elements selected by the range 'r'
// and joins them back into a string.
static sub_(s, r) {
    var elements = s.toList
    return elements[r].join()
}
 
// Abbreviates a string 's' to a maximum number of characters 'w' (non-overlapping) at either end
// or, if 'w' is negative from the front only, using 'sep' as the separator.
Line 209 ⟶ 214:
return sub_(s, 0...le) + sep + ((w >= 0) ? sub_(s, -le..-1) : "")
}
 
// Two-argument form of abbreviate(w, s, sep) with "..." as the separator.
static abbreviate(w, s) {
    return abbreviate(w, s, "...")
}
 
// Gets or sets precision for 'f(w, n)' style convenience methods.
// The getter yields 6 while no precision has been stored.
static precision {
    if (__precision != null) return __precision
    return 6
}
// The setter only stores non-negative integers; anything else leaves the stored
// value untouched. Either way the stored value is returned.
static precision=(p) {
    var accepted = (p is Num) && p.isInteger && p >= 0
    if (accepted) __precision = p
    return __precision
}
 
/* 'Short name' methods, useful for formatting values in interpolated strings. */
// Formats an integer 'n' in (d)ecimal, (b)inary, (t)ernary, (o)ctal, he(x) or upper case he(X).
// Pads with spaces to a minimum width of 'w'.
// Negative 'w' left justifies, non-negative 'w' right justifies.
static d(w, n) {
    if (w >= 0) return rjust(w, Conv.dec(n))
    return ljust(-w, Conv.dec(n))
}
static b(w, n) {
    if (w >= 0) return rjust(w, Conv.bin(n))
    return ljust(-w, Conv.bin(n))
}
// (t)ernary: formats 'n' via Conv.ter, space padded to a minimum width of 'w'.
// Negative 'w' left justifies, non-negative 'w' right justifies.
static t(w, n) { (w >= 0) ? rjust(w, Conv.ter(n)) : ljust(-w, Conv.ter(n)) }
static o(w, n) {
    if (w >= 0) return rjust(w, Conv.oct(n))
    return ljust(-w, Conv.oct(n))
}
static x(w, n) {
    if (w >= 0) return rjust(w, Conv.hex(n))
    return ljust(-w, Conv.hex(n))
}
static X(w, n) {
    if (w >= 0) return rjust(w, Conv.Hex(n))
    return ljust(-w, Conv.Hex(n))
}
 
// As above but pads with leading zeros instead of spaces.
// Any minus sign will be placed before the padding.
// When used with negative 'w' behaves the same as the above methods.
static dz(w, n) {
    if (w >= 0) return zfill(w, Conv.dec(n))
    return ljust(-w, Conv.dec(n))
}
static bz(w, n) {
    if (w >= 0) return zfill(w, Conv.bin(n))
    return ljust(-w, Conv.bin(n))
}
static tz(w, n) {
    if (w >= 0) return zfill(w, Conv.ter(n))
    return ljust(-w, Conv.ter(n))
}
static oz(w, n) {
    if (w >= 0) return zfill(w, Conv.oct(n))
    return ljust(-w, Conv.oct(n))
}
static xz(w, n) {
    if (w >= 0) return zfill(w, Conv.hex(n))
    return ljust(-w, Conv.hex(n))
}
static Xz(w, n) {
    if (w >= 0) return zfill(w, Conv.Hex(n))
    return ljust(-w, Conv.Hex(n))
}
 
// Formats 'n' in decimal, space padded, with a leading '+' if 'n' is non-negative or '-' otherwise.
static dp(w, n) {
    if (w >= 0) return rjust(w, Conv.pdec(n))
    return ljust(-w, Conv.pdec(n))
}

// Decimal with a leading ' ' for non-negative 'n' or '-' otherwise, space padded.
static dm(w, n) {
    if (w >= 0) return rjust(w, Conv.mdec(n))
    return ljust(-w, Conv.mdec(n))
}

// Decimal in commatized form (',' separator), space padded.
static dc(w, n) {
    if (w >= 0) return rjust(w, commatize(Conv.dec(n)))
    return ljust(-w, commatize(Conv.dec(n)))
}

// Ordinal form of a non-negative integer 'n' (via Conv.ord), space padded.
static r(w, n) {
    if (w >= 0) return rjust(w, Conv.ord(n))
    return ljust(-w, Conv.ord(n))
}

// The character for codepoint 'n' (via Conv.itoc), space padded to a minimum width of 'w'.
// Negative 'w' left justifies, non-negative 'w' right justifies.
static c(w, n) {
    if (w >= 0) return rjust(w, Conv.itoc(n))
    return ljust(-w, Conv.itoc(n))
}

// A string or value 'v', space padded to a minimum width of 'w'.
// Negative 'w' left justifies, non-negative 'w' right justifies.
static s(w, v) {
    if (w >= 0) return rjust(w, v)
    return ljust(-w, v)
}
 
// Middles a string or value 'v' within a field of minimum width 'w'. Pads with spaces.
static m(w, v) { cjust(w, v) }
 
// Embeds a string or value 'v' in 'cc', a string with no more than two characters.
Line 262 ⟶ 276:
}
if (len == 0) return (v is String) ? v : "%(v)"
if (len == 1) cc = cc + cc
return "%(cc[0])%(v)%(cc[1])"
}
Line 289 ⟶ 303:
var d = (n - i).abs
var pw = 10.pow(p)
d = (d * pw).round
if (d >= pw) {
ns = "%(Conv.dec(n.round))"
d = 0
}
if (d == 0) return s(w, ns + "." + "0" * p)
var ds = "%(d)"
Line 302 ⟶ 316:
 
// Works like 'f' except replaces any trailing zeros after the decimal point with spaces.
// If the resulting string would end with a decimal point, a zero is first added back.
static g(w, n, p) {
var f = f(w, n, p)
Line 353 ⟶ 367:
static fc(w, n) {
    return fc(w, n, precision)
}
static gc(w, n) {
    return gc(w, n, precision)
}
 
// Private worker method which calls a 'short name' method and returns its result.
// 'fn' is the method's name as a string, 'w' the width, 'e' the value to format and
// 'p' the precision (only forwarded to the 'f' and 'g' families).
// Aborts the fiber if 'fn' is not one of the names listed below.
static callFn_(fn, w, e, p) {
    // Single letter methods.
    if (fn == "d") return d(w, e)
    if (fn == "b") return b(w, e)
    if (fn == "t") return t(w, e)
    if (fn == "o") return o(w, e)
    if (fn == "x") return x(w, e)
    if (fn == "X") return Fmt.X(w, e)
    if (fn == "r") return r(w, e)
    if (fn == "c") return c(w, e)
    if (fn == "s") return s(w, e)
    if (fn == "m") return m(w, e)
    if (fn == "q") return q(e)
    if (fn == "f") return f(w, e, p)
    if (fn == "g") return g(w, e, p)

    // Zero filled variants.
    if (fn == "dz") return dz(w, e)
    if (fn == "bz") return bz(w, e)
    if (fn == "tz") return tz(w, e)
    if (fn == "oz") return oz(w, e)
    if (fn == "xz") return xz(w, e)
    if (fn == "Xz") return Fmt.Xz(w, e)
    if (fn == "fz") return fz(w, e, p)
    if (fn == "gz") return gz(w, e, p)

    // Signed and commatized variants.
    if (fn == "dp") return dp(w, e)
    if (fn == "dm") return dm(w, e)
    if (fn == "dc") return dc(w, e)
    if (fn == "fc") return fc(w, e, p)
    if (fn == "gc") return gc(w, e, p)

    return Fiber.abort("Method not recognized.")
}
 
// Applies a 'short' formatting method to each element of a list or sequence 'seq'.
// The method to be applied is specified (as a string) in 'fn'.
// The parameters to be passed to the method are specified in 'w' and 'p'
// 'p' is needed for 'f', 'g', 'fz', 'gz', 'fc' or 'gc' but is ignored otherwise.
// The resulting strings are then joined together using the separator 'sep'.
// having first applied the 'q' method, with parameter 'cc', to each of them.
Line 366 ⟶ 410:
for (i in 0...seq.count) {
var e = seq[i]
l[i] = q(callFn_(fn, w, e, p), cc)
}
return q(l.join(sep), bb)
Line 397 ⟶ 420:
// Shorter forms of 'v': elements are separated by ", ", the whole result is
// embedded in "[]" and nothing is embedded around the individual elements.
static v(fn, w, seq, p) {
    return v(fn, w, seq, p, ", ", "[]", "")
}
// As above, using the current default precision.
static v(fn, w, seq) {
    return v(fn, w, seq, precision)
}
 
// Provides a 'sprintf' style method where the arguments are passed in a separate list and
// formatted in turn by verbs embedded in a format string. Excess arguments are ignored but
// it is an error to provide insufficient arguments. Verbs must be given in this form:
// $[flag][width][.precision][letter] of which all bracketed items except [letter] are optional.
// The letter must be one of the 'short' methods: b, c, d, f, g, m, o, q, r, s, t, x or X.
// If present, the flag (there can only be one) must be one of the following:
// + always prints a + or - sign ('dp' method)
// (space) leaves a space for the sign but only prints minus ('dm' method)
// , commatizes the following number ('dc', 'fc' or 'gc' methods)
// # adds the appropriate prefix for the number formats: b, t, o, d, x and X.
// * reads the width from the argument before the one to be formatted
// If present, the width is the minimum width (+/-) to be passed to the appropriate method.
// It doesn't include any '#' flag prefix. If [width] is absent, a width of one is passed.
// If present, the precision is the number of decimal places to be passed to the appropriate
// 'f' or 'g' style method. If absent, the default precision is passed.
// Where any optional item is inappropriate to the method being used it is simply ignored.
// Where one of the arguments is a sequence (other than a string) this method senses it
// and applies the 'v' method to it. However, the 'sep' parameter is always a single space
// and the 'bb' and 'cc' parameters are always empty strings. The '#' flag has no effect.
static slwrite(fmt, a) {
    if (!(fmt is String)) Fiber.abort("First argument must be a string.")
    if (!(a is List)) Fiber.abort("Second argument must be a list.")
    if (fmt == "") return ""
    var cps = fmt.codePoints.toList
    var le = cps.count  // number of codepoints
    var s = ""          // accumulates the result string
    var i = 0           // current codepoint index
    var cp = 0          // current codepoint
    var next = 0        // index of next argument to be formatted

    // Gets the next numeric string from the format.
    // Advances 'i' past the current codepoint and then past any run of ASCII digits,
    // leaving 'cp' on the first non-digit. Aborts if the format ends first, since
    // every verb must finish with a letter.
    var getNumber = Fn.new {
        i = i + 1
        if (i == le) Fiber.abort("Invalid format string.")
        cp = cps[i]
        var ns = ""
        while (cp >= 48 && cp <= 57) {
            ns = ns + Conv.itoc(cp)
            i = i + 1
            if (i == le) Fiber.abort("Invalid format string.")
            cp = cps[i]
        }
        return ns
    }

    while (i < le) {
        cp = cps[i]
        if (cp != 36) { // not a dollar sign
            s = s + Conv.itoc(cp)
        } else if (i < le -1 && cps[i + 1] == 36) { // check for $$
            s = s + "$"
            i = i + 1
        } else {
            // Start of a verb: read an optional width that directly follows the '$'.
            var ns = getNumber.call()
            // A flag is only allowed before the width, never after it.
            if (ns != "" && "*+,- #".codePoints.contains(cp)) {
                Fiber.abort("Invalid format string.")
            }
            var plus = false
            var comma = false
            var minus = false
            var space = false
            var hash = false
            var fn = ""
            var ds = ""
            if ("bcdfgmoqrstxX".codePoints.contains(cp)) { // format letter
                fn = Conv.itoc(cp)
            } else if (cp == 42) { // star
                // The width is taken from the next argument rather than the format.
                if (next < a.count) {
                    ns = "%(a[next])"
                    next = next + 1
                } else {
                    Fiber.abort("Insufficient arguments passed.")
                }
                i = i + 1
                // A verb may not end at the star: report it in the same way as getNumber
                // does instead of failing on an out of range subscript.
                if (i == le) Fiber.abort("Invalid format string.")
                cp = cps[i]
                if (cp == 46) ds = getNumber.call()
            } else if (cp == 43) { // plus sign
                plus = true
                ns = getNumber.call()
                if (cp == 46) ds = getNumber.call()
            } else if (cp == 44) { // comma
                comma = true
                ns = getNumber.call()
                if (cp == 46) ds = getNumber.call()
            } else if (cp == 45) { // minus sign
                minus = true
                ns = getNumber.call()
                if (cp == 46) ds = getNumber.call()
            } else if (cp == 46) { // dot
                ds = getNumber.call()
            } else if (cp == 32) { // space
                space = true
                ns = getNumber.call()
                if (cp == 46) ds = getNumber.call()
            } else if (cp == 35) { // hash
                hash = true
                ns = getNumber.call()
                if (cp == 46) ds = getNumber.call()
            } else {
                Fiber.abort("Unrecognized character in format string.")
            }

            // After any flag, width and precision, 'cp' must be the format letter.
            if (fn == "") {
                if (!"bcdfgmoqrstxX".codePoints.contains(cp)) {
                    Fiber.abort("Unrecognized character in format string.")
                }
                fn = Conv.itoc(cp)
            }
            // Map the flag onto the corresponding two letter method.
            if (fn == "d") {
                if (plus) {
                    fn = "dp"
                } else if (space) {
                    fn = "dm"
                } else if (comma) {
                    fn = "dc"
                }
            } else if ((fn == "f" || fn == "g") && comma) {
                fn = fn + "c"
            }
            if (ns == "") ns = "1"
            // A multi-digit width with a leading zero selects the zero filled variant.
            if (ns[0] == "0" && ns.count > 1 && "dbtoxXfg".contains(fn[0])) {
                fn = fn[0] + "z"
            }
            var n = Num.fromString(ns)
            var w = minus ? -n : n
            var p = (ds != "") ? Num.fromString(ds) : precision
            if (next < a.count) {
                var e = a[next]
                if ((e is Sequence) && !(e is String)) {
                    // Non-string sequences are formatted element by element.
                    s = s + Fmt.v(fn, w, e, p, " ", "", "")
                } else {
                    var r = callFn_(fn, w, e, p)
                    if (hash && "btodxX".contains(fn[0])) {
                        // The base prefix goes after a minus sign that starts the result.
                        if (r[0] == "-") {
                            r = "-" + Conv.prefixes[fn[0]] + r[1..-1]
                        } else {
                            r = Conv.prefixes[fn[0]] + r
                        }
                    }
                    s = s + r
                }
                next = next + 1
            } else {
                Fiber.abort("Insufficient arguments passed.")
            }
        }
        i = i + 1
    }
    return s
}
 
// Convenience versions of the 'slwrite' method which allow up to 5 arguments
// to be passed individually rather than in a list.
// Each overload packs its individual arguments into a list and hands it to slwrite.
static swrite(fmt, a1, a2, a3, a4, a5) { slwrite(fmt, [a1, a2, a3, a4, a5]) }
static swrite(fmt, a1, a2, a3, a4) { slwrite(fmt, [a1, a2, a3, a4]) }
static swrite(fmt, a1, a2, a3) { slwrite(fmt, [a1, a2, a3]) }
static swrite(fmt, a1, a2) { slwrite(fmt, [a1, a2]) }
static swrite(fmt, a1) { slwrite(fmt, [a1]) }
 
// Applies slwrite to the arguments and then 'writes' it (no following \n) to stdout.
// The individual-argument overloads collect their arguments into a list for lwrite.
static write(fmt, a1, a2, a3, a4, a5) {
    return lwrite(fmt, [a1, a2, a3, a4, a5])
}
static write(fmt, a1, a2, a3, a4) {
    return lwrite(fmt, [a1, a2, a3, a4])
}
static write(fmt, a1, a2, a3) {
    return lwrite(fmt, [a1, a2, a3])
}
static write(fmt, a1, a2) {
    return lwrite(fmt, [a1, a2])
}
static write(fmt, a1) {
    return lwrite(fmt, [a1])
}
// List form: formats 'a' with slwrite and passes the text to System.write.
static lwrite(fmt, a) {
    var text = slwrite(fmt, a)
    return System.write(text)
}
 
// Applies slwrite to the arguments and then 'prints' it (with a following \n) to stdout.
// The individual-argument overloads collect their arguments into a list for lprint.
static print(fmt, a1, a2, a3, a4, a5) {
    return lprint(fmt, [a1, a2, a3, a4, a5])
}
static print(fmt, a1, a2, a3, a4) {
    return lprint(fmt, [a1, a2, a3, a4])
}
static print(fmt, a1, a2, a3) {
    return lprint(fmt, [a1, a2, a3])
}
static print(fmt, a1, a2) {
    return lprint(fmt, [a1, a2])
}
static print(fmt, a1) {
    return lprint(fmt, [a1])
}
// List form: formats 'a' with slwrite and passes the text to System.print.
static lprint(fmt, a) {
    var text = slwrite(fmt, a)
    return System.print(text)
}
}
 
9,488

edits

Cookies help us deliver our services. By using our services, you agree to our use of cookies.