shithub: mc

Download patch

ref: 52eca667bbd1cf5a929d3f2352c3c1ee8e91625d
parent: 68a437bb6d370781e18ad1b794cc34c21dd5b361
author: Ori Bernstein <ori@eigenstate.org>
date: Mon Dec 25 11:14:38 EST 2017

Formatting as a state machine.

--- a/lib/date/fmt.myr
+++ b/lib/date/fmt.myr
@@ -10,12 +10,7 @@
 const __init__ = {
 	var d : instant
 
-	std.fmtinstall(std.typeof(d), sbfmt, [
-		("D", false),
-		("d", false),
-		("t", false),
-		("f", true),
-	][:])
+	std.fmtinstall(std.typeof(d), sbfmt)
 }
 
 /* Always formats : proleptic Gregorian format */
--- a/lib/date/parse.myr
+++ b/lib/date/parse.myr
@@ -38,7 +38,7 @@
 
 const __init__ = {
 	var fail : parsefail
-	std.fmtinstall(std.typeof(fail), failfmt, [][:])
+	std.fmtinstall(std.typeof(fail), failfmt)
 }
 
 const strparse = {f, s, tz, replace
--- a/lib/escfmt/eschtml.myr
+++ b/lib/escfmt/eschtml.myr
@@ -8,7 +8,7 @@
 
 const __init__ = {
 	var s = ("" : eschtml)
-	std.fmtinstall(std.typeof(s), htmlfmt, [][:])
+	std.fmtinstall(std.typeof(s), htmlfmt)
 }
 
 const html = {s
--- a/lib/escfmt/escre.myr
+++ b/lib/escfmt/escre.myr
@@ -8,7 +8,7 @@
 
 const __init__ = {
 	var s = ("" : escre)
-	std.fmtinstall(std.typeof(s), refmt, [][:])
+	std.fmtinstall(std.typeof(s), refmt)
 }
 
 const re = {s
--- a/lib/escfmt/escsh.myr
+++ b/lib/escfmt/escsh.myr
@@ -8,7 +8,7 @@
 
 const __init__ = {
 	var s = ("" : escsh)
-	std.fmtinstall(std.typeof(s), shfmt, [][:])
+	std.fmtinstall(std.typeof(s), shfmt)
 }
 
 const sh = {s
--- a/lib/escfmt/escurl.myr
+++ b/lib/escfmt/escurl.myr
@@ -8,7 +8,7 @@
 
 const __init__ = {
 	var s = ("" : escurl)
-	std.fmtinstall(std.typeof(s), urlfmt, [][:])
+	std.fmtinstall(std.typeof(s), urlfmt)
 }
 
 const url = {s
--- a/lib/http/client.myr
+++ b/lib/http/client.myr
@@ -196,7 +196,7 @@
 	var m
 
 	m = `Get
-	std.fmtinstall(std.typeof(m), fmtmethod, [][:])
+	std.fmtinstall(std.typeof(m), fmtmethod)
 }
 
 const readchunkedbody = {s, r
--- a/lib/http/url.myr
+++ b/lib/http/url.myr
@@ -12,9 +12,7 @@
 	var u : url#
 
 	u = u
-	std.fmtinstall(std.typeof(u), urlfmt, [
-		("p", false)
-	][:])
+	std.fmtinstall(std.typeof(u), urlfmt)
 }
 
 const urlfmt = {sb, ap, opts
--- a/lib/json/fmt.myr
+++ b/lib/json/fmt.myr
@@ -8,7 +8,7 @@
 const __init__ = {
 	var j : elt
 
-	std.fmtinstall(std.typeof(&j), jsonfmt, [][:])
+	std.fmtinstall(std.typeof(&j), jsonfmt)
 }
 
 const jsonfmt = {sb, ap, opts
--- a/lib/regex/compile.myr
+++ b/lib/regex/compile.myr
@@ -879,7 +879,7 @@
 	match std.vanext(ap)
 	| `Noimpl:	std.sbfmt(sb, "no implementation")
 	| `Incomplete:	std.sbfmt(sb, "regex ended before input fully parsed")
-	| `Unbalanced c:	std.sbfmt(sb, "unbalanced {}", c)
+	| `Unbalanced c:std.sbfmt(sb, "unbalanced {}", c)
 	| `Emptyparen:	std.sbfmt(sb, "empty parentheses")
 	| `Badrep c:	std.sbfmt(sb, "invalid repetition {}", c)
 	| `Badrange s:	std.sbfmt(sb, "invalid range name {}", s)
@@ -899,6 +899,6 @@
 
 const __init__ = {
 	var e : status
-	std.fmtinstall(std.typeof(e), fmtfail, [][:])
+	std.fmtinstall(std.typeof(e), fmtfail)
 }
 
--- a/lib/std/fmt.myr
+++ b/lib/std/fmt.myr
@@ -47,8 +47,7 @@
 
 	/* add a formatter function */
 	const fmtinstall	: (ty : byte[:], \
-		fn : (sb : strbuf#, ap : valist#, opts : (byte[:],byte[:])[:] -> void), \
-		optdesc : (byte[:], bool)[:] \
+		fn : (sb : strbuf#, ap : valist#, opts : (byte[:],byte[:])[:] -> void) \
 		-> void)
 
 	$noret const fatal	: (fmt : byte[:], args : ... -> void)
@@ -55,6 +54,12 @@
 	$noret const fatalv	: (fmt : byte[:], ap : valist# -> void)
 ;;
 
+type parsestate = union
+	`Copy
+	`ParamOpt
+	`ParamArg
+;;
+
 const __init__ = {
 	fmtmap = mkht()
 }
@@ -61,7 +66,6 @@
 
 type fmtdesc = struct
 	fn	: (sb : strbuf#, ap : valist#, opts : (byte[:],byte[:])[:] -> void)
-	optdesc	: (byte[:], bool)[:]
 ;;
 
 /* same as 'put', but exits the program after printing */
@@ -81,10 +85,10 @@
 
 var fmtmap : htab(byte[:], fmtdesc)#
 
-const fmtinstall = {ty, fn, optdesc
+const fmtinstall = {ty, fn
 	match std.htget(fmtmap, ty)
 	| `std.Some _:	std.fatal("doubly installed format\n")
-	| `std.None:	htput(fmtmap, ty, [.fn=fn, .optdesc=sldup(optdesc)])
+	| `std.None:	htput(fmtmap, ty, [.fn=fn])
 	;;
 }
 
@@ -157,39 +161,85 @@
 }
 
 const sbfmtv = {sb, fmt, ap -> size
-	var nfmt, nparams, orig
-	var c, params
+	var buf : byte[256], param : (byte[:], byte[:])[8]
+	var state, startp, endp, starta, nbuf
+	var nfmt, nvarargs, nparam
+	var c
 
-	orig = fmt
-	nparams = ap.tc.nelt
+	nvarargs = ap.tc.nelt
 	nfmt = 0
+	startp = 0
+	starta = 0
+	nparam = 0
+	nbuf = 0
+	endp = 0
+	state = `Copy
 	while fmt.len != 0
 		(c, fmt) = charstep(fmt)
-		match c
-		| '{':
+		match (state, c)
+		/* raw bytes */
+		| (`Copy, '{'):
 			if decode(fmt) == '{'
 				(c, fmt) = charstep(fmt)
 				sbputc(sb, '{')
 			else
-				(params, fmt) = getparams(fmt)
-				nfmt++
-				if nfmt > nparams
-					die("too few params for fmt\n")
-				;;
-
-				fmtval(sb, vatype(ap), ap, params)
+				state = `ParamOpt
+				nparam = 0
+				startp = 0
+				starta = 0
+				nbuf = 0
 			;;
-		| '}':
+		| (`Copy, '}'):
 			if decode(fmt) == '}'
 				sbputc(sb, '}')
 			;;
-		| chr:
+		| (`Copy, chr):
 			sbputc(sb, chr)
+
+		/* {param */
+		| (`ParamOpt, '='):
+			state = `ParamArg
+			endp = nbuf
+			starta = nbuf
+		| (`ParamOpt, ','):
+			if startp != nbuf
+				param[nparam++] = (buf[startp:nbuf], "")
+			;;
+		| (`ParamOpt, '}'):
+			state = `Copy
+			if startp != nbuf
+				param[nparam++] = (buf[startp:nbuf], "")
+			;;
+			fmtval(sb, vatype(ap), ap, param[:nparam])
+			nfmt++
+		| (`ParamOpt, '\\'):
+			(c, fmt) = charstep(fmt)
+			nbuf += std.encode(buf[nbuf:], c)
+		| (`ParamOpt, chr):
+			nbuf += std.encode(buf[nbuf:], chr)
+
+		/* {param=arg} */
+		| (`ParamArg, ','):
+			state = `ParamOpt
+			param[nparam++] = (buf[startp:endp], buf[starta:nbuf])
+			startp = nbuf
+			endp = nbuf
+		| (`ParamArg, '}'):
+			state = `Copy
+			if startp != nbuf
+				param[nparam++] = (buf[startp:endp], buf[starta:nbuf])
+			;;
+			fmtval(sb, vatype(ap), ap, param[:nparam])
+			nfmt++
+		| (`ParamArg, '\\'):
+			(c, fmt) = charstep(fmt)
+			nbuf += std.encode(buf[nbuf:], c)
+		| (`ParamArg, chr):
+			nbuf += std.encode(buf[nbuf:], chr)
 		;;
 :fmtdone
 	;;
-	if nfmt != nparams
-		write(1, orig)
+	if nfmt != nvarargs
 		die("too many params for fmt\n")
 	;;
 	-> sb.len
@@ -196,68 +246,14 @@
 }
 
 const fmtval = {sb, ty, ap, params
-	var pl
-
 	match htget(fmtmap, ty)
 	| `Some f:
-		pl = parseparams(params, f.optdesc)
-		f.fn(sb, ap, pl)
-		std.slfree(pl)
+		f.fn(sb, ap, params)
 	| `None:
 		fallbackfmt(sb, params, ty, ap)
 	;;
 }
 
-const parseparams = {paramstr, optdesc
-	var params, opts
-	var o, a, ha, gotarg, found
-
-	opts = [][:]
-	if optdesc.len == 0 && paramstr.len > 0
-		std.fatal("invalid format options {}\n")
-	;;
-	params = strsplit(paramstr, ",")
-	for p : params
-		/* parse out the key/value pair */
-		match std.strfind(p, "=")
-		| `std.Some idx:
-			o = p[:idx]
-			a = p[idx+1:]
-			gotarg = true
-		| `std.None:
-			o = p
-			a = ""
-			gotarg = false
-		;;
-
-		found = false
-		/* verify and add the arg */
-		for (opt, hasarg) : optdesc
-			if !std.sleq(opt, o)
-				continue
-			;;
-			found = true
-			ha = hasarg
-			if ha == gotarg
-				std.slpush(&opts, (o, a))
-			else
-				std.fatal("invalid arg {} for option {}", a, o)
-			;;
-		;;
-		if !found
-			std.put("options: \n")
-			for (opt, hasarg) : optdesc
-				std.put("\t'{}', hasarg={}\n", opt, hasarg)
-			;;
-			std.put("invalid option '{}' ", o)
-			std.die("dying")
-		;;
-	;;
-	slfree(params)
-	-> opts
-}
-
-
 const fallbackfmt = {sb, params, tyenc, ap : valist# -> void
 	/* value types */
 	var t_val : bool
@@ -369,7 +365,7 @@
 		subap = vaenter(ap)
 		sbputs(sb, "[")
 		while subap.tc.nelt != 0
-			fmtval(sb, vatype(&subap), &subap, "")
+			fmtval(sb, vatype(&subap), &subap, [][:])
 			if subap.tc.nelt > 0
 				sbfmt(sb, ", ")
 			;;
@@ -381,7 +377,7 @@
 		subap = vaenter(ap)
 		sbfmt(sb, "(")
 		for var i = 0; i < subap.tc.nelt; i++
-			fmtval(sb, vatype(&subap), &subap, "")
+			fmtval(sb, vatype(&subap), &subap, [][:])
 			if subap.tc.nelt == 1
 				sbfmt(sb, ",")
 			elif i != subap.tc.nelt -1
@@ -396,7 +392,7 @@
 		for var i = 0; i < subap.tc.nelt; i++
 			(subname, subenc) = ncpeek(&subap.tc)
 			sbfmt(sb, ".{}=", subname)
-			fmtval(sb, vatype(&subap), &subap, "")
+			fmtval(sb, vatype(&subap), &subap, [][:])
 			if subap.tc.nelt == 1
 				sbfmt(sb, ",")
 			elif i != subap.tc.nelt -1
@@ -420,7 +416,7 @@
 		| `Tynone:
 		| _:
 			sbputc(sb, ' ')
-			fmtval(sb, subenc, &subap, "")
+			fmtval(sb, subenc, &subap, [][:])
 		;;
 		vabytes(ap)
 	| `Tyname (name, desc):
@@ -431,28 +427,28 @@
 }
 
 const fmtslice = {sb, subap, params
-	var opts, join, joined
+	var join, joined
 
-	opts = parseparams(params, [
-		("j", true),
-	][:])
 	join = ", "
 	joined = false
-	for o : opts
-		match o
+	for p : params
+		match p
 		| ("j", j):
 			joined = true
 			join = j
-		| _:	std.die("unreacahable")
+		| (opt, arg):
+			std.write(2, "fmt: \0")
+			std.write(2, opt)
+			std.write(2, "\0arg: ")
+			std.write(2, arg)
+			std.die("unreacahable")
 		;;
 	;;
-	std.slfree(opts)
-
 	if !joined
 		sbputs(sb, "[")
 	;;
 	while subap.tc.nelt != 0
-		fmtval(sb, vatype(&subap), &subap, "")
+		fmtval(sb, vatype(&subap), &subap, [][:])
 		if subap.tc.nelt > 0
 			sbfmt(sb, join)
 		;;
@@ -462,19 +458,6 @@
 	;;
 }
 
-const getparams = {fmt
-	var i
-
-	for i = 0; i < fmt.len; i++
-		if fmt[i] == ('}' : byte)
-			goto foundparams
-		;;
-	;;
-	die("invalid format string")
-:foundparams
-	-> (fmt[:i], fmt[i+1:])
-}
-
 type intparams = struct
 	base	: size
 	padto	: size
@@ -483,7 +466,6 @@
 
 const intparams = {params
 	var ip : intparams
-	var opts
 
 	ip = [
 		.base = 10,
@@ -491,27 +473,25 @@
 		.padto = 0
 	]
 
-	opts = parseparams(params, [
-		("b", true),
-		("x", false),
-		("w", true),
-		("p", true)][:])
-	for o : opts
-		match o
+	for p : params
+		match p
 		| ("b", bas):	ip.base = getint(bas, "fmt: base must be integer")
 		| ("x", ""):	ip.base = 16
 		| ("w", wid):	ip.padto = getint(wid, "fmt: width must be integer")
 		| ("p", pad):	ip.padfill = decode(pad)
-		| _:	std.die("unreachable")
+		| (opt, arg):	
+			std.write(2, "fmt: ")
+			std.write(2, opt)
+			std.write(2, "arg: ")
+			std.write(2, arg)
+			std.die("\nunreachable\n")
 		;;
 	;;
 	iassert(ip.padto >= 0, "pad must be >= 0")
-	std.slfree(opts)
 	-> ip
 }
 
 const strfmt = {sb, str, params
-	var opts
 	var w, p, i, raw, esc
 
 	p = ' '
@@ -518,24 +498,17 @@
 	w = 0
 	raw = false
 	esc = false
-	opts = parseparams(params, [
-		("w", true),
-		("p", true),
-		("r", false),
-		("e", false),
-	][:])
 
-	for o : opts
-		match o
+	for pp : params
+		match pp
 		| ("w", wid):	w = getint(wid, "fmt: width must be integer")
 		| ("p", pad):	p = decode(pad)
 		| ("r", ""):	raw = true
 		| ("e", ""):	esc = true
-		| _:	std.die("unreachable")
+		| _:	std.die("unreachable\n")
 		;;
 	;;
 	iassert(p >= 0, "pad must be >= 0")
-	std.slfree(opts)
 	if raw
 		for b : str
 			if esc
--- a/lib/std/fmtfuncs.myr
+++ b/lib/std/fmtfuncs.myr
@@ -17,9 +17,9 @@
 
 	bigint = mkbigint(0)
 	bitset = mkbs()
-	fmtinstall(typeof(bigint), bigfmt, [][:])
-	fmtinstall(typeof(bitset), bsfmt, [][:])
-	fmtinstall(typeof(ipaddr), ipfmt, [][:])
+	fmtinstall(typeof(bigint), bigfmt)
+	fmtinstall(typeof(bitset), bsfmt)
+	fmtinstall(typeof(ipaddr), ipfmt)
 	bigfree(bigint)
 	bsfree(bitset)
 }
--- a/lib/std/test/fmt.myr
+++ b/lib/std/test/fmt.myr
@@ -109,11 +109,8 @@
 
 	x = 0
 	p = [.x=0, .y=0]
-	std.fmtinstall(std.typeof(x), intfmt, [][:])
-	std.fmtinstall(std.typeof(p), pairfmt, [
-		("x", true),
-		("y", false)
-	][:])
+	std.fmtinstall(std.typeof(x), intfmt)
+	std.fmtinstall(std.typeof(p), pairfmt)
 
 	/* single value */
 	check("formatted an int: 0", "{}", 0)