Fixed up some edge cases with as_lua_id and from_lua_id that were

producing bad results.
This commit is contained in:
Bruce Hill 2018-10-03 16:14:17 -07:00
parent 331b22b3a3
commit b615cb5c8e
2 changed files with 28 additions and 10 deletions

View File

@ -143,8 +143,6 @@ local string2 = {
return '"' .. escaped .. '"'
end,
as_lua_id = function(str)
local orig = str
str = gsub(str, "^ *$", "%1 ")
str = gsub(str, "x([0-9A-F][0-9A-F])", "x78%1")
str = gsub(str, "%W", function(c)
if c == ' ' then
@ -159,18 +157,37 @@ local string2 = {
return str
end,
from_lua_id = function(str)
if not (is_lua_id("^_+(.*)$")) then
if not (is_lua_id(str:match("^_*(.*)$"))) then
str = str:sub(2, -1)
end
str = gsub(str, "_", " ")
str = gsub(str, "x([0-9A-F][0-9A-F])", function(hex)
return char(tonumber(hex, 16))
end)
str = gsub(str, "^ ([ ]*)$", "%1")
return str
end
}
for k, v in pairs(string) do
string2[k] = string2[k] or v
end
local _list_0 = {
"",
"_",
" ",
"return",
"asdf",
"one two",
"one_two",
"Hex2Dec",
"He-ec",
"\3"
}
for _index_0 = 1, #_list_0 do
local test = _list_0[_index_0]
local lua_id = string2.as_lua_id(test)
assert(is_lua_id(lua_id), "failed to convert '" .. tostring(test) .. "' to a valid Lua identifier (got '" .. tostring(lua_id) .. "')")
local roundtrip = string2.from_lua_id(lua_id)
assert(roundtrip == test, "Failed lua_id roundtrip: '" .. tostring(test) .. "' -> " .. tostring(lua_id) .. " -> " .. tostring(roundtrip))
end
assert(string2.as_lua_id('') == '_')
return string2

View File

@ -67,10 +67,6 @@ string2 = {
-- but not idempotent. In logic terms: (x != y) => (as_lua_id(x) != as_lua_id(y)),
-- but not (as_lua_id(a) == b) => (as_lua_id(b) == b).
as_lua_id: (str)->
orig = str
-- Empty strings are not valid lua identifiers, so treat them like " ",
-- and treat " " as " ", etc. to preserve injectivity.
str = gsub str, "^ *$", "%1 "
-- Escape 'x' (\x78) when it precedes something that looks like an uppercase hex sequence.
-- This way, all Lua IDs can be unambiguously reverse-engineered, but normal usage
-- of 'x' won't produce ugly Lua IDs.
@ -88,13 +84,18 @@ string2 = {
-- from_lua_id(as_lua_id(str)) == str, but behavior is unspecified for inputs that
-- did not come from as_lua_id()
from_lua_id: (str)->
unless is_lua_id("^_+(.*)$")
unless is_lua_id(str\match("^_*(.*)$"))
str = str\sub(2,-1)
str = gsub(str, "_", " ")
str = gsub(str, "x([0-9A-F][0-9A-F])", (hex)-> char(tonumber(hex, 16)))
str = gsub(str, "^ ([ ]*)$", "%1")
return str
}
for k,v in pairs(string) do string2[k] or= v
for test in *{"", "_", " ", "return", "asdf", "one two", "one_two", "Hex2Dec", "He-ec", "\3"}
lua_id = string2.as_lua_id(test)
assert is_lua_id(lua_id), "failed to convert '#{test}' to a valid Lua identifier (got '#{lua_id}')"
roundtrip = string2.from_lua_id(lua_id)
assert roundtrip == test, "Failed lua_id roundtrip: '#{test}' -> #{lua_id} -> #{roundtrip}"
return string2