Fixed up some edge cases with as_lua_id and from_lua_id that were
producing bad results.
This commit is contained in:
parent
331b22b3a3
commit
b615cb5c8e
25
string2.lua
25
string2.lua
@ -143,8 +143,6 @@ local string2 = {
|
|||||||
return '"' .. escaped .. '"'
|
return '"' .. escaped .. '"'
|
||||||
end,
|
end,
|
||||||
as_lua_id = function(str)
|
as_lua_id = function(str)
|
||||||
local orig = str
|
|
||||||
str = gsub(str, "^ *$", "%1 ")
|
|
||||||
str = gsub(str, "x([0-9A-F][0-9A-F])", "x78%1")
|
str = gsub(str, "x([0-9A-F][0-9A-F])", "x78%1")
|
||||||
str = gsub(str, "%W", function(c)
|
str = gsub(str, "%W", function(c)
|
||||||
if c == ' ' then
|
if c == ' ' then
|
||||||
@ -159,18 +157,37 @@ local string2 = {
|
|||||||
return str
|
return str
|
||||||
end,
|
end,
|
||||||
from_lua_id = function(str)
|
from_lua_id = function(str)
|
||||||
if not (is_lua_id("^_+(.*)$")) then
|
if not (is_lua_id(str:match("^_*(.*)$"))) then
|
||||||
str = str:sub(2, -1)
|
str = str:sub(2, -1)
|
||||||
end
|
end
|
||||||
str = gsub(str, "_", " ")
|
str = gsub(str, "_", " ")
|
||||||
str = gsub(str, "x([0-9A-F][0-9A-F])", function(hex)
|
str = gsub(str, "x([0-9A-F][0-9A-F])", function(hex)
|
||||||
return char(tonumber(hex, 16))
|
return char(tonumber(hex, 16))
|
||||||
end)
|
end)
|
||||||
str = gsub(str, "^ ([ ]*)$", "%1")
|
|
||||||
return str
|
return str
|
||||||
end
|
end
|
||||||
}
|
}
|
||||||
for k, v in pairs(string) do
|
for k, v in pairs(string) do
|
||||||
string2[k] = string2[k] or v
|
string2[k] = string2[k] or v
|
||||||
end
|
end
|
||||||
|
local _list_0 = {
|
||||||
|
"",
|
||||||
|
"_",
|
||||||
|
" ",
|
||||||
|
"return",
|
||||||
|
"asdf",
|
||||||
|
"one two",
|
||||||
|
"one_two",
|
||||||
|
"Hex2Dec",
|
||||||
|
"He-ec",
|
||||||
|
"\3"
|
||||||
|
}
|
||||||
|
for _index_0 = 1, #_list_0 do
|
||||||
|
local test = _list_0[_index_0]
|
||||||
|
local lua_id = string2.as_lua_id(test)
|
||||||
|
assert(is_lua_id(lua_id), "failed to convert '" .. tostring(test) .. "' to a valid Lua identifier (got '" .. tostring(lua_id) .. "')")
|
||||||
|
local roundtrip = string2.from_lua_id(lua_id)
|
||||||
|
assert(roundtrip == test, "Failed lua_id roundtrip: '" .. tostring(test) .. "' -> " .. tostring(lua_id) .. " -> " .. tostring(roundtrip))
|
||||||
|
end
|
||||||
|
assert(string2.as_lua_id('') == '_')
|
||||||
return string2
|
return string2
|
||||||
|
13
string2.moon
13
string2.moon
@ -67,10 +67,6 @@ string2 = {
|
|||||||
-- but not idempotent. In logic terms: (x != y) => (as_lua_id(x) != as_lua_id(y)),
|
-- but not idempotent. In logic terms: (x != y) => (as_lua_id(x) != as_lua_id(y)),
|
||||||
-- but not (as_lua_id(a) == b) => (as_lua_id(b) == b).
|
-- but not (as_lua_id(a) == b) => (as_lua_id(b) == b).
|
||||||
as_lua_id: (str)->
|
as_lua_id: (str)->
|
||||||
orig = str
|
|
||||||
-- Empty strings are not valid lua identifiers, so treat them like " ",
|
|
||||||
-- and treat " " as " ", etc. to preserve injectivity.
|
|
||||||
str = gsub str, "^ *$", "%1 "
|
|
||||||
-- Escape 'x' (\x78) when it precedes something that looks like an uppercase hex sequence.
|
-- Escape 'x' (\x78) when it precedes something that looks like an uppercase hex sequence.
|
||||||
-- This way, all Lua IDs can be unambiguously reverse-engineered, but normal usage
|
-- This way, all Lua IDs can be unambiguously reverse-engineered, but normal usage
|
||||||
-- of 'x' won't produce ugly Lua IDs.
|
-- of 'x' won't produce ugly Lua IDs.
|
||||||
@ -88,13 +84,18 @@ string2 = {
|
|||||||
-- from_lua_id(as_lua_id(str)) == str, but behavior is unspecified for inputs that
|
-- from_lua_id(as_lua_id(str)) == str, but behavior is unspecified for inputs that
|
||||||
-- did not come from as_lua_id()
|
-- did not come from as_lua_id()
|
||||||
from_lua_id: (str)->
|
from_lua_id: (str)->
|
||||||
unless is_lua_id("^_+(.*)$")
|
unless is_lua_id(str\match("^_*(.*)$"))
|
||||||
str = str\sub(2,-1)
|
str = str\sub(2,-1)
|
||||||
str = gsub(str, "_", " ")
|
str = gsub(str, "_", " ")
|
||||||
str = gsub(str, "x([0-9A-F][0-9A-F])", (hex)-> char(tonumber(hex, 16)))
|
str = gsub(str, "x([0-9A-F][0-9A-F])", (hex)-> char(tonumber(hex, 16)))
|
||||||
str = gsub(str, "^ ([ ]*)$", "%1")
|
|
||||||
return str
|
return str
|
||||||
}
|
}
|
||||||
for k,v in pairs(string) do string2[k] or= v
|
for k,v in pairs(string) do string2[k] or= v
|
||||||
|
|
||||||
|
for test in *{"", "_", " ", "return", "asdf", "one two", "one_two", "Hex2Dec", "He-ec", "\3"}
|
||||||
|
lua_id = string2.as_lua_id(test)
|
||||||
|
assert is_lua_id(lua_id), "failed to convert '#{test}' to a valid Lua identifier (got '#{lua_id}')"
|
||||||
|
roundtrip = string2.from_lua_id(lua_id)
|
||||||
|
assert roundtrip == test, "Failed lua_id roundtrip: '#{test}' -> #{lua_id} -> #{roundtrip}"
|
||||||
|
|
||||||
return string2
|
return string2
|
||||||
|
Loading…
Reference in New Issue
Block a user