1
0
pretty/test/test_pstring.lua

288 lines
9.4 KiB
Lua

local SUITE = require 'TestSuite' 'string'
SUITE:setEnvironment{
format = require('pretty')
}
--------------------------------------------------------------------------------
-- Compat
if not loadstring then loadstring = load end -- Lua 5.3 compat
--
local function format_test (t)
SUITE:addTest(t.name or t.expect, function (mode)
local fmt = format(t.input, t.options)
--
assert_equal(t.expect, fmt)
if mode == 'format' then return end
--
local chunk, load_error_msg = loadstring('return '..fmt)
if not chunk then error(load_error_msg) end
if mode == 'parse' then return end
--
local output = chunk()
assert_equal(t.input, output)
end, { line = debug.getinfo(2).currentline, data = {
'format',
not t.not_idempotent and 'parse' or nil,
not t.not_idempotent and 'idempotent' or nil,
}})
end
--------------------------------------------------------------------------------
-- Shortform Strings
format_test {
input = 'Hello World',
expect = '\'Hello World\'',
}
format_test {
input = 'Hello \'World\'',
expect = '\'Hello \\\'World\\\'\'',
}
format_test {
input = 'Hello \"World\"',
expect = '\'Hello \"World\"\'',
}
format_test {
input = 'Hello [[World]]',
expect = '\'Hello [[World]]\'',
}
format_test {
input = '\'Hello\' [[World]]',
expect = '\'\\\'Hello\\\' [[World]]\'',
}
format_test {
input = '\'Hello\' \"there\" [[World]]',
expect = '\'\\\'Hello\\\' \"there\" [[World]]\'',
}
format_test {
input = '\'Hello\' \"there\" [=[World]=]',
expect = '\'\\\'Hello\\\' \"there\" [=[World]=]\'',
}
format_test {
input = '\nHello World',
expect = [['\nHello World']],
}
format_test {
input = '\'\"\n',
expect = [['\'"\n']],
}
format_test {
input = '\n',
expect = '\'\\n\'',
}
format_test {
input = '\\',
expect = [['\\']],
}
format_test {
input = '\000',
expect = '\'\\000\'',
}
format_test {
input = '\a\b\v\r\f',
expect = [['\a\b\v\r\f']],
}
--------------------------------------------------------------------------------
-- Cut Strings
format_test {
name = 'Cut string basics',
not_idempotent = true,
input = {'Lorem ipsum dolor sit amet, consectetur adipiscing elit. Nunc vestibulum tempus ligula. Sed ac lobortis mi.'},
expect = '{\n \'Lorem ipsum dolor sit amet, consectet\'...\n}',
}
format_test {
name = 'Cut strings are cut after escaping',
not_idempotent = true,
input = {'Lorem\tipsum\tdolor\tsit\tamet,\tconsectetur\tadipiscing\telit.\tNunc\tvestibulum\ttempus\tligula.\tSed\tac\tlobortis\tmi.'},
expect = '{\n \'Lorem\\tipsum\\tdolor\\tsit\\tamet,\\tcons\'...\n}',
}
format_test {
name = 'Cut strings are cut after escaping 2',
not_idempotent = true,
input = {'Lorem ipsum dolor sit amet, conse\t\t\tctetur adipiscing elit. Nunc vestibulum tempus ligula. Sed ac lobortis mi.'},
expect = '{\n \'Lorem ipsum dolor sit amet, conse\\t\\t\'...\n}',
}
format_test {
name = 'Cut strings are not cut in the middle of an escape code',
not_idempotent = true,
input = {'Lorem ipsum dolor sit amet, consec\t\t\ttetur adipiscing elit. Nunc vestibulum tempus ligula. Sed ac lobortis mi.'},
expect = '{\n \'Lorem ipsum dolor sit amet, consec\\t\'...\n}',
}
format_test {
name = 'Cut strings are not cut in the middle of backslash sequence',
not_idempotent = true,
input = {'Lorem ipsum dolor sit amet, consec\\\\\\\\\\\\\\tetur adipiscing elit. Nunc vestibulum tempus ligula. Sed ac lobortis mi.'},
expect = '{\n \'Lorem ipsum dolor sit amet, consec\\\\\'...\n}',
}
format_test {
name = 'Cut strings are not cut in the middle of escaping \\',
not_idempotent = true,
input = {'Lorem ipsum dolor sit amet, conse\\\\\\\\ctetur adipiscing elit. Nunc vestibulum tempus ligula. Sed ac lobortis mi.'},
expect = '{\n \'Lorem ipsum dolor sit amet, conse\\\\\\\\\'...\n}',
}
format_test {
name = 'Cut strings are not cut in the middle of decimal escape codes',
not_idempotent = true,
input = {'Lorem ipsum dolor sit amet, consect\014etur adipiscing elit. Nunc vestibulum tempus ligula. Sed ac lobortis mi.'},
expect = '{\n \'Lorem ipsum dolor sit amet, consect\'...\n}',
}
format_test {
name = 'Cut strings can shorten decimal escape codes, if necessary and possible',
not_idempotent = true,
input = {'Lorem ipsum dolor sit amet, consec\014tetur adipiscing elit. Nunc vestibulum tempus ligula. Sed ac lobortis mi.'},
expect = '{\n \'Lorem ipsum dolor sit amet, consec\\14\'...\n}',
}
format_test {
name = 'Cut strings can shorten decimal escape codes, if necessary and possible, but will keep them as long as possible',
not_idempotent = true,
input = {'Lorem ipsum dolor sit amet, consec\004tetur adipiscing elit. Nunc vestibulum tempus ligula. Sed ac lobortis mi.'},
expect = '{\n \'Lorem ipsum dolor sit amet, consec\\04\'...\n}',
}
--------------------------------------------------------------------------------
-- Concatted Strings
format_test {
name = 'Concatted string basics',
input = 'Lorem ipsum dolor sit amet, consectetur adipiscing elit. Nunc vestibulum tempus ligula. Sed \004\002\000 ac lobortis mi.',
expect = [['Lorem ipsum dolor sit amet, consectetur adipiscing elit. Nunc vestibulum te' ..]]..'\n'..[['mpus ligula. Sed \004\002\000 ac lobortis mi.']],
}
format_test {
name = 'Concatted string basics 2',
input = 'Lorem ipsum dolor sit amet, consectetur adipiscing elit.\004\002\000Nunc vestibulum tempus ligula. Sed ac lobortis mi.',
expect = [['Lorem ipsum dolor sit amet, consectetur adipiscing elit.\004\002\000Nunc ve' ..]]..'\n'..[['stibulum tempus ligula. Sed ac lobortis mi.']],
}
format_test {
name = 'Concatted string with decimal escape at border',
input = 'Lorem ipsum dolor sit amet, consectetur adipiscing elit.Nunc vestibu\004\255\000lum tempus ligula. Sed ac lobortis mi.',
expect = [['Lorem ipsum dolor sit amet, consectetur adipiscing elit.Nunc vestibu\004' ..]]..'\n'..[['\255\000lum tempus ligula. Sed ac lobortis mi.']],
}
format_test {
name = 'Concatted string with decimal escape at border 2',
input = 'Lorem ipsum dolor sit amet, consectetur adipiscing elit.Nunc vestibu\004\002\000lum tempus ligula. Sed ac lobortis mi.',
expect = [['Lorem ipsum dolor sit amet, consectetur adipiscing elit.Nunc vestibu\004\02' ..]]..'\n'..[['\000lum tempus ligula. Sed ac lobortis mi.']],
}
--------------------------------------------------------------------------------
-- Longform Strings
local LONG_STRING = [[
Lorem ipsum dolor sit amet, consectetur adipiscing elit.
Nunc vestibulum tempus ligula. Sed ac lobortis mi.
Morbi eu arcu id nunc cursus auctor. Nulla enim tortor, sodales ut nunc non,
euismod aliquam libero. Aliquam neque est, iaculis in nibh vel, mollis ultricies
ante. Sed egestas et massa sit amet posuere. Integer at suscipit lorem, non
consectetur lacus. Vivamus ac facilisis sem. Proin lacinia ex eu volutpat
interdum.
]]
format_test {
name = 'Longform string basics',
input = LONG_STRING,
expect = '[[\n'..LONG_STRING..']]'
}
local LONG_STRING_WITH_LEVELS = [=[
Lorem ipsum dolor sit amet, consectetur adipiscing elit. Nunc vestibulum tempus
ligula. Sed ac lobortis mi. [Morbi eu arcu id nunc cursus auctor. [Nulla enim
tortor, sodales ut nunc non, euismod aliquam libero.]] Aliquam neque est,
iaculis in nibh vel, mollis ultricies ante. Sed egestas et massa sit amet
posuere. Integer at suscipit lorem, non consectetur lacus. Vivamus ac facilisis
sem. Proin lacinia ex eu volutpat interdum.
]=]
format_test {
name = 'Longform string that requires level 1',
input = LONG_STRING_WITH_LEVELS,
expect = '[=[\n'..LONG_STRING_WITH_LEVELS..']=]'
}
local LONG_STRING_WITH_HIGH_LEVELS = [[
Lorem ipsum dolor sit amet, consectetur adipiscing elit. Nunc vestibulum tempus
ligula. Sed ac lobortis mi. [=[Morbi eu arcu id nunc cursus auctor. [Nulla enim
tortor, sodales ut nunc non, euismod aliquam libero.]=] Aliquam neque est,
iaculis in nibh vel, mollis ultricies ante. Sed egestas et massa sit amet
posuere. Integer at suscipit lorem, non consectetur lacus. Vivamus ac facilisis
sem. Proin lacinia ex eu volutpat interdum.
]]
format_test {
name = 'Longform string that requires level 0, but not 1',
input = LONG_STRING_WITH_HIGH_LEVELS,
expect = '[[\n'..LONG_STRING_WITH_HIGH_LEVELS..']]'
}
--------------------------------------------------------------------------------
-- Unicode
format_test {
input = 'ø',
expect = '\'ø\'',
}
format_test {
name = 'Single utf8 continuation byte is escaped',
input = 'abc\169def',
expect = '\'abc\\169def\'',
}
format_test {
name = 'Multiple utf8 continuation bytes are escaped',
input = 'abc\169\190\169\169def',
expect = '\'abc\\169\\190\\169\\169def\'',
}
format_test {
name = 'Single start byte utf8 chars is escaped',
input = 'abc\255def',
expect = '\'abc\\255def\'',
}
--------------------------------------------------------------------------------
do
local data = {}
for str, name in SUITE:getExamples 'STRING_UTF8' do
data[#data+1] = { name, str }
end
SUITE:addTest('UTF8 Idempotency', function (_, str)
assert_equal(str, loadstring('return '..format(str))() )
end, { data = data })
end
--------------------------------------------------------------------------------
return SUITE