local stringx = require 'pl.stringx' local utils = require 'pl.utils' local asserteq = require 'pl.test' . asserteq local T = require 'pl.test'.tuple local function FIX(s) io.stderr:write('FIX:' .. s .. '\n') end -- isalpha asserteq(T(stringx.isalpha''), T(false)) asserteq(T(stringx.isalpha' '), T(false)) asserteq(T(stringx.isalpha'0'), T(false)) asserteq(T(stringx.isalpha'\0'), T(false)) asserteq(T(stringx.isalpha'azAZ'), T(true)) asserteq(T(stringx.isalpha'az9AZ'), T(false)) -- isdigit asserteq(T(stringx.isdigit''), T(false)) asserteq(T(stringx.isdigit' '), T(false)) asserteq(T(stringx.isdigit'a'), T(false)) asserteq(T(stringx.isdigit'0123456789'), T(true)) -- isalnum asserteq(T(stringx.isalnum''), T(false)) asserteq(T(stringx.isalnum' '), T(false)) asserteq(T(stringx.isalnum('azAZ01234567890')), T(true)) -- isspace asserteq(T(stringx.isspace''), T(false)) asserteq(T(stringx.isspace' '), T(true)) asserteq(T(stringx.isspace' \r\n\f\t'), T(true)) asserteq(T(stringx.isspace' \r\n-\f\t'), T(false)) -- islower asserteq(T(stringx.islower''), T(false)) asserteq(T(stringx.islower'az'), T(true)) asserteq(T(stringx.islower'aMz'), T(false)) asserteq(T(stringx.islower'a z'), T(true)) -- isupper asserteq(T(stringx.isupper''), T(false)) asserteq(T(stringx.isupper'AZ'), T(true)) asserteq(T(stringx.isupper'AmZ'), T(false)) asserteq(T(stringx.isupper'A Z'), T(true)) -- startswith local startswith = stringx.startswith asserteq(T(startswith('', '')), T(true)) asserteq(T(startswith('', 'a')), T(false)) asserteq(T(startswith('a', '')), T(true)) asserteq(T(startswith('a', 'a')), T(true)) asserteq(T(startswith('a', 'b')), T(false)) asserteq(T(startswith('a', 'ab')), T(false)) asserteq(T(startswith('abc', 'ab')), T(true)) asserteq(T(startswith('abc', 'bc')), T(false)) -- off by one asserteq(T(startswith('abc', '.')), T(false)) -- Lua pattern char asserteq(T(startswith('a\0bc', 'a\0b')), T(true)) -- '\0' asserteq(startswith('abcfoo',{'abc','def'}),true) asserteq(startswith('deffoo',{'abc','def'}),true) asserteq(startswith('cdefoo',{'abc','def'}),false) -- endswith -- http://snippets.luacode.org/sputnik.lua?p=snippets/Check_string_ends_with_other_string_74 local endswith = stringx.endswith asserteq(T(endswith("", "")), T(true)) asserteq(T(endswith("", "a")), T(false)) asserteq(T(endswith("a", "")), T(true)) asserteq(T(endswith("a", "a")), T(true)) asserteq(T(endswith("a", "A")), T(false)) -- case sensitive asserteq(T(endswith("a", "aa")), T(false)) asserteq(T(endswith("abc", "")), T(true)) asserteq(T(endswith("abc", "ab")), T(false)) -- off by one asserteq(T(endswith("abc", "c")), T(true)) asserteq(T(endswith("abc", "bc")), T(true)) asserteq(T(endswith("abc", "abc")), T(true)) asserteq(T(endswith("abc", " abc")), T(false)) asserteq(T(endswith("abc", "a")), T(false)) asserteq(T(endswith("abc", ".")), T(false)) -- Lua pattern char asserteq(T(endswith("ab\0c", "b\0c")), T(true)) -- \0 asserteq(T(endswith("ab\0c", "b\0d")), T(false)) -- \0 asserteq(endswith('dollar.dot',{'.dot','.txt'}),true) asserteq(endswith('dollar.txt',{'.dot','.txt'}),true) asserteq(endswith('dollar.rtxt',{'.dot','.txt'}),false) -- join asserteq(stringx.join(' ', {1,2,3}), '1 2 3') -- splitlines asserteq(stringx.splitlines(''), {}) asserteq(stringx.splitlines('a'), {'a'}) asserteq(stringx.splitlines('\n'), {''}) asserteq(stringx.splitlines('\n\n'), {'', ''}) asserteq(stringx.splitlines('\r\r'), {'', ''}) asserteq(stringx.splitlines('\r\n'), {''}) asserteq(stringx.splitlines('ab\ncd\n'), {'ab', 'cd'}) asserteq(stringx.splitlines('ab\ncd\n', true), {'ab\n', 'cd\n'}) asserteq(stringx.splitlines('\nab\r\r\ncd\n', true), {'\n', 'ab\r', '\r\n', 'cd\n'}) -- expandtabs ---FIX[[raises error asserteq(T(stringx.expandtabs('',0)), T('')) asserteq(T(stringx.expandtabs('',1)), T('')) asserteq(T(stringx.expandtabs(' ',1)), T(' ')) -- expandtabs now works like Python's str.expandtabs (up to next tab stop) asserteq(T(stringx.expandtabs(' \t ')), T((' '):rep(1+8))) asserteq(T(stringx.expandtabs(' \t ',2)), T(' ')) --]] -- lfind asserteq(T(stringx.lfind('', '')), T(1)) asserteq(T(stringx.lfind('a', '')), T(1)) asserteq(T(stringx.lfind('ab', 'b')), T(2)) asserteq(T(stringx.lfind('abc', 'cd')), T(nil)) asserteq(T(stringx.lfind('abcbc', 'bc')), T(2)) asserteq(T(stringx.lfind('ab..cd', '.')), T(3)) -- pattern char asserteq(T(stringx.lfind('abcbcbbc', 'bc', 3)), T(4)) asserteq(T(stringx.lfind('abcbcbbc', 'bc', 3, 4)), T(nil)) asserteq(T(stringx.lfind('abcbcbbc', 'bc', 3, 5)), T(4)) asserteq(T(stringx.lfind('abcbcbbc', 'bc', nil, 5)), T(2)) -- rfind asserteq(T(stringx.rfind('', '')), T(1)) asserteq(T(stringx.rfind('ab', '')), T(3)) asserteq(T(stringx.rfind('abc', 'cd')), T(nil)) asserteq(T(stringx.rfind('abcbc', 'bc')), T(4)) asserteq(T(stringx.rfind('abcbcb', 'bc')), T(4)) asserteq(T(stringx.rfind('ab..cd', '.')), T(4)) -- pattern char asserteq(T(stringx.rfind('abcbcbbc', 'bc', 3)), T(7)) asserteq(T(stringx.rfind('abcbcbbc', 'bc', 3, 4)), T(nil)) asserteq(T(stringx.rfind('abcbcbbc', 'bc', 3, 5)), T(4)) asserteq(T(stringx.rfind('abcbcbbc', 'bc', nil, 5)), T(4)) asserteq(T(stringx.rfind('banana', 'ana')), T(4)) -- replace asserteq(T(stringx.replace('', '', '')), T('')) asserteq(T(stringx.replace(' ', '', '')), T(' ')) asserteq(T(stringx.replace(' ', '', ' ')), T(' ')) asserteq(T(stringx.replace(' ', ' ', '')), T('')) asserteq(T(stringx.replace('abcabcabc', 'bc', 'BC')), T('aBCaBCaBC')) asserteq(T(stringx.replace('abcabcabc', 'bc', 'BC', 1)), T('aBCabcabc')) asserteq(T(stringx.replace('abcabcabc', 'bc', 'BC', 0)), T('abcabcabc')) asserteq(T(stringx.replace('abc', 'd', 'e')), T('abc')) asserteq(T(stringx.replace('a.b', '.', '%d')), T('a%db')) -- split local split = stringx.split asserteq(split('', ''), {''}) asserteq(split('', 'z'), {}) --FIX:intended and specified behavior? asserteq(split('a', ''), {'a'}) --FIX:intended and specified behavior? asserteq(split('a', 'a'), {''}) -- stringx.split now follows the Python pattern, so it uses a substring, not a pattern. -- If you need to split on a pattern, use utils.split() -- asserteq(split('ab1cd23ef%d', '%d+'), {'ab', 'cd', 'ef%d'}) -- pattern chars -- note that leading space is ignored by the default asserteq(split(' 1 2 3 '),{'1','2','3'}) asserteq(split('a*bb*c*ddd','*'),{'a','bb','c','ddd'}) asserteq(split('dog:fred:bonzo:alice',':',3), {'dog','fred','bonzo:alice'}) asserteq(split('dog:fred:bonzo:alice:',':',3), {'dog','fred','bonzo:alice:'}) asserteq(split('///','/'),{'','','',''}) -- capitalize asserteq(T(stringx.capitalize('')), T('')) asserteq(T(stringx.capitalize('abC deF1')), T('Abc Def1')) -- Python behaviour -- count asserteq(T(stringx.count('', '')), T(0)) --infinite loop]] asserteq(T(stringx.count(' ', '')), T(2)) --infinite loop]] asserteq(T(stringx.count('a..c', '.')), T(2)) -- pattern chars asserteq(T(stringx.count('a1c', '%d')), T(0)) -- pattern chars asserteq(T(stringx.count('Anna Anna Anna', 'Anna')), T(3)) -- no overlap asserteq(T(stringx.count('banana', 'ana', false)), T(1)) -- no overlap asserteq(T(stringx.count('banana', 'ana', true)), T(2)) -- overlap -- ljust asserteq(T(stringx.ljust('', 0)), T('')) asserteq(T(stringx.ljust('', 2)), T(' ')) asserteq(T(stringx.ljust('ab', 3)), T('ab ')) asserteq(T(stringx.ljust('ab', 3, '%')), T('ab%')) asserteq(T(stringx.ljust('abcd', 3)), T('abcd')) -- agrees with Python -- rjust asserteq(T(stringx.rjust('', 0)), T('')) asserteq(T(stringx.rjust('', 2)), T(' ')) asserteq(T(stringx.rjust('ab', 3)), T(' ab')) asserteq(T(stringx.rjust('ab', 3, '%')), T('%ab')) asserteq(T(stringx.rjust('abcd', 3)), T('abcd')) -- agrees with Python -- center asserteq(T(stringx.center('', 0)), T('')) asserteq(T(stringx.center('', 1)), T(' ')) asserteq(T(stringx.center('', 2)), T(' ')) asserteq(T(stringx.center('a', 1)), T('a')) asserteq(T(stringx.center('a', 2)), T('a ')) asserteq(T(stringx.center('a', 3)), T(' a ')) -- ltrim -- http://snippets.luacode.org/sputnik.lua?p=snippets/trim_whitespace_from_string_76 local trim = stringx.lstrip asserteq(T(trim''), T'') asserteq(T(trim' '), T'') asserteq(T(trim' '), T'') asserteq(T(trim'a'), T'a') asserteq(T(trim' a'), T'a') asserteq(T(trim'a '), T'a ') asserteq(T(trim' a '), T'a ') asserteq(T(trim' a '), T'a ') asserteq(T(trim' ab cd '), T'ab cd ') asserteq(T(trim' \t\r\n\f\va\000b \r\t\n\f\v'), T'a\000b \r\t\n\f\v') -- more -- rtrim -- http://snippets.luacode.org/sputnik.lua?p=snippets/trim_whitespace_from_string_76 local trim = stringx.rstrip asserteq(T(trim''), T'') asserteq(T(trim' '), T'') asserteq(T(trim' '), T'') asserteq(T(trim'a'), T'a') asserteq(T(trim' a'), T' a') asserteq(T(trim'a '), T'a') asserteq(T(trim' a '), T' a') asserteq(T(trim' a '), T' a') asserteq(T(trim' ab cd '), T' ab cd') asserteq(T(trim' \t\r\n\f\va\000b \r\t\n\f\v'), T' \t\r\n\f\va\000b') -- more -- trim -- http://snippets.luacode.org/sputnik.lua?p=snippets/trim_whitespace_from_string_76 local trim = stringx.strip asserteq(T(trim''), T'') asserteq(T(trim' '), T'') asserteq(T(trim' '), T'') asserteq(T(trim'a'), T'a') asserteq(T(trim' a'), T'a') asserteq(T(trim'a '), T'a') asserteq(T(trim' a '), T'a') asserteq(T(trim' a '), T'a') asserteq(T(trim' ab cd '), T'ab cd') asserteq(T(trim' \t\r\n\f\va\000b \r\t\n\f\v'), T'a\000b') local long = 'a' .. string.rep(' ', 200000) .. 'a' asserteq(T(trim(long)), T(long)) -- more asserteq({stringx.splitv("hello dolly")}, {"hello", "dolly"}) -- partition -- as per str.partition in Python, delimiter must be non-empty; -- interpreted as a plain string --asserteq(T(stringx.partition('', '')), T('', '', '')) -- error]] --asserteq(T(stringx.partition('a', '')), T('', '', 'a')) --error]] asserteq(T(stringx.partition('a', 'a')), T('', 'a', '')) asserteq(T(stringx.partition('abc', 'b')), T('a', 'b', 'c')) asserteq(T(stringx.partition('abc', '.+')), T('abc','','')) asserteq(T(stringx.partition('a,b,c', ',')), T('a',',','b,c')) asserteq(T(stringx.partition('abc', '/')), T('abc', '', '')) -- rpartition asserteq(T(stringx.rpartition('a/b/c', '/')), T('a/b', '/', 'c')) asserteq(T(stringx.rpartition('abc', 'b')), T('a', 'b', 'c')) asserteq(T(stringx.rpartition('a', 'a')), T('', 'a', '')) asserteq(T(stringx.rpartition('abc', '/')), T('', '', 'abc')) -- at (works like s:sub(idx,idx), so negative indices allowed asserteq(T(stringx.at('a', 1)), T('a')) asserteq(T(stringx.at('ab', 2)), T('b')) asserteq(T(stringx.at('abcd', -1)), T('d')) asserteq(T(stringx.at('abcd', 10)), T('')) -- not found -- lines local function merge(it, ...) assert(select('#', ...) == 0) local ts = {} for val in it do ts[#ts+1] = val end return ts end asserteq(merge(stringx.lines('')), {''}) asserteq(merge(stringx.lines('ab')), {'ab'}) asserteq(merge(stringx.lines('ab\ncd')), {'ab', 'cd'}) asserteq(stringx.capitalize("hello world"), "Hello World") asserteq(stringx.title("hello world"), "Hello World") -- shorten -- The returned string is always equal or less to the given size. asserteq(T(stringx.shorten('', 0)), T'') asserteq(T(stringx.shorten('a', 1)), T'a') asserteq(T(stringx.shorten('ab', 1)), T'.') --FIX:ok? asserteq(T(stringx.shorten('abc', 3)), T'abc') asserteq(T(stringx.shorten('abcd', 3)), T'...') asserteq(T(stringx.shorten('abcde', 5)), T'abcde') asserteq(T(stringx.shorten('abcde', 4)), T'a...') asserteq(T(stringx.shorten('abcde', 3)), T'...') asserteq(T(stringx.shorten('abcde', 2)), T'..') asserteq(T(stringx.shorten('abcde', 0)), T'') asserteq(T(stringx.shorten('', 0, true)), T'') asserteq(T(stringx.shorten('a', 1, true)), T'a') asserteq(T(stringx.shorten('ab', 1, true)), T'.') asserteq(T(stringx.shorten('abcde', 5, true)), T'abcde') asserteq(T(stringx.shorten('abcde', 4, true)), T'...e') asserteq(T(stringx.shorten('abcde', 3, true)), T'...') asserteq(T(stringx.shorten('abcde', 2, true)), T'..') asserteq(T(stringx.shorten('abcde', 0, true)), T'') -- strip asserteq(stringx.strip(' hello '),'hello') asserteq(stringx.strip('--[hello] -- - ','-[] '),'hello') asserteq(stringx.rstrip('--[hello] -- - ','-[] '),'--[hello') asserteq(stringx.strip('hello'..((" "):rep(500))), "hello") -- local assert_str_round_trip = function(s) local qs = stringx.quote_string(s) local compiled, err = utils.load("return "..qs) if not compiled then print( ("stringx.quote_string assert failed: invalid string created: Received:\n%s\n\nCompiled to\n%s\n\nError:\t%s\n"): format(s, qs, err) ) error() else compiled = compiled() end if compiled ~= s then print("stringx.quote_string assert Failed: String compiled but did not round trip.") print("input string:\t\t",s, #s) print("compiled string:\t", compiled, #compiled) print("output string:\t\t",qs, #qs) error() else -- print("input string:\t\t",s) -- print("compiled string:\t", compiled) -- print("output string:\t\t",qs) end end assert_str_round_trip( "normal string with nothing weird.") assert_str_round_trip( "Long string quoted with escaped quote \\\" and a long string pattern match [==[ found near the end.") assert_str_round_trip( "Unescapped quote \" in the middle") assert_str_round_trip( "[[Embedded long quotes \\\". Escaped must stay! ]]") assert_str_round_trip( [[Long quoted string with a slash prior to quote \\\". ]]) assert_str_round_trip( "[[Completely normal\n long quote. ]]") assert_str_round_trip( "String with a newline\nending with a closing bracket]") assert_str_round_trip( "[[String with opening brackets ending with part of a long closing bracket]=") assert_str_round_trip( "\n[[Completely normal\n long quote. Except that we lead with a return! Tricky! ]]") assert_str_round_trip( '"balance [======[ doesn\'t ]====] mater when searching for embedded long-string quotes.') assert_str_round_trip( "Any\0 \t control character other than a return will be handled by the %q mechanism.") assert_str_round_trip( "This\tincludes\ttabs.") assert_str_round_trip( "But not returns.\n Returns are easier to see using long quotes.") assert_str_round_trip( "The \z escape does not trigger a control pattern, however.") assert_str_round_trip( "[==[If a string is long-quoted, escaped \\\" quotes have to stay! ]==]") assert_str_round_trip('"A quoted string looks like what?"') assert_str_round_trip( "'I think that it should be quoted, anyway.'") assert_str_round_trip( "[[Even if they're long quoted.]]") assert_str_round_trip( "]=]==]") assert_str_round_trip( "\"\\\"\\' pathalogical:starts with a quote ]\"\\']=]]==][[]]]=========]") assert_str_round_trip( "\\\"\\\"\\' pathalogical: quote is after this text with a quote ]\"\\']=]]==][[]]]=========]") assert_str_round_trip( "\\\"\\\"\\' pathalogical: quotes are all escaped. ]\\\"\\']=]]==][[]]]=========]") assert_str_round_trip( "") assert_str_round_trip( " ") assert_str_round_trip( "\n") --tricky. assert_str_round_trip( "\r") assert_str_round_trip( "\r\n") assert_str_round_trip( "\r1\n") assert_str_round_trip( "[[") assert_str_round_trip( "''") assert_str_round_trip( '""')