github.com/shawnclovie/gopher-lua@v0.0.0-20200520092726-90b44ec0e2f2/_lua5.1-tests/pm.lua (about)

     -- Announce the start of the pattern-matching tests.
     1  print('testing pattern matching')
     2  
     -- Return the first substring of `s` that matches pattern `p`.
     -- Returns no value at all (not even nil) when the pattern does not match.
     function f(s, p)
       local first, last = string.find(s, p)
       if not first then return end
       return string.sub(s, first, last)
     end
     7  
     -- Return the span of `s` covered by the first match of pattern `p`.
     -- Unlike a plain find-and-sub, this works by wrapping `p` in two position
     -- captures, so the pattern itself is rewritten before matching.
     --   s: subject string
     --   p: Lua pattern; may start with '^', end with '$' and use %1..%8
     -- Raises an error when `p` does not match `s`.
     function f1(s, p)
       -- A position capture is about to be inserted in front of every existing
       -- capture, so each back-reference %N has to become %(N+1).
       p = string.gsub(p, "%%([0-9])", function (digit)
         return "%" .. (tonumber(digit) + 1)
       end)
       -- Position capture at the start (kept after a leading '^' anchor).
       p = string.gsub(p, "^(^?)", "%1()", 1)
       -- Position capture at the end (kept before a trailing '$' anchor).
       p = string.gsub(p, "($?)$", "()%1", 1)
       local t = {string.match(s, p)}
       if t[1] == nil then
         -- Fail with a readable message instead of an arithmetic-on-nil error.
         error("f1: pattern did not match", 2)
       end
       -- t[1] is the start position; t[#t] is one past the end of the match.
       return string.sub(s, t[1], t[#t] - 1)
     end
    15  
    -- string.find with magic-free patterns: empty patterns, subjects and
    -- patterns containing embedded "\0" bytes, explicit start positions
    -- (third argument) and the '^' anchor.
    16  a,b = string.find('', '')    -- empty patterns are tricky
    17  assert(a == 1 and b == 0);
    18  a,b = string.find('alo', '')
    19  assert(a == 1 and b == 0)
    20  a,b = string.find('a\0o a\0o a\0o', 'a', 1)   -- first position
    21  assert(a == 1 and b == 1)
    22  a,b = string.find('a\0o a\0o a\0o', 'a\0o', 2)   -- starts in the middle
    23  assert(a == 5 and b == 7)
    24  a,b = string.find('a\0o a\0o a\0o', 'a\0o', 9)   -- starts in the middle
    25  assert(a == 9 and b == 11)
    26  a,b = string.find('a\0a\0a\0a\0\0ab', '\0ab', 2);  -- finds at the end
    27  assert(a == 9 and b == 11);
    28  a,b = string.find('a\0a\0a\0a\0\0ab', 'b')    -- last position
    29  assert(a == 11 and b == 11)
    30  assert(string.find('a\0a\0a\0a\0\0ab', 'b\0') == nil)   -- check ending
    31  assert(string.find('', '\0') == nil)
    -- Only the first result (start index) of string.find is compared below.
    32  assert(string.find('alo123alo', '12') == 4)
    33  assert(string.find('alo123alo', '^12') == nil)
    34  
    -- f returns the first match of a pattern (nil when there is none).
    -- These cases cover character classes, the repetition operators
    -- '*', '+', '-' and '?', the anchors '^' and '$', and bracket sets.
    35  assert(f('aloALO', '%l*') == 'alo')
    36  assert(f('aLo_ALO', '%a*') == 'aLo')
    37  
    -- Greedy repetitions ('*' allows zero occurrences, '+' needs at least one).
    38  assert(f('aaab', 'a*') == 'aaa');
    39  assert(f('aaa', '^.*$') == 'aaa');
    40  assert(f('aaa', 'b*') == '');
    41  assert(f('aaa', 'ab*a') == 'aa')
    42  assert(f('aba', 'ab*a') == 'aba')
    43  assert(f('aaab', 'a+') == 'aaa')
    44  assert(f('aaa', '^.+$') == 'aaa')
    45  assert(f('aaa', 'b+') == nil)
    46  assert(f('aaa', 'ab+a') == nil)
    47  assert(f('aba', 'ab+a') == 'aba')
    -- '$' anchors only as the last pattern character; elsewhere it is literal.
    48  assert(f('a$a', '.$') == 'a')
    49  assert(f('a$a', '.%$') == 'a$')
    50  assert(f('a$a', '.$.') == 'a$a')
    51  assert(f('a$a', '$$') == nil)
    52  assert(f('a$b', 'a$') == nil)
    53  assert(f('a$a', '$') == '')
    54  assert(f('', 'b*') == '')
    55  assert(f('aaa', 'bb*') == nil)
    -- '-' is the shortest-match repetition; '*' is the longest-match one.
    56  assert(f('aaab', 'a-') == '')
    57  assert(f('aaa', '^.-$') == 'aaa')
    58  assert(f('aabaaabaaabaaaba', 'b.*b') == 'baaabaaabaaab')
    59  assert(f('aabaaabaaabaaaba', 'b.-b') == 'baaab')
    60  assert(f('alo xo', '.o$') == 'xo')
    61  assert(f(' \n isto é assim', '%S%S*') == 'isto')
    62  assert(f(' \n isto é assim', '%S*$') == 'assim')
    63  assert(f(' \n isto é assim', '[a-z]*$') == 'assim')
    64  assert(f('um caracter ? extra', '[^%sa-z]') == '?')
    -- '?' makes the preceding single character optional.
    65  assert(f('', 'a?') == '')
    66  assert(f('á', 'á?') == 'á')
    67  assert(f('ábl', 'á?b?l?') == 'ábl')
    68  assert(f('  ábl', 'á?b?l?') == '')
    69  assert(f('aa', '^aa?a?a') == 'aa')
    -- NOTE(review): '[^%]]' matches exactly one byte, so the assert below
    -- presumes 'á' is stored as a single byte (e.g. a Latin-1 encoded source
    -- file) -- confirm the file encoding before relying on it.
    70  -- assert(f(']]]áb', '[^]]') == 'á')
    71  assert(f(']]]áb', '[^%]]') == 'á')
    72  assert(f("0alo alo", "%x*") == "0a")
    73  assert(f("alo alo", "%C+") == "alo alo")
    74  print('+')
    75  
    -- Back-references: %N must match the same text that capture N matched.
    -- f1 returns the whole span covered by the match.
    76  assert(f1('alo alx 123 b\0o b\0o', '(..*) %1') == "b\0o b\0o")
    77  assert(f1('axz123= 4= 4 34', '(.+)=(.*)=%2 %1') == '3= 4= 4 3')
    78  assert(f1('=======', '^(=*)=%1$') == '=======')
    -- Here the subject cannot be split as X .. '=' .. X, so there is no match.
    79  assert(string.match('==========', '^([=]*)=%1$') == nil)
    80  
    -- Recursive form: returns the integers i, i+1, ..., j as multiple values,
    -- and nothing at all when i > j.
    -- NOTE: the iterative `range` declared right after this one shadows it.
    local function range (i, j)
      if not (i <= j) then return end
      return i, range(i+1, j)
    end
    86  
    -- Iterative form: returns the integers i, i+1, ..., j as multiple values,
    -- and nothing at all when i > j.
    local function range (i, j)
      -- `unpack` is a global in Lua 5.1 and lives in `table` from 5.2 on.
      local unpack = unpack or table.unpack
      local ret = {}
      -- No empty statement after `do`: the reference Lua 5.1 parser rejects it.
      for k = i, j do
        ret[#ret + 1] = k
      end
      return unpack(ret)
    end
    92  
    -- abc is built from the character codes 0..255 in ascending order, so it
    -- contains every byte value exactly once; strset scans it below.
    93  local abc = string.char(range(0, 255));
    94  
    95  assert(string.len(abc) == 256)
    96  
    -- Concatenate, in order of appearance, every match of pattern `p` found
    -- in the string `abc` and return the resulting string.
    function strset (p)
      local collected = ''
      local function collect (c)
        -- Returning nothing leaves the scanned text untouched.
        collected = collected .. c
      end
      string.gsub(abc, p, collect)
      return collected
    end;
   102  
   -- Bracket sets checked through strset: byte ranges, escaped magic
   -- characters inside [...], complemented classes and %z / %Z (zero byte).
   103  assert(string.len(strset('[\200-\210]')) == 11)
   104  
   105  assert(strset('[a-z]') == "abcdefghijklmnopqrstuvwxyz")
   106  assert(strset('[a-z%d]') == strset('[%da-uu-z]'))
   107  -- assert(strset('[a-]') == "-a")
   108  assert(strset('[a%-]') == "-a")
   109  assert(strset('[^%W]') == strset('[%w]'))
   110  -- assert(strset('[]%%]') == '%]')
   111  assert(strset('[%]%%]') == '%]')
   112  assert(strset('[a%-z]') == '-az')
   113  assert(strset('[%^%[%-a%]%-b]') == '-[]^ab')
   -- %Z is every byte except "\0"; '.' is every byte including "\0".
   114  assert(strset('%Z') == strset('[\1-\255]'))
   115  assert(strset('.') == strset('[\1-\255%z]'))
   116  print('+');
   117  
   -- string.match captures: a capture may be empty, nested captures are
   -- numbered by their opening parenthesis, and '()' captures a position.
   118  assert(string.match("alo xyzK", "(%w+)K") == "xyz")
   119  assert(string.match("254 K", "(%d*)K") == "")
   120  assert(string.match("alo ", "(%w*)$") == "")
   121  assert(string.match("alo ", "(%w+)$") == nil)
   122  assert(string.find("(álo)", "%(á") == 1)
   -- NOTE(review): c == 'â' comes from a one-byte '(.)' capture, so this
   -- presumes a single-byte source encoding -- confirm.
   123  local a, b, c, d, e = string.match("âlo alo", "^(((.).).* (%w*))$")
   124  assert(a == 'âlo alo' and b == 'âl' and c == 'â' and d == 'alo' and e == nil)
   125  a, b, c, d  = string.match('0123456789', '(.+(.?)())')
   126  assert(a == '0123456789' and b == '' and c == 11 and d == nil)
   127  print('+')
   128  
   -- string.gsub with string replacements: %0 is the whole match, %1..%9 are
   -- captures, the optional 4th argument limits the number of substitutions.
   -- Where only one value is compared, it is gsub's first result (the string).
   129  assert(string.gsub('ülo ülo', 'ü', 'x') == 'xlo xlo')
   130  assert(string.gsub('alo úlo  ', ' +$', '') == 'alo úlo')  -- trim
   131  assert(string.gsub('  alo alo  ', '^%s*(.-)%s*$', '%1') == 'alo alo')  -- double trim
   132  assert(string.gsub('alo  alo  \n 123\n ', '%s+', ' ') == 'alo alo 123 ')
   -- NOTE(review): b == 5 holds only if the literal below is five bytes long
   -- (single-byte source encoding) -- confirm.
   133  t = "abç d"
   134  a, b = string.gsub(t, '(.)', '%1@')
   135  assert('@'..a == string.gsub(t, '', '@') and b == 5)
   136  a, b = string.gsub('abçd', '(.)', '%0@', 2)
   137  assert(a == 'a@b@çd' and b == 2)
   138  assert(string.gsub('alo alo', '()[al]', '%1') == '12o 56o')
   139  assert(string.gsub("abc=xyz", "(%w*)(%p)(%w+)", "%3%2%1-%0") ==
   140                "xyz=abc-abc=xyz")
   -- With no explicit capture in the pattern, %1 stands for the whole match.
   141  assert(string.gsub("abc", "%w", "%1%0") == "aabbcc")
   142  assert(string.gsub("abc", "%w+", "%0%1") == "abcabc")
   143  assert(string.gsub('áéí', '$', '\0óú') == 'áéí\0óú')
   -- Anchors alone match once, even on an empty subject.
   144  assert(string.gsub('', '^', 'r') == 'r')
   145  assert(string.gsub('', '$', 'r') == 'r')
   146  print('+')
   147  
   -- A function replacement receives the capture and its result is inserted.
   148  assert(string.gsub("um (dois) tres (quatro)", "(%(%w+%))", string.upper) ==
   149              "um (DOIS) tres (QUATRO)")
   150  
   -- gsub hands both captures (name, value) to the callback, which stores
   -- each pair as a global variable through rawset on _G.
   do
     local function setglobal (name, value)
       rawset(_G, name, value)
     end
     string.gsub("a=roberto,roberto=a", "(%w+)=(%w%w*)", setglobal)
     assert(_G.a == "roberto" and _G.roberto == "a")
   end
   156  
   -- Redefines the global f: replace every character of `a` with `b`.
   -- Returns both gsub results: the new string and the substitution count.
   function f(a,b)
     local replaced, count = string.gsub(a, '.', b)
     return replaced, count
   end
   -- For each |text|repl| group the callback f replaces every character of
   -- text with repl; gsub uses f's first result as the replacement.
   158  assert(string.gsub("trocar tudo em |teste|b| é |beleza|al|", "|([^|]*)|([^|]*)|", f) ==
   159              "trocar tudo em bbbbb é alalalalalal")
   160  
   -- Compile the chunk `s` with loadstring, run it, and return its first
   -- result; returns "" when that result is nil or false.
   local function dostring (s)
     local chunk = loadstring(s)
     local result = chunk()
     return result or ""
   end
   -- Each $...$ span is run as Lua code by dostring and replaced with its
   -- result. The leading '$' of the pattern is not at the end, so it is a
   -- literal; the closing one is escaped as %$.
   162  assert(string.gsub("alo $a=1$ novamente $return a$", "$([^$]*)%$", dostring) ==
   163              "alo  novamente 1")
   164  
   -- The first span runs a gsub inside the gsub callback and sets global x.
   165  x = string.gsub("$x=string.gsub('alo', '.', string.upper)$ assim vai para $return x$",
   166           "$([^$]*)%$", dostring)
   167  assert(x == ' assim vai para ALO')
   168  
   -- Position captures around each word: a is the word's start index and b is
   -- one past its end, so b-a is the word length. The callback returns
   -- nothing, so the subject comes back unchanged (s == r).
   169  t = {}
   170  s = 'a alo jose  joao'
   171  r = string.gsub(s, '()(%w+)()', function (a,w,b)
   172        assert(string.len(w) == b-a);
   173        t[a] = b-a;
   174      end)
   175  assert(s == r and t[1] == 1 and t[3] == 3 and t[7] == 4 and t[13] == 4)
   176  
   177  
   -- Return true when every '(' and ')' in `s` belongs to a balanced pair.
   function isbalanced (s)
     -- Remove all balanced (...) groups; any parenthesis left is unmatched.
     local stripped = string.gsub(s, "%b()", "")
     local leftover = string.find(stripped, "[()]")
     return leftover == nil
   end
   181  
   -- %b() on subjects containing "\0" bytes, and %b with identical opening
   -- and closing delimiters ('').
   182  assert(isbalanced("(9 ((8))(\0) 7) \0\0 a b ()(c)() a"))
   183  assert(not isbalanced("(9 ((8) 7) a b (\0 c) a"))
   184  assert(string.gsub("alo 'oi' alo", "%b''", '"') == 'alo " alo')
   185  
   186  
   -- Function replacements that keep state in t: t.n counts the calls.
   -- Here each call returns the next list entry as the replacement.
   187  local t = {"apple", "orange", "lime"; n=0}
   188  assert(string.gsub("x and x and x", "x", function () t.n=t.n+1; return t[t.n] end)
   189          == "apple and orange and lime")
   190  
   -- The callback only records each word; the gsub result is discarded.
   191  t = {n=0}
   192  string.gsub("first second word", "%w%w*", function (w) t.n=t.n+1; t[t.n] = w end)
   193  assert(t[1] == "first" and t[2] == "second" and t[3] == "word" and t.n == 3)
   194  
   -- With a limit of 2 only the first two words reach the callback, and since
   -- it returns nothing the subject is returned unchanged.
   195  t = {n=0}
   196  assert(string.gsub("first second word", "%w+",
   197           function (w) t.n=t.n+1; t[t.n] = w end, 2) == "first second word")
   198  assert(t[1] == "first" and t[2] == "second" and t[3] == nil)
   199  
   -- Each call below must raise an error (pcall returns false): unfinished
   -- capture, unmatched ')', a replacement or pattern that refers to a capture
   -- which does not exist or is still open, and %0 used inside a pattern.
   200  assert(not pcall(string.gsub, "alo", "(.", print))
   201  assert(not pcall(string.gsub, "alo", ".)", print))
   202  assert(not pcall(string.gsub, "alo", "(.", {}))
   203  assert(not pcall(string.gsub, "alo", "(.)", "%2"))
   204  assert(not pcall(string.gsub, "alo", "(%1)", "a"))
   205  assert(not pcall(string.gsub, "alo", "(%0)", "a"))
   206  
   207  -- big strings
   -- A 300000-character subject; both the greedy 'a*' and the lazy 'a-' forms
   -- must get through the whole string, and the trailing 'b' must make the
   -- second pattern fail.
   208  local a = string.rep('a', 300000)
   209  assert(string.find(a, '^a*.?$'))
   210  assert(not string.find(a, '^a*.?b$'))
   211  assert(string.find(a, '^a-.?$'))
   212  
   -- deep nest of gsubs
   -- Reverse `s` by moving its first character behind the recursively
   -- reversed remainder; every recursion level runs its own gsub.
   -- Returns both gsub results (the reversed string and the match count).
   function rev (s)
     local function swap (head, tail)
       return rev(tail) .. head
     end
     return string.gsub(s, "(.)(.+)", swap)
   end
   217  
   -- Reversing twice must give back the original 60-character string.
   218  local x = string.rep('012345', 10)
   219  assert(rev(rev(x)) == x)
   220  
   221  
   222  -- gsub with tables
   -- The table is indexed with the first capture (or the whole match when the
   -- pattern has none); a missing or false entry keeps the original text.
   223  assert(string.gsub("alo alo", ".", {}) == "alo alo")
   224  assert(string.gsub("alo alo", "(.)", {a="AA", l=""}) == "AAo AAo")
   225  assert(string.gsub("alo alo", "(.).", {a="AA", l="K"}) == "AAo AAo")
   226  assert(string.gsub("alo alo", "((.)(.?))", {al="AA", o=false}) == "AAo AAo")
   227  
   -- Position captures index the array part; number values are inserted as text.
   228  assert(string.gsub("alo alo", "().", {2,5,6}) == "256 alo")
   229  
   -- The lookup goes through the __index metamethod of the table.
   230  t = {}; setmetatable(t, {__index = function (t,s) return string.upper(s) end})
   231  assert(string.gsub("a alo b hi", "%w%w+", t) == "a ALO b HI")
   232  
   233  
   234  -- tests for gmatch
   -- string.gfind is expected to be the very same function as string.gmatch.
   235  assert(string.gfind == string.gmatch)
   -- An empty position capture matches once at every position 1..6 of 'abcde'.
   236  local a = 0
   237  for i in string.gmatch('abcde', '()') do assert(i == a+1); a=i end
   238  assert(a==6)
   239  
   -- Collect the words of the subject in order.
   240  t = {n=0}
   241  for w in string.gmatch("first second word", "%w+") do
   242        t.n=t.n+1; t[t.n] = w
   243  end
   244  assert(t[1] == "first" and t[2] == "second" and t[3] == "word")
   245  
   -- "()(.)%2" finds doubled characters; t lists the expected start positions
   -- and must be empty once the loop has consumed them all.
   246  t = {3, 6, 9}
   247  for i in string.gmatch ("xuxx uu ppar r", "()(.)%2") do
   248    assert(i == table.remove(t, 1))
   249  end
   250  assert(table.getn(t) == 0)
   251  
   -- Two captures per match: "left = right" pairs. Keys and values are digit
   -- strings, so the arithmetic below relies on string-to-number coercion.
   252  t = {}
   253  for i,j in string.gmatch("13 14 10 = 11, 15= 16, 22=23", "(%d+)%s*=%s*(%d+)") do
   254    t[i] = j
   255  end
   256  a = 0
   257  for k,v in pairs(t) do assert(k+1 == v+0); a=a+1 end
   258  assert(a == 3)
   259  
   260  
   261  -- tests for `%f' (`frontiers')
   262  
   263  -- assert(string.gsub("aaa aa a aaa a", "%f[%w]a", "x") == "xaa xa x xaa x")
   264  -- assert(string.gsub("[[]] [][] [[[[", "%f[[].", "x") == "x[]] x]x] x[[[")
   265  -- assert(string.gsub("01abc45de3", "%f[%d]", ".") == ".01abc.45de.3")
   266  -- assert(string.gsub("01abc45 de3x", "%f[%D]%w", ".") == "01.bc45 de3.")
   267  -- assert(string.gsub("function", "%f[\1-\255]%w", ".") == ".unction")
   268  -- assert(string.gsub("function", "%f[^\1-\255]", ".") == "function.")
   269  -- 
   270  -- local i, e = string.find(" alo aalo allo", "%f[%S].-%f[%s].-%f[%S]")
   271  -- assert(i == 2 and e == 5)
   272  -- local k = string.match(" alo aalo allo", "%f[%S](.-%f[%s].-%f[%S])")
   273  -- assert(k == 'alo ')
   274  -- 
   275  -- local a = {1, 5, 9, 14, 17,}
   276  -- for k in string.gmatch("alo alo th02 is 1hat", "()%f[%w%d]") do
   277  --   assert(table.remove(a, 1) == k)
   278  -- end
   279  -- assert(table.getn(a) == 0)
   280  
   281  
   -- Reached only if no assert above raised an error.
   282  print('OK')