[Test] Remove legacy tokenizer tests

author Vsevolod Stakhov <vsevolod@highsecure.ru>

Fri, 24 Aug 2018 09:19:55 +0000 (10:19 +0100)

committer Vsevolod Stakhov <vsevolod@highsecure.ru>

Fri, 24 Aug 2018 09:19:55 +0000 (10:19 +0100)
author Vsevolod Stakhov <vsevolod@highsecure.ru>
Fri, 24 Aug 2018 09:19:55 +0000 (10:19 +0100)
committer Vsevolod Stakhov <vsevolod@highsecure.ru>
Fri, 24 Aug 2018 09:19:55 +0000 (10:19 +0100)
diff --git a/test/lua/unit/tokenizer.lua b/test/lua/unit/tokenizer.lua
index 16f8f18461a6722d3e009ebdd61e8f15fa4b68e4..fbf7ee3e73742b6f416063d73a9ecd871d68f796 100644
--- a/test/lua/unit/tokenizer.lua
+++ b/test/lua/unit/tokenizer.lua
@@ -33,40 +33,6 @@ context("Text tokenization test", function()
      end)
    end
  
-
-  cases = {
-    -- First token is bad
-    {"Lorem ipsum dolor sit amet, consectetur adipiscing elit. Integer mattis, nibh",
-     {"orem", "ipsum", "dolor", "sit", "amet", "consectetur", "adipiscing", "elit",
-      "Integer", "mattis", "nibh"
-     }
-    },
-    -- Unicode is broken
-    --{"Հետաքրքրվողների համար ոտորև ներկայացված",
-    --  {"Հետաքրքրվողների", "համար", "ոտորև", "ներկայացված"}
-    --},
-    {"", {}},
-    {",,,,,", {}},
-    {"word,,,,,word    ", {"ord", "word"}},
-    {"word", {"ord"}},
-    {",,,,word,,,", {"word"}}
-  }
-
-  for i,c in ipairs(cases) do
-    test("Tokenize simple text (legacy) " .. i, function()
-      local w = util.tokenize_text(c[1], {}, true)
-      if #c[2] == 0 then
-        assert_equal(#w, 0, "must not have tokens " .. c[1])
-      else
-        assert_not_nil(w, "must tokenize " .. c[1])
-
-        for i,wrd in ipairs(w) do
-          assert_equal(wrd, c[2][i])
-        end
-      end
-    end)
-  end
-
    cases = {
      {"word https://example.com/path word",
       {{5, 24}},
author	Vsevolod Stakhov <vsevolod@highsecure.ru>
	Fri, 24 Aug 2018 09:19:55 +0000 (10:19 +0100)
committer	Vsevolod Stakhov <vsevolod@highsecure.ru>
	Fri, 24 Aug 2018 09:19:55 +0000 (10:19 +0100)