koreader/spec/unit/util_spec.lua

describe("util module", function()
    local DataStorage, util
    -- Suite-level fixture: loads the shared spec bootstrap and then binds the
    -- two modules used by the tests below to the locals declared above.
    -- NOTE(review): "commonrequire" is presumably what makes the following
    -- require() calls resolvable — confirm before reordering these lines.
    setup(function()
        require("commonrequire")
        DataStorage = require("datastorage")
        util = require("util")
    end)

    it("should strip punctuation marks around word", function()
        -- Each entry is { expected, input }; the entries are checked in order.
        local cases = {
            { "hello world", "\"hello world\"" },
            { "hello world", "\"hello world?\"" },
            { "hello, world", "\"hello, world?\"" },
            { "你好", "“你好“" },
            { "你好", "“你好?“" },
            { "", "" },
        }
        for _, case in ipairs(cases) do
            assert.is_equal(case[1], util.stripPunctuation(case[2]))
        end
        -- A nil input must come back as nil rather than raise.
        assert.is_nil(util.stripPunctuation(nil))
    end)

    describe("gsplit()", function()
        it("should split string with patterns", function()
            local pieces = {}
            for piece in util.gsplit("Hello world, welcome to KOReader!", "%s+", false) do
                pieces[#pieces + 1] = piece
            end
            assert.are_same({"Hello", "world,", "welcome", "to", "KOReader!"}, pieces)
        end)
        it("should split command line arguments with quotation", function()
            local command = "./sdcv -nj \"words\" \"a lot\" 'more or less' --data-dir=dict"
            local expected = {"./sdcv", "-nj", "words", "a lot", "more or less", "--data-dir=dict"}
            local argv = {}
            -- Three nested passes over the command line: quoted runs first,
            -- then leading unquoted tokens, then the quote characters
            -- themselves. Whatever survives trimming is an argument.
            -- NOTE(review): the third gsplit argument presumably controls
            -- whether the matched delimiter is yielded too — confirm in util.gsplit.
            for outer in util.gsplit(command, "[\"'].-[\"']", true) do
                for middle in util.gsplit(outer, "^[^\"'].-%s+", true) do
                    for inner in util.gsplit(middle, "[\"']", false) do
                        local candidate = util.trim(inner)
                        if candidate ~= "" then
                            argv[#argv + 1] = candidate
                        end
                    end
                end
            end
            assert.are_same(expected, argv)
        end)
        it("should split string with dashes", function()
            local pieces = {}
            for piece in util.gsplit("a-b-c-d", "-", false) do
                pieces[#pieces + 1] = piece
            end
            assert.are_same({"a", "b", "c", "d"}, pieces)
        end)
        it("should split string with dashes with final dash", function()
            -- The trailing delimiter must not produce an extra empty entry.
            local pieces = {}
            for piece in util.gsplit("a-b-c-d-", "-", false) do
                pieces[#pieces + 1] = piece
            end
            assert.are_same({"a", "b", "c", "d"}, pieces)
        end)
    end)

    describe("splitToWords()", function()
        it("should split line into words", function()
            -- Runs of separators (spaces, punctuation) are kept as their own entries.
            local expected = { "one", " ", "two", ",", "three", "  ", "four", " . ", "five" }
            local actual = util.splitToWords("one two,three  four . five")
            assert.are_same(expected, actual)
        end)
        it("should split ancient greek words", function()
            local expected = { "Λαρισαῖος", " ", "Λευκοθέα", " ", "Λιγυαστάδης", "." }
            local actual = util.splitToWords("Λαρισαῖος Λευκοθέα Λιγυαστάδης.")
            assert.are_same(expected, actual)
        end)
        it("should split Chinese words", function()
            -- Every CJK character, including the closing full stop, is its own entry.
            local expected = {
                "彩","虹","是","通","过","太","阳","光","的","折","射","引","起","的","。",
            }
            local actual = util.splitToWords("彩虹是通过太阳光的折射引起的。")
            assert.are_same(expected, actual)
        end)
        it("should split Japanese words", function()
            local expected = {
                "色","は","匂","へ","ど","散","り","ぬ","る","を",
                "我","が","世","誰","ぞ","常","な","ら","む",
            }
            local actual = util.splitToWords("色は匂へど散りぬるを我が世誰ぞ常ならむ")
            assert.are_same(expected, actual)
        end)
        it("should split Korean words", function()
            -- Splitting Korean on spaces would technically be correct, but it
            -- is handled like any other CJK text: one entry per character.
            local expected = {
                "대","한","민","국","의"," ","국","기","는"," ",
                "대","한","민","국"," ","국","기","법","에"," ",
                "따","라"," ","태","극","기",
            }
            local actual = util.splitToWords("대한민국의 국기는 대한민국 국기법에 따라 태극기")
            assert.are_same(expected, actual)
        end)
        it("should split words of multilingual text", function()
            -- The Latin run stays one word; each CJK character is split off.
            local expected = {"BBC", "纪", "录", "片"}
            local actual = util.splitToWords("BBC纪录片")
            assert.are_same(expected, actual)
        end)
    end)

    describe("splitToChars()", function()
        -- Shared driver for every test in this group (previously copy-pasted
        -- into each one).
        -- Splits `text` with util.splitToChars() and regroups the characters
        -- into chunks: a chunk is closed right after each character for which
        -- util.isSplittable() returns a truthy value, and any characters left
        -- after the last split point form the final chunk.
        -- @param text       string to split
        -- @param with_next  when truthy, pass the following character as the
        --                   2nd argument of util.isSplittable() (nil otherwise)
        -- @param with_prev  when truthy, pass the preceding character as the
        --                   3rd argument of util.isSplittable() (nil otherwise)
        -- @return array of chunk strings
        local function regroupChars(text, with_next, with_prev)
            local chars = util.splitToChars(text)
            local chunks = {}
            local current = ""
            for i = 1, #chars do
                local c = chars[i]
                local next_c, prev_c
                -- Neighbours are only looked up inside the array bounds.
                if with_next and i < #chars then next_c = chars[i + 1] end
                if with_prev and i > 1 then prev_c = chars[i - 1] end
                current = current .. c
                if util.isSplittable(c, next_c, prev_c) then
                    table.insert(chunks, current)
                    current = ""
                end
            end
            -- Flush whatever followed the last split point.
            if current ~= "" then
                table.insert(chunks, current)
            end
            return chunks
        end

        it("should split text to line - unicode", function()
            local text = "Pójdźże, chmurność glück schließen Štěstí neštěstí. Uñas gavilán"
            assert.are_same({
                "Pójdźże, ",
                "chmurność ",
                "glück ",
                "schließen ",
                "Štěstí ",
                "neštěstí. ",
                "Uñas ",
                "gavilán",
            }, regroupChars(text))
        end)
        it("should split text to line - CJK Chinese", function()
            local text = "彩虹是通过太阳光的折射引起的。"
            assert.are_same({
                "彩","虹","是","通","过","太","阳","光","的","折","射","引","起","的","。",
            }, regroupChars(text))
        end)
        it("should split text to line - CJK Japanese", function()
            local text = "色は匂へど散りぬるを我が世誰ぞ常ならむ"
            assert.are_same({
                "色","は","匂","へ","ど","散","り","ぬ","る","を",
                "我","が","世","誰","ぞ","常","な","ら","む",
            }, regroupChars(text))
        end)
        it("should split text to line - CJK Korean", function()
            local text = "대한민국의 국기는 대한민국 국기법에 따라 태극기"
            assert.are_same({
                "대","한","민","국","의"," ","국","기","는"," ",
                "대","한","민","국"," ","국","기","법","에"," ",
                "따","라"," ","태","극","기",
            }, regroupChars(text))
        end)
        it("should split text to line - mixed CJK and latin", function()
            local text = "This is Russian: русский язык, Chinese: 汉语, Japanese: 日本語、 Korean: 한국어。"
            assert.are_same({
                "This ", "is ",
                "Russian: ", "русский ", "язык, ",
                "Chinese: ", "汉","语",", ",
                "Japanese: ", "日","本","語","、", " ",
                "Korean: ", "한","국","어","。",
            }, regroupChars(text))
        end)
        it("should split text to line with next_c - unicode", function()
            local text = "Ce test : 1) est très simple ; 2 ) simple comme ( 2/2 ) > 50 % ? ok."
            assert.are_same({
                "Ce ",
                "test : ",
                "1) ",
                "est ",
                "très ",
                "simple ; ",
                "2 ) ",
                "simple ",
                "comme ",
                "( ",
                "2/2 ) > ",
                "50 % ? ",
                "ok."
            }, regroupChars(text, true))
        end)
        it("should split text to line with next_c and prev_c - unicode", function()
            local text = "Ce test : 1) est « très simple » ; 2 ) simple comme ( 2/2 ) > 50 % ? ok."
            assert.are_same({
                "Ce ",
                "test : ",
                "1) ",
                "est ",
                "« très ",
                "simple » ; ",
                "2 ) ",
                "simple ",
                "comme ",
                "( 2/2 ) > 50 % ? ",
                "ok."
            }, regroupChars(text, true, true))
        end)
    end)

    it("should split file path and name", function()
        -- Checks both return values of util.splitFilePathName(full).
        -- luassert takes (expected, actual); keeping that order makes the
        -- failure output label the two values correctly.
        local function check(full, expected_path, expected_name)
            local path, name = util.splitFilePathName(full)
            assert.are_same(expected_path, path)
            assert.are_same(expected_name, name)
        end
        check("/a/b/c.txt", "/a/b/", "c.txt")
        check("/a/b////c.txt", "/a/b////", "c.txt")
        check("/a/b/", "/a/b/", "")
        check("c.txt", "", "c.txt")
        check("", "", "")
        check(nil, "", "")
        check("a/b", "a/", "b")
        check("/b", "/", "b")
        -- Only the first return value is under test here. The extra
        -- parentheses truncate the call to one value so the file name is not
        -- forwarded to the assertion as its failure-message argument.
        assert.are_same("/a/b/", (util.splitFilePathName("/a/b/c.txt")))
    end)

    it("should split file name and suffix", function()
        -- Checks both return values of util.splitFileNameSuffix(full).
        -- luassert takes (expected, actual); keeping that order makes the
        -- failure output label the two values correctly.
        local function check(full, expected_name, expected_suffix)
            local name, suffix = util.splitFileNameSuffix(full)
            assert.are_same(expected_name, name)
            assert.are_same(expected_suffix, suffix)
        end
        check("a.txt", "a", "txt")
        check("/a/b.txt", "/a/b", "txt")
        check("a", "a", "")
        check("/a/b", "/a/b", "")
        check("/a/", "/a/", "")
        check("/a/.txt", "/a/", "txt")
        check(nil, "", "")
        check("", "", "")
        -- Only the first return value is under test here. The extra
        -- parentheses truncate the call to one value so the suffix is not
        -- forwarded to the assertion as its failure-message argument.
        assert.are_same("a", (util.splitFileNameSuffix("a.txt")))
    end)

    describe("getSafeFileName()", function()
        it("should replace unsafe characters", function()
            -- Three pipe characters in, three underscores out.
            local unsafe, expected = "|||", "___"
            assert.is_equal(expected, util.getSafeFilename(unsafe))
        end)
        it("should truncate any characters beyond the limit", function()
            assert.is_equal("aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", util.getSafeFilename("aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa"))
        end)
        it("should truncate extension beyond the limit", function()
            assert.is_equal("aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", util.getSafeFilename("aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa.aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa"))
        end)
        it("should strip HTML from the filename", function()
            -- The surrounding <span> tags must be dropped, leaving only the text.
            local markup, expected = "<span>lalala</span>", "lalala"
            assert.is_equal(expected, util.getSafeFilename(markup))
        end)
    end)

    describe("partialMD5()", function()
        -- luassert takes (expected, actual): the known digest goes first so a
        -- failure reports the computed hash as the unexpected value.
        it("should calculate partial md5 hash of pdf file", function()
            assert.is_equal("41cce710f34e5ec21315e19c99821415", util.partialMD5("spec/front/unit/data/tall.pdf"))
        end)
        it("should calculate partial md5 hash of epub file", function()
            assert.is_equal("59d481d168cca6267322f150c5f6a2a3", util.partialMD5("spec/front/unit/data/leaves.epub"))
        end)
    end)

    describe("fixUtf8()", function()
        -- Input shared by the three replacement tests: \128 on its own and
        -- \194 followed by \127 are the two invalid sequences in it.
        it("should replace invalid UTF-8 characters with an underscore", function()
            assert.is_equal("\127 _ _\127 ", util.fixUtf8("\127 \128 \194\127 ", "_"))
        end)

        it("should replace invalid UTF-8 characters with multiple characters", function()
            assert.is_equal("\127 __ __\127 ", util.fixUtf8("\127 \128 \194\127 ", "__"))
        end)

        it("should replace invalid UTF-8 characters with empty char", function()
            assert.is_equal("\127  \127 ", util.fixUtf8("\127 \128 \194\127 ", ""))
        end)

        it("should not replace valid UTF-8 U+FFFD character", function()
            -- U+FFFD (the replacement character) is itself valid UTF-8: bytes
            -- EF BF BD. It is written with decimal escapes so the test does not
            -- depend on how this file is encoded or displayed.
            local text = "\239\191\189valid \239\191\189 char \239\191\189"
            assert.is_equal(text, util.fixUtf8(text, "__"))
        end)

        it("should not replace valid UTF-8 characters", function()
            -- \244\129\130\190 is a four-byte sequence.
            assert.is_equal("\99 \244\129\130\190", util.fixUtf8("\99 \244\129\130\190", "_"))
        end)

        it("should not replace valid UTF-8 characters Polish chars", function()
            assert.is_equal("Pójdźże źółć", util.fixUtf8("Pójdźże źółć", "_"))
        end)

        it("should not replace valid UTF-8 characters German chars", function()
            assert.is_equal("glück schließen", util.fixUtf8("glück schließen", "_"))
        end)
    end)

    describe("splitToArray()", function()
        it("should split input to array", function()
            -- With the third argument true, the empty field between the two
            -- consecutive tabs is kept.
            local input = "100\tabc\t\tdef\tghi200\t"
            local expected = {"100", "abc", "", "def", "ghi200"}
            assert.are_same(expected, util.splitToArray(input, "\t", true))
        end)

        it("should also split input to array", function()
            -- The input starts with the delimiter, hence the leading empty entry.
            local input = "abcabcabcabca"
            local expected = {"", "bc", "bc", "bc", "bc"}
            assert.are_same(expected, util.splitToArray(input, "a", true))
        end)

        it("should split input to array without empty entities", function()
            -- With the third argument false, runs of spaces yield no empty entries.
            local input = "100  abc   def ghi200  "
            local expected = {"100", "abc", "def", "ghi200"}
            assert.are_same(expected, util.splitToArray(input, " ", false))
        end)
    end)

    describe("htmlToPlainTextIfHtml()", function()
        it("should guess it is not HTML and let is as is", function()
            -- Code-like text containing '<', '&&' and a stray entity must pass
            -- through unchanged.
            local plain = "if (i < 0 && j < 0) j = i&amp;"
            assert.is_equal(plain, util.htmlToPlainTextIfHtml(plain))
        end)
        it("should guess it is HTML and convert it to text", function()
            local html = "<div> <br> Making <b>unit&nbsp;tests</b> is <i class='notreally'>fun &amp; n&#xE9;c&#233;ssaire</i><br/> </div>"
            local expected = "Making unit tests is fun & nécéssaire"
            assert.is_equal(expected, util.htmlToPlainTextIfHtml(html))
        end)
        it("should guess it is double encoded HTML and convert it to text", function()
            -- Tags and entities arrive escaped a second time (&lt;br&gt;, &amp;amp;).
            local html = "Deux parties.&lt;br&gt;Prologue.Désespérée, elle le tue...&lt;br&gt;Première partie. Sur la route &amp;amp; dans la nuit"
            local expected = "Deux parties.\nPrologue.Désespérée, elle le tue...\nPremière partie. Sur la route & dans la nuit"
            assert.is_equal(expected, util.htmlToPlainTextIfHtml(html))
        end)
    end)

    describe("isEmptyDir()", function()
        it("should return true on empty dir", function()
            -- The history directory is expected to be empty during unit tests.
            local history_dir = DataStorage:getDataDir() .. "/history"
            assert.is_true(util.isEmptyDir(history_dir))
        end)
        it("should return false on non-empty dir", function()
            -- The data directory itself is expected to contain subdirectories.
            local data_dir = DataStorage:getDataDir()
            assert.is_false(util.isEmptyDir(data_dir))
        end)
        it("should return nil on non-existent dir", function()
            local missing_dir = "/this/is/just/some/nonsense/really/this/should/not/exist"
            assert.is_nil(util.isEmptyDir(missing_dir))
        end)
    end)

    describe("getFriendlySize()", function()
        describe("should convert bytes to friendly size as string", function()
            -- One test is registered per entry:
            -- { test name, expected string, byte count, second argument }.
            -- The second argument is left nil for the unaligned cases.
            local cases = {
                { "to 100.0 GB", "100.0 GB", 100*1000*1000*1000 },
                { "to 1.0 GB", "1.0 GB", 1000*1000*1000+1 },
                { "to 1.0 MB", "1.0 MB", 1000*1000+1 },
                { "to 1.0 kB", "1.0 kB", 1000+1 },
                { "to B", "10 B", 10 },
                { "to 100.0 GB with minimum field width alignment", " 100.0 GB", 100*1000*1000*1000, true },
                { "to 1.0 GB with minimum field width alignment", "   1.0 GB", 1000*1000*1000+1, true },
                { "to 1.0 MB with minimum field width alignment", "   1.0 MB", 1000*1000+1, true },
                { "to 1.0 kB with minimum field width alignment", "   1.0 kB", 1000+1, true },
                { "to B with minimum field width alignment", "    10 B", 10, true },
            }
            for _, case in ipairs(cases) do
                local title, expected, bytes, aligned = case[1], case[2], case[3], case[4]
                it(title, function()
                    assert.is_equal(expected, util.getFriendlySize(bytes, aligned))
                end)
            end
        end)
        it("should return nil when input is nil or false", function()
            local from_nil = util.getFriendlySize(nil)
            local from_false = util.getFriendlySize(false)
            assert.is_nil(from_nil)
            assert.is_nil(from_false)
        end)
        it("should return nil when input is not a number", function()
            local from_string = util.getFriendlySize("a string")
            assert.is_nil(from_string)
        end)
    end)

    describe("urlEncode() and urlDecode", function()
        it("should encode string", function()
            -- Each entry is { encoded, plain }.
            local samples = {
                { "Secret_Password123", "Secret_Password123" },
                { "Secret%20Password123", "Secret Password123" },
                { "S*cret%3DP%40%24%24word*!%23%3F", "S*cret=P@$$word*!#?" },
                { "~%5E-_%5C%25!*'()%3B%3A%40%26%3D%2B%24%2C%2F%3F%23%5B%5D", "~^-_\\%!*'();:@&=+$,/?#[]" },
            }
            for _, sample in ipairs(samples) do
                assert.is_equal(sample[1], util.urlEncode(sample[2]))
            end
        end)
        it("should decode string", function()
            -- Each entry is { plain, encoded }.
            local samples = {
                { "Secret_Password123", "Secret_Password123" },
                { "Secret Password123", "Secret%20Password123" },
                { "S*cret=P@$$word*!#?", "S*cret%3DP%40%24%24word*!%23%3F" },
                { "~^-_\\%!*'();:@&=+$,/?#[]", "~%5E-_%5C%25!*'()%3B%3A%40%26%3D%2B%24%2C%2F%3F%23%5B%5D" },
            }
            for _, sample in ipairs(samples) do
                assert.is_equal(sample[1], util.urlDecode(sample[2]))
            end
        end)
        it("should encode and back decode string", function()
            -- Encoding and then decoding must give back the original text.
            local originals = {
                "Secret_Password123",
                "Secret Password123",
                "S*cret=P@$$word*!#?",
                "~^-_%!*'();:@&=+$,/?#[]",
            }
            for _, original in ipairs(originals) do
                assert.is_equal(original, util.urlDecode(util.urlEncode(original)))
            end
        end)
    end)
end)
-												Refactor out string.gsplit to util.gsplit

											
										
										
											2015-04-22 06:17:06 +00:00
+								describe("util module", function()
-												add unit test

											
										
										
											2017-08-12 13:22:00 +00:00
+								    local DataStorage, util
-												kobo: fix screen probe for touch

											
										
										
											2016-04-03 04:52:30 +00:00
+								    setup(function()
 								        require("commonrequire")
-												add unit test

											
										
										
											2017-08-12 13:22:00 +00:00
+								        DataStorage = require("datastorage")
-												kobo: fix screen probe for touch

											
										
										
											2016-04-03 04:52:30 +00:00
+								        util = require("util")
 								    end)
-												Other minor frontend.util cleanups (#5629)

* Resync fixUtf8 w/ upstream
* Fix lastIndexOf desc
* Drop unichar usage, it's a crappier unicodeCodepointToUtf8 ;).

											
										
										
											2019-11-23 23:27:27 +00:00
+								    it("should strip punctuation marks around word", function()
 								        assert.is_equal("hello world", util.stripPunctuation("\"hello world\""))
 								        assert.is_equal("hello world", util.stripPunctuation("\"hello world?\""))
 								        assert.is_equal("hello, world", util.stripPunctuation("\"hello, world?\""))
 								        assert.is_equal("你好", util.stripPunctuation("“你好“"))
 								        assert.is_equal("你好", util.stripPunctuation("“你好?“"))
 								        assert.is_equal("", util.stripPunctuation(""))
 								        assert.is_nil(util.stripPunctuation(nil))
-												Refactor out string.gsplit to util.gsplit

											
										
										
											2015-04-22 06:17:06 +00:00
+								    end)
-												kobo: fix screen probe for touch

											
										
										
											2016-04-03 04:52:30 +00:00
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								    describe("gsplit()", function()
 								        it("should split string with patterns", function()
 								            local sentence = "Hello world, welcome to KOReader!"
 								            local words = {}
 								            for word in util.gsplit(sentence, "%s+", false) do
 								                table.insert(words, word)
 								            end
 								            assert.are_same({"Hello", "world,", "welcome", "to", "KOReader!"}, words)
 								        end)
 								        it("should split command line arguments with quotation", function()
 								            local command = "./sdcv -nj \"words\" \"a lot\" 'more or less' --data-dir=dict"
 								            local argv = {}
 								            for arg1 in util.gsplit(command, "[\"'].-[\"']", true) do
 								                for arg2 in util.gsplit(arg1, "^[^\"'].-%s+", true) do
 								                    for arg3 in util.gsplit(arg2, "[\"']", false) do
-												Show full ToC entry on hold (#6729)

Fix #6728
											
										
										
											2020-09-30 17:56:56 +00:00
+								                        local trimmed = util.trim(arg3)
 								                        if trimmed ~= "" then
 								                            table.insert(argv, trimmed)
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								                        end
-												Refactor out string.gsplit to util.gsplit

											
										
										
											2015-04-22 06:17:06 +00:00
+								                    end
 								                end
 								            end
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								            assert.are_same({"./sdcv", "-nj", "words", "a lot", "more or less", "--data-dir=dict"}, argv)
 								        end)
 								        it("should split string with dashes", function()
 								            local words = {}
 								            for word in util.gsplit("a-b-c-d", "-", false) do
 								                table.insert(words, word)
 								            end
 								            assert.are_same({"a", "b", "c", "d"}, words)
 								        end)
 								        it("should split string with dashes with final dash", function()
 								            local words = {}
 								            for word in util.gsplit("a-b-c-d-", "-", false) do
 								                table.insert(words, word)
 								            end
 								            assert.are_same({"a", "b", "c", "d"}, words)
 								        end)
-												split accient greek words with spacing character
This should fix #1705.

											
										
										
											2016-06-28 15:50:21 +00:00
+								    end)
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								    describe("splitToWords()", function()
 								        it("should split line into words", function()
 								            local words = util.splitToWords("one two,three  four . five")
 								            assert.are_same({
 								                "one",
 								                " ",
 								                "two",
 								                ",",
 								                "three",
 								                "  ",
 								                "four",
 								                " . ",
 								                "five",
 								            }, words)
 								        end)
 								        it("should split ancient greek words", function()
 								            local words = util.splitToWords("Λαρισαῖος Λευκοθέα Λιγυαστάδης.")
 								            assert.are_same({
 								                "Λαρισαῖος",
 								                " ",
 								                "Λευκοθέα",
 								                " ",
 								                "Λιγυαστάδης",
 								                "."
 								            }, words)
 								        end)
 								        it("should split Chinese words", function()
 								            local words = util.splitToWords("彩虹是通过太阳光的折射引起的。")
 								            assert.are_same({
 								                "彩","虹","是","通","过","太","阳","光","的","折","射","引","起","的","。",
 								            }, words)
 								        end)
-												util.utf8: improve CJK character detection

Previously the CJK character detection defined only characters in the
range U+4000..U+AFFF as "CJK characters". This excludes an incredibly
large number of CJK characters within the BMP, let alone the whole two
planes dedicated to rarer CJK characters (the SIP and TIP). As a result,
a very large number of Chinese, Japanese, and Korean characters were not
detected as being CJK characters.

While slightly less elegant-looking, it is far more accurate to compute
the codepoint from the utf8 character and then see if it falls within
one of the defined CJK blocks. This is not future-proof against future
CJK ideograph extensions in future Unicode versions, but there is no
real way to accurately predict such changes so this is the best we can
do without accidentally treating characters explicitly defined as being
non-CJK in Unicode as CJK.

While we're at it, copy Lua 5.3's utf8.charpattern constant definition
so that we can more easily write utf8 iterators with string.gmatch (at
least in the interim until there is a rework of utf8 handling in
KOReader and everything is rebuilt on top of utf8proc).

Some unit tests are added for Korean and Japanese text, and the existing
unit tests needed a minor adjustment to handle the fact that
isSplittable now correctly detects CJK punctuation as a character to
compare against the forbidden split rules.

Signed-off-by: Aleksa Sarai <cyphar@cyphar.com>

											
										
										
											2021-10-23 10:12:38 +00:00
+								        it("should split Japanese words", function()
 								            local words = util.splitToWords("色は匂へど散りぬるを我が世誰ぞ常ならむ")
 								            assert.are_same({
 								                "色","は","匂","へ","ど","散","り","ぬ","る","を",
 								                "我","が","世","誰","ぞ","常","な","ら","む",
 								            }, words)
 								        end)
 								        it("should split Korean words", function()
-												[chore] Spaces for indendation, not tabs (#8364)

Overlooked in #8312.
											
										
										
											2021-10-23 14:11:47 +00:00
+								            -- Technically splitting on spaces is correct but we treat Korean
 								            -- as if it were any other CJK text.
-												util.utf8: improve CJK character detection

Previously the CJK character detection defined only characters in the
range U+4000..U+AFFF as "CJK characters". This excludes an incredibly
large number of CJK characters within the BMP, let alone the whole two
planes dedicated to rarer CJK characters (the SIP and TIP). As a result,
a very large number of Chinese, Japanese, and Korean characters were not
detected as being CJK characters.

While slightly less elegant-looking, it is far more accurate to compute
the codepoint from the utf8 character and then see if it falls within
one of the defined CJK blocks. This is not future-proof against future
CJK ideograph extensions in future Unicode versions, but there is no
real way to accurately predict such changes so this is the best we can
do without accidentally treating characters explicitly defined as being
non-CJK in Unicode as CJK.

While we're at it, copy Lua 5.3's utf8.charpattern constant definition
so that we can more easily write utf8 iterators with string.gmatch (at
least in the interim until there is a rework of utf8 handling in
KOReader and everything is rebuilt on top of utf8proc).

Some unit tests are added for Korean and Japanese text, and the existing
unit tests needed a minor adjustment to handle the fact that
isSplittable now correctly detects CJK punctuation as a character to
compare against the forbidden split rules.

Signed-off-by: Aleksa Sarai <cyphar@cyphar.com>

											
										
										
											2021-10-23 10:12:38 +00:00
+								            local words = util.splitToWords("대한민국의 국기는 대한민국 국기법에 따라 태극기")
 								            assert.are_same({
 								                "대","한","민","국","의"," ","국","기","는"," ",
 								                "대","한","민","국"," ","국","기","법","에"," ",
 								                "따","라"," ","태","극","기",
 								            }, words)
 								        end)
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        it("should split words of multilingual text", function()
 								            -- The Latin run stays together while each CJK character is split off.
 								            local expected = {"BBC", "纪", "录", "片"}
 								            local words = util.splitToWords("BBC纪录片")
 								            assert.are_same(expected, words)
 								        end)
-												split accient greek words with spacing character
This should fix #1705.

											
										
										
											2016-06-28 15:50:21 +00:00
+								    end)
-												Fix hyphenation words with unicode character in texboxwidget (#2356)


											
										
										
											2016-11-19 20:26:53 +00:00
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								    describe("splitToChars()", function()
 								        it("should split text to line - unicode", function()
 								            local text = "Pójdźże, chmurność glück schließen Štěstí neštěstí. Uñas gavilán"
 								            local word = ""
 								            local table_of_words = {}
 								            local c
 								            local table_chars = util.splitToChars(text)
 								            for i = 1, #table_chars  do
 								                c = table_chars[i]
 								                word = word .. c
 								                if util.isSplittable(c) then
 								                    table.insert(table_of_words, word)
 								                    word = ""
 								                end
-												util.utf8: improve CJK character detection

Previously the CJK character detection defined only characters in the
range U+4000..U+AFFF as "CJK characters". This excludes an incredibly
large number of CJK characters within the BMP, let alone the whole two
planes dedicated to rarer CJK characters (the SIP and TIP). As a result,
a very large number of Chinese, Japanese, and Korean characters were not
detected as being CJK characters.

While slightly less elegant-looking, it is far more accurate to compute
the codepoint from the utf8 character and then see if it falls within
one of the defined CJK blocks. This is not future-proof against future
CJK ideograph extensions in future Unicode versions, but there is no
real way to accurately predict such changes so this is the best we can
do without accidentally treating characters explicitly defined as being
non-CJK in Unicode as CJK.

While we're at it, copy Lua 5.3's utf8.charpattern constant definition
so that we can more easily write utf8 iterators with string.gmatch (at
least in the interim until there is a rework of utf8 handling in
KOReader and everything is rebuilt on top of utf8proc).

Some unit tests are added for Korean and Japanese text, and the existing
unit tests needed a minor adjustment to handle the fact that
isSplittable now correctly detects CJK punctuation as a character to
compare against the forbidden split rules.

Signed-off-by: Aleksa Sarai <cyphar@cyphar.com>

											
										
										
											2021-10-23 10:12:38 +00:00
+								                if i == #table_chars and word ~= "" then table.insert(table_of_words, word) end
-												Fix hyphenation words with unicode character in texboxwidget (#2356)


											
										
										
											2016-11-19 20:26:53 +00:00
+								            end
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								            assert.are_same({
 								                "Pójdźże, ",
 								                "chmurność ",
 								                "glück ",
 								                "schließen ",
 								                "Štěstí ",
 								                "neštěstí. ",
 								                "Uñas ",
 								                "gavilán",
 								            }, table_of_words)
 								        end)
-												util.utf8: improve CJK character detection

Previously the CJK character detection defined only characters in the
range U+4000..U+AFFF as "CJK characters". This excludes an incredibly
large number of CJK characters within the BMP, let alone the whole two
planes dedicated to rarer CJK characters (the SIP and TIP). As a result,
a very large number of Chinese, Japanese, and Korean characters were not
detected as being CJK characters.

While slightly less elegant-looking, it is far more accurate to compute
the codepoint from the utf8 character and then see if it falls within
one of the defined CJK blocks. This is not future-proof against future
CJK ideograph extensions in future Unicode versions, but there is no
real way to accurately predict such changes so this is the best we can
do without accidentally treating characters explicitly defined as being
non-CJK in Unicode as CJK.

While we're at it, copy Lua 5.3's utf8.charpattern constant definition
so that we can more easily write utf8 iterators with string.gmatch (at
least in the interim until there is a rework of utf8 handling in
KOReader and everything is rebuilt on top of utf8proc).

Some unit tests are added for Korean and Japanese text, and the existing
unit tests needed a minor adjustment to handle the fact that
isSplittable now correctly detects CJK punctuation as a character to
compare against the forbidden split rules.

Signed-off-by: Aleksa Sarai <cyphar@cyphar.com>

											
										
										
											2021-10-23 10:12:38 +00:00
+								        it("should split text to line - CJK Chinese", function()
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								            local text = "彩虹是通过太阳光的折射引起的。"
 								            local word = ""
 								            local table_of_words = {}
 								            local c
 								            local table_chars = util.splitToChars(text)
 								            for i = 1, #table_chars  do
 								                c = table_chars[i]
 								                word = word .. c
 								                if util.isSplittable(c) then
 								                    table.insert(table_of_words, word)
 								                    word = ""
 								                end
-												util.utf8: improve CJK character detection

Previously the CJK character detection defined only characters in the
range U+4000..U+AFFF as "CJK characters". This excludes an incredibly
large number of CJK characters within the BMP, let alone the whole two
planes dedicated to rarer CJK characters (the SIP and TIP). As a result,
a very large number of Chinese, Japanese, and Korean characters were not
detected as being CJK characters.

While slightly less elegant-looking, it is far more accurate to compute
the codepoint from the utf8 character and then see if it falls within
one of the defined CJK blocks. This is not future-proof against future
CJK ideograph extensions in future Unicode versions, but there is no
real way to accurately predict such changes so this is the best we can
do without accidentally treating characters explicitly defined as being
non-CJK in Unicode as CJK.

While we're at it, copy Lua 5.3's utf8.charpattern constant definition
so that we can more easily write utf8 iterators with string.gmatch (at
least in the interim until there is a rework of utf8 handling in
KOReader and everything is rebuilt on top of utf8proc).

Some unit tests are added for Korean and Japanese text, and the existing
unit tests needed a minor adjustment to handle the fact that
isSplittable now correctly detects CJK punctuation as a character to
compare against the forbidden split rules.

Signed-off-by: Aleksa Sarai <cyphar@cyphar.com>

											
										
										
											2021-10-23 10:12:38 +00:00
+								                if i == #table_chars and word ~= "" then table.insert(table_of_words, word) end
-												PR #2356 breaks CJK character splitting

											
										
										
											2016-11-26 00:46:56 +00:00
+								            end
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								            assert.are_same({
 								                "彩","虹","是","通","过","太","阳","光","的","折","射","引","起","的","。",
 								            }, table_of_words)
 								        end)
-												util.utf8: improve CJK character detection

Previously the CJK character detection defined only characters in the
range U+4000..U+AFFF as "CJK characters". This excludes an incredibly
large number of CJK characters within the BMP, let alone the whole two
planes dedicated to rarer CJK characters (the SIP and TIP). As a result,
a very large number of Chinese, Japanese, and Korean characters were not
detected as being CJK characters.

While slightly less elegant-looking, it is far more accurate to compute
the codepoint from the utf8 character and then see if it falls within
one of the defined CJK blocks. This is not future-proof against future
CJK ideograph extensions in future Unicode versions, but there is no
real way to accurately predict such changes so this is the best we can
do without accidentally treating characters explicitly defined as being
non-CJK in Unicode as CJK.

While we're at it, copy Lua 5.3's utf8.charpattern constant definition
so that we can more easily write utf8 iterators with string.gmatch (at
least in the interim until there is a rework of utf8 handling in
KOReader and everything is rebuilt on top of utf8proc).

Some unit tests are added for Korean and Japanese text, and the existing
unit tests needed a minor adjustment to handle the fact that
isSplittable now correctly detects CJK punctuation as a character to
compare against the forbidden split rules.

Signed-off-by: Aleksa Sarai <cyphar@cyphar.com>

											
										
										
											2021-10-23 10:12:38 +00:00
+								        it("should split text to line - CJK Japanese", function()
 								            local text = "色は匂へど散りぬるを我が世誰ぞ常ならむ"
 								            local chars = util.splitToChars(text)
 								            local pieces = {}
 								            local pending = ""
 								            -- Accumulate characters and cut a piece right after every splittable one.
 								            for idx = 1, #chars do
 								                local ch = chars[idx]
 								                pending = pending .. ch
 								                if util.isSplittable(ch) then
 								                    pieces[#pieces + 1] = pending
 								                    pending = ""
 								                end
 								            end
 								            -- Flush whatever trails the last split point.
 								            if pending ~= "" then
 								                pieces[#pieces + 1] = pending
 								            end
 								            assert.are_same({
 								                "色","は","匂","へ","ど","散","り","ぬ","る","を",
 								                "我","が","世","誰","ぞ","常","な","ら","む",
 								            }, pieces)
 								        end)
 								        it("should split text to line - CJK Korean", function()
 								            local text = "대한민국의 국기는 대한민국 국기법에 따라 태극기"
 								            local chars = util.splitToChars(text)
 								            local pieces = {}
 								            local pending = ""
 								            -- Build up a piece until isSplittable() allows a break after the current character.
 								            for idx = 1, #chars do
 								                local ch = chars[idx]
 								                pending = pending .. ch
 								                if util.isSplittable(ch) then
 								                    pieces[#pieces + 1] = pending
 								                    pending = ""
 								                end
 								            end
 								            -- Keep the unfinished tail, if any, as the last piece.
 								            if pending ~= "" then
 								                pieces[#pieces + 1] = pending
 								            end
 								            -- Expected: one piece per Hangul syllable, and each space as a piece of its own.
 								            assert.are_same({
 								                "대","한","민","국","의"," ","국","기","는"," ",
 								                "대","한","민","국"," ","국","기","법","에"," ",
 								                "따","라"," ","태","극","기",
 								            }, pieces)
 								        end)
 								        it("should split text to line - mixed CJK and latin", function()
 								            local text = "This is Russian: русский язык, Chinese: 汉语, Japanese: 日本語、 Korean: 한국어。"
 								            local chars = util.splitToChars(text)
 								            local pieces = {}
 								            local pending = ""
 								            -- Grow the current piece and close it after every splittable character.
 								            for idx = 1, #chars do
 								                local ch = chars[idx]
 								                pending = pending .. ch
 								                if util.isSplittable(ch) then
 								                    pieces[#pieces + 1] = pending
 								                    pending = ""
 								                end
 								            end
 								            -- Anything left after the last break becomes the final piece.
 								            if pending ~= "" then
 								                pieces[#pieces + 1] = pending
 								            end
 								            -- Expected: Latin/Cyrillic words keep their trailing space, CJK characters stand alone.
 								            assert.are_same({
 								                "This ", "is ",
 								                "Russian: ", "русский ", "язык, ",
 								                "Chinese: ", "汉","语",", ",
 								                "Japanese: ", "日","本","語","、", " ",
 								                "Korean: ", "한","국","어","。",
 								            }, pieces)
 								        end)
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        it("should split text to line with next_c - unicode", function()
 								            local text = "Ce test : 1) est très simple ; 2 ) simple comme ( 2/2 ) > 50 % ? ok."
 								            local word = ""
 								            local table_of_words = {}
 								            local c, next_c
 								            local table_chars = util.splitToChars(text)
 								            for i = 1, #table_chars  do
 								                c = table_chars[i]
 								                next_c = i < #table_chars and table_chars[i+1] or nil
 								                word = word .. c
 								                if util.isSplittable(c, next_c) then
 								                    table.insert(table_of_words, word)
 								                    word = ""
 								                end
-												util.utf8: improve CJK character detection

Previously the CJK character detection defined only characters in the
range U+4000..U+AFFF as "CJK characters". This excludes an incredibly
large number of CJK characters within the BMP, let alone the whole two
planes dedicated to rarer CJK characters (the SIP and TIP). As a result,
a very large number of Chinese, Japanese, and Korean characters were not
detected as being CJK characters.

While slightly less elegant-looking, it is far more accurate to compute
the codepoint from the utf8 character and then see if it falls within
one of the defined CJK blocks. This is not future-proof against future
CJK ideograph extensions in future Unicode versions, but there is no
real way to accurately predict such changes so this is the best we can
do without accidentally treating characters explicitly defined as being
non-CJK in Unicode as CJK.

While we're at it, copy Lua 5.3's utf8.charpattern constant definition
so that we can more easily write utf8 iterators with string.gmatch (at
least in the interim until there is a rework of utf8 handling in
KOReader and everything is rebuilt on top of utf8proc).

Some unit tests are added for Korean and Japanese text, and the existing
unit tests needed a minor adjustment to handle the fact that
isSplittable now correctly detects CJK punctuation as a character to
compare against the forbidden split rules.

Signed-off-by: Aleksa Sarai <cyphar@cyphar.com>

											
										
										
											2021-10-23 10:12:38 +00:00
+								                if i == #table_chars and word ~= "" then table.insert(table_of_words, word) end
-												textboxwidget and scrolltextwidget enhancements (#2393)

util: made isSplitable() accept an optional next_char
for wiser decision

textboxwidget: speed up rendering, enhanced text wrapping,
allow selection of multiple words with Hold.

scrolltextwidget: allow scrolling with Tap.

Details in #2393

											
										
										
											2016-12-06 21:10:25 +00:00
+								            end
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								            assert.are_same({
 								                "Ce ",
 								                "test : ",
 								                "1) ",
 								                "est ",
 								                "très ",
 								                "simple ; ",
 								                "2 ) ",
 								                "simple ",
 								                "comme ",
 								                "( ",
 								                "2/2 ) > ",
 								                "50 % ? ",
 								                "ok."
 								            }, table_of_words)
 								        end)
 								        it("should split text to line with next_c and prev_c - unicode", function()
 								            local text = "Ce test : 1) est « très simple » ; 2 ) simple comme ( 2/2 ) > 50 % ? ok."
 								            local word = ""
 								            local table_of_words = {}
 								            local c, next_c, prev_c
 								            local table_chars = util.splitToChars(text)
 								            for i = 1, #table_chars  do
 								                c = table_chars[i]
 								                next_c = i < #table_chars and table_chars[i+1] or nil
 								                prev_c = i > 1 and table_chars[i-1] or nil
 								                word = word .. c
 								                if util.isSplittable(c, next_c, prev_c) then
 								                    table.insert(table_of_words, word)
 								                    word = ""
 								                end
-												util.utf8: improve CJK character detection

Previously the CJK character detection defined only characters in the
range U+4000..U+AFFF as "CJK characters". This excludes an incredibly
large number of CJK characters within the BMP, let alone the whole two
planes dedicated to rarer CJK characters (the SIP and TIP). As a result,
a very large number of Chinese, Japanese, and Korean characters were not
detected as being CJK characters.

While slightly less elegant-looking, it is far more accurate to compute
the codepoint from the utf8 character and then see if it falls within
one of the defined CJK blocks. This is not future-proof against future
CJK ideograph extensions in future Unicode versions, but there is no
real way to accurately predict such changes so this is the best we can
do without accidentally treating characters explicitly defined as being
non-CJK in Unicode as CJK.

While we're at it, copy Lua 5.3's utf8.charpattern constant definition
so that we can more easily write utf8 iterators with string.gmatch (at
least in the interim until there is a rework of utf8 handling in
KOReader and everything is rebuilt on top of utf8proc).

Some unit tests are added for Korean and Japanese text, and the existing
unit tests needed a minor adjustment to handle the fact that
isSplittable now correctly detects CJK punctuation as a character to
compare against the forbidden split rules.

Signed-off-by: Aleksa Sarai <cyphar@cyphar.com>

											
										
										
											2021-10-23 10:12:38 +00:00
+								                if i == #table_chars and word ~= "" then table.insert(table_of_words, word) end
-												textboxwidget: even better text wrapping

util.isSplitable() accepts now also the previous char to help
decide if a space can be used to split a line.
TextBoxWidget:_splitCharWidthList() : simplified logic

											
										
										
											2016-12-12 22:41:16 +00:00
+								            end
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								            assert.are_same({
 								                "Ce ",
 								                "test : ",
 								                "1) ",
 								                "est ",
 								                "« très ",
 								                "simple » ; ",
 								                "2 ) ",
 								                "simple ",
 								                "comme ",
 								                "( 2/2 ) > 50 % ? ",
 								                "ok."
 								            }, table_of_words)
 								        end)
-												textboxwidget: even better text wrapping

util.isSplitable() accepts now also the previous char to help
decide if a space can be used to split a line.
TextBoxWidget:_splitCharWidthList() : simplified logic

											
										
										
											2016-12-12 22:41:16 +00:00
+								    end)
-												evernote: ReadHistory integration and text file output (#2498)



											
										
										
											2017-01-21 09:32:42 +00:00
+								    it("should split file path and name", function()
 								        -- Splits `full` with util.splitFilePathName() and checks both returned parts.
 								        -- @param full  input passed to splitFilePathName (may be nil)
 								        -- @param path  expected first return value (directory part)
 								        -- @param name  expected second return value (file name part)
 								        -- luassert takes (expected, actual); keeping that order makes failure
 								        -- messages label the two values correctly.
 								        local test = function(full, path, name)
 								            local p, n = util.splitFilePathName(full)
 								            assert.are_same(path, p)
 								            assert.are_same(name, n)
 								        end
 								        test("/a/b/c.txt", "/a/b/", "c.txt")
 								        test("/a/b////c.txt", "/a/b////", "c.txt")
 								        test("/a/b/", "/a/b/", "")
 								        test("c.txt", "", "c.txt")
 								        test("", "", "")
 								        test(nil, "", "")
 								        test("a/b", "a/", "b")
 								        test("/b", "/", "b")
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        assert.are_same("/a/b/", util.splitFilePathName("/a/b/c.txt"))
-												evernote: ReadHistory integration and text file output (#2498)



											
										
										
											2017-01-21 09:32:42 +00:00
+								    end)
-												textboxwidget: even better text wrapping

util.isSplitable() accepts now also the previous char to help
decide if a space can be used to split a line.
TextBoxWidget:_splitCharWidthList() : simplified logic

											
										
										
											2016-12-12 22:41:16 +00:00
-												evernote: ReadHistory integration and text file output (#2498)



											
										
										
											2017-01-21 09:32:42 +00:00
+								    it("should split file name and suffix", function()
 								        -- Splits `full` with util.splitFileNameSuffix() and checks both returned parts.
 								        -- @param full    input passed to splitFileNameSuffix (may be nil)
 								        -- @param name    expected first return value (name without suffix)
 								        -- @param suffix  expected second return value (suffix without the dot)
 								        -- luassert takes (expected, actual); keeping that order makes failure
 								        -- messages label the two values correctly.
 								        local test = function(full, name, suffix)
 								            local n, s = util.splitFileNameSuffix(full)
 								            assert.are_same(name, n)
 								            assert.are_same(suffix, s)
 								        end
 								        test("a.txt", "a", "txt")
 								        test("/a/b.txt", "/a/b", "txt")
 								        test("a", "a", "")
 								        test("/a/b", "/a/b", "")
 								        test("/a/", "/a/", "")
 								        test("/a/.txt", "/a/", "txt")
 								        test(nil, "", "")
 								        test("", "", "")
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        assert.are_same("a", util.splitFileNameSuffix("a.txt"))
-												evernote: ReadHistory integration and text file output (#2498)



											
										
										
											2017-01-21 09:32:42 +00:00
+								    end)
-												Added util.fixUtf8 (#2704)

* Remove invalid UTF-8 chars from OPDS
* add unit tests
											
										
										
											2017-04-02 14:17:49 +00:00
-												[fix] util.getSafeFilename() maximum extension length (#5067)

Strip HTML and do some semi-intelligent detection of faux extensions (i.e., more than 10 characters probably isn't one).

Fixes #5049.
											
										
										
											2019-06-10 15:06:13 +00:00
+								    describe("getSafeFileName()", function()
 								        it("should replace unsafe characters", function()
 								            -- Each "|" is expected to come back as an underscore.
 								            local safe_name = util.getSafeFilename("|||")
 								            assert.is_equal("___", safe_name)
 								        end)
 								        it("should truncate any characters beyond the limit", function()
 								            assert.is_equal("aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", util.getSafeFilename("aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa"))
 								        end)
 								        it("should truncate extension beyond the limit", function()
 								            assert.is_equal("aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", util.getSafeFilename("aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa.aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa"))
 								        end)
 								        it("should strip HTML from the filename", function()
 								            -- Only the text between the tags is expected to remain.
 								            local safe_name = util.getSafeFilename("<span>lalala</span>")
 								            assert.is_equal("lalala", safe_name)
 								        end)
 								    end)
-												md5: centralize and deduplicate (#11003)

Document partial md5 hash is calculated by util.partialMD5() and stored in doc_settings as "partial_md5_checksum" on the first document opening.
											
										
										
											2023-10-15 04:47:09 +00:00
+								    describe("partialMD5()", function()
 								        -- Both tests compare util.partialMD5() of a fixture file with a known digest.
 								        -- The known digest goes first: luassert's order is (expected, actual).
 								        it("should calculate partial md5 hash of pdf file", function()
 								            assert.is_equal("41cce710f34e5ec21315e19c99821415", util.partialMD5("spec/front/unit/data/tall.pdf"))
 								        end)
 								        it("should calculate partial md5 hash of epub file", function()
 								            assert.is_equal("59d481d168cca6267322f150c5f6a2a3", util.partialMD5("spec/front/unit/data/leaves.epub"))
 								        end)
 								    end)
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								    describe("fixUtf8()", function()
 								        it("should replace invalid UTF-8 characters with an underscore", function()
 								            -- \128 and \194 are expected to be replaced; \127 and the spaces are kept.
 								            local input = "\127 \128 \194\127 "
 								            local fixed = util.fixUtf8(input, "_")
 								            assert.is_equal("\127 _ _\127 ", fixed)
 								        end)
-												Added util.fixUtf8 (#2704)

* Remove invalid UTF-8 chars from OPDS
* add unit tests
											
										
										
											2017-04-02 14:17:49 +00:00
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        it("should replace invalid UTF-8 characters with multiple characters", function()
 								            -- Each invalid byte is expected to be swapped for the whole replacement string.
 								            local input = "\127 \128 \194\127 "
 								            local fixed = util.fixUtf8(input, "__")
 								            assert.is_equal("\127 __ __\127 ", fixed)
 								        end)
-												Added util.fixUtf8 (#2704)

* Remove invalid UTF-8 chars from OPDS
* add unit tests
											
										
										
											2017-04-02 14:17:49 +00:00
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        it("should replace invalid UTF-8 characters with empty char", function()
 								            -- With an empty replacement the invalid bytes are expected to simply disappear.
 								            local input = "\127 \128 \194\127 "
 								            local fixed = util.fixUtf8(input, "")
 								            assert.is_equal("\127  \127 ", fixed)
 								        end)
-												Added util.fixUtf8 (#2704)

* Remove invalid UTF-8 chars from OPDS
* add unit tests
											
										
										
											2017-04-02 14:17:49 +00:00
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        it("should not replace valid UTF-8 \239\191\189 character", function()
 								            -- \239\191\189 is the UTF-8 encoding of U+FFFD (bytes EF BF BD). The literal
 								            -- characters had been mangled into ASCII placeholder text, so the test no
 								            -- longer fed a multi-byte sequence to fixUtf8(); byte escapes keep it
 								            -- encoding-proof.
 								            local text = "\239\191\189valid \239\191\189 char \239\191\189"
 								            assert.is_equal(text, util.fixUtf8(text, "__"))
 								        end)
-												Added util.fixUtf8 (#2704)

* Remove invalid UTF-8 chars from OPDS
* add unit tests
											
										
										
											2017-04-02 14:17:49 +00:00
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        it("should not replace valid UTF-8 characters", function()
 								            -- \244\129\130\190 is a well-formed four-byte sequence and must survive.
 								            local valid = "\99 \244\129\130\190"
 								            assert.is_equal(valid, util.fixUtf8(valid, "_"))
 								        end)
-												Added util.fixUtf8 (#2704)

* Remove invalid UTF-8 chars from OPDS
* add unit tests
											
										
										
											2017-04-02 14:17:49 +00:00
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        it("should not replace valid UTF-8 characters Polish chars", function()
 								            -- The accented letters are valid UTF-8, so the text must come back unchanged.
 								            local polish = "Pójdźże źółć"
 								            assert.is_equal(polish, util.fixUtf8(polish, "_"))
 								        end)
-												Added util.fixUtf8 (#2704)

* Remove invalid UTF-8 chars from OPDS
* add unit tests
											
										
										
											2017-04-02 14:17:49 +00:00
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        it("should not replace valid UTF-8 characters German chars", function()
 								            -- Umlaut and sharp s are valid UTF-8, so the text must come back unchanged.
 								            local german = "glück schließen"
 								            assert.is_equal(german, util.fixUtf8(german, "_"))
 								        end)
-												Added util.fixUtf8 (#2704)

* Remove invalid UTF-8 chars from OPDS
* add unit tests
											
										
										
											2017-04-02 14:17:49 +00:00
+								    end)
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								    describe("splitToArray()", function()
 								        it("should split input to array", function()
 								            -- With the third argument set to true the expected result keeps the
 								            -- empty field found between the doubled tabs.
 								            local input, delimiter = "100\tabc\t\tdef\tghi200\t", "\t"
 								            local expected = {"100", "abc", "", "def", "ghi200"}
 								            assert.are_same(expected, util.splitToArray(input, delimiter, true))
 								        end)
-												Merge various information into systemstat (#2764)

* Merge various information to systemstat
											
										
										
											2017-04-14 19:12:28 +00:00
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        it("should also split input to array", function()
 								            -- The input starts with the delimiter, so the expected array opens
 								            -- with an empty entry.
 								            local input, delimiter = "abcabcabcabca", "a"
 								            local expected = {"", "bc", "bc", "bc", "bc"}
 								            assert.are_same(expected, util.splitToArray(input, delimiter, true))
 								        end)
-												Merge various information into systemstat (#2764)

* Merge various information to systemstat
											
										
										
											2017-04-14 19:12:28 +00:00
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        it("should split input to array without empty entities", function()
 								            -- With the third argument set to false, runs of spaces must not
 								            -- contribute empty entries to the result.
 								            local input, delimiter = "100  abc   def ghi200  ", " "
 								            local expected = {"100", "abc", "def", "ghi200"}
 								            assert.are_same(expected, util.splitToArray(input, delimiter, false))
 								        end)
-												Merge various information into systemstat (#2764)

* Merge various information to systemstat
											
										
										
											2017-04-14 19:12:28 +00:00
+								    end)
-												Book information: refactored and additional features

- Factored out duplicate code from filemanager.lua and filemanagerhistory.lua
to new filemanagerbookinfo.lua (and other common code to filemanagerutil.lua).
- Uses sidecar files' new doc_props and doc_pages settings, or fallback to
old 'stats' settings, or to opening document.
- Shows filename, filetype and directory.
- Shows description (Hold to see whole truncated text), keywords, and
cover image (tap to extract image from document and display it if available).
- Book information now available from reader menu, to display info about
the currently opened book.
- Convert possibly HTML description to plain text via added
util.htmlToPlainTextIfHtml() (for simple HTML conversion).

											
										
										
											2017-07-01 10:11:44 +00:00
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								    describe("htmlToPlainTextIfHtml()", function()
 								        it("should guess it is not HTML and leave it as is", function()
 								            -- Code-like text with "<", "&&" and a lone "&amp;" entity but no tags:
 								            -- it must be returned untouched, entity included.
 								            local plain = "if (i < 0 && j < 0) j = i&amp;"
 								            assert.is_equal(plain, util.htmlToPlainTextIfHtml(plain))
 								        end)
 								        it("should guess it is HTML and convert it to text", function()
 								            -- Tags are expected to be stripped and the named, hexadecimal and
 								            -- decimal entities decoded.
 								            local html = "<div> <br> Making <b>unit&nbsp;tests</b> is <i class='notreally'>fun &amp; n&#xE9;c&#233;ssaire</i><br/> </div>"
 								            local expected = "Making unit tests is fun & nécéssaire"
 								            assert.is_equal(expected, util.htmlToPlainTextIfHtml(html))
 								        end)
 								        it("should guess it is double encoded HTML and convert it to text", function()
 								            -- The markup arrives entity-escaped ("&lt;br&gt;", "&amp;amp;"); the
 								            -- expected text has line breaks and a plain "&" instead.
 								            local escaped = "Deux parties.&lt;br&gt;Prologue.Désespérée, elle le tue...&lt;br&gt;Première partie. Sur la route &amp;amp; dans la nuit"
 								            local expected = "Deux parties.\nPrologue.Désespérée, elle le tue...\nPremière partie. Sur la route & dans la nuit"
 								            assert.is_equal(expected, util.htmlToPlainTextIfHtml(escaped))
 								        end)
-												Book information: refactored and additional features

- Factored out duplicate code from filemanager.lua and filemanagerhistory.lua
to new filemanagerbookinfo.lua (and other common code to filemanagerutil.lua).
- Uses sidecar files' new doc_props and doc_pages settings, or fallback to
old 'stats' settings, or to opening document.
- Shows filename, filetype and directory.
- Shows description (Hold to see whole truncated text), keywords, and
cover image (tap to extract image from document and display it if available).
- Book information now available from reader menu, to display info about
the currently opened book.
- Convert possibly HTML description to plain text via added
util.htmlToPlainTextIfHtml() (for simple HTML conversion).

											
										
										
											2017-07-01 10:11:44 +00:00
+								    end)
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
 								    describe("isEmptyDir()", function()
 								        it("should return true on empty dir", function()
-												Tests: emptydir switch from data/dict to history (#8296)

So this test doesn't fail when one has dictionaries locally
(history folder is deprecated and should be empty).
											
										
										
											2021-10-10 11:33:57 +00:00
+								            assert.is_true(util.isEmptyDir(DataStorage:getDataDir() .. "/history")) -- should be empty during unit tests
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
+								        end)
 								        it("should return false on non-empty dir", function()
 								            -- The data directory should contain subdirectories.
 								            local data_dir = DataStorage:getDataDir()
 								            assert.is_false(util.isEmptyDir(data_dir))
 								        end)
 								        it("should return nil on non-existent dir", function()
 								            -- A path that does not exist must yield nil rather than true or false.
 								            assert.is_nil(util.isEmptyDir("/this/is/just/some/nonsense/really/this/should/not/exist"))
 								        end)
-												add unit test

											
										
										
											2017-08-12 13:22:00 +00:00
+								    end)
-												[chore] Rework util spec, rework util.secondsToClock: round seconds to minutes in 00:00 mode + spec

Most of the tests in util_spec were the wrong way around.
It's `assert(expected, given)`.

											
										
										
											2017-10-11 14:38:20 +00:00
-												[spec] util_spec: tests for util.getFriendlySize() (#3650)


											
										
										
											2018-01-31 16:22:34 +00:00
+								    describe("getFriendlySize()", function()
 								        describe("should convert bytes to friendly size as string", function()
 								            it("to 100.0 GB", function()
 								                assert.is_equal("100.0 GB",
-												Address assorted Weblate comments (#7154)

* Fix typo in dropbox

Reported by @lescheck

* Rephrase text justification explanation more elegantly

* CoverBrowser: fix up some plurals

* Statistics: remove random use of template function

* Use ngettext for minute/minutes and second/seconds

* Change KB/MB/GB to kB/MB/GB SI units
											
										
										
											2021-01-16 20:40:00 +00:00
+								                                util.getFriendlySize(100*1000*1000*1000))
-												[spec] util_spec: tests for util.getFriendlySize() (#3650)


											
										
										
											2018-01-31 16:22:34 +00:00
+								            end)
-												util.getFriendlySize(): add option to right align

Left align by default, but allow right alignment by
padding left with spaces.

											
										
										
											2019-12-17 12:00:35 +00:00
+								            it("to 1.0 GB", function()
 								                assert.is_equal("1.0 GB",
-												Address assorted Weblate comments (#7154)

* Fix typo in dropbox

Reported by @lescheck

* Rephrase text justification explanation more elegantly

* CoverBrowser: fix up some plurals

* Statistics: remove random use of template function

* Use ngettext for minute/minutes and second/seconds

* Change KB/MB/GB to kB/MB/GB SI units
											
										
										
											2021-01-16 20:40:00 +00:00
+								                                util.getFriendlySize(1000*1000*1000+1))
-												[spec] util_spec: tests for util.getFriendlySize() (#3650)


											
										
										
											2018-01-31 16:22:34 +00:00
+								            end)
-												util.getFriendlySize(): add option to right align

Left align by default, but allow right alignment by
padding left with spaces.

											
										
										
											2019-12-17 12:00:35 +00:00
+								            it("to 1.0 MB", function()
 								                assert.is_equal("1.0 MB",
-												Address assorted Weblate comments (#7154)

* Fix typo in dropbox

Reported by @lescheck

* Rephrase text justification explanation more elegantly

* CoverBrowser: fix up some plurals

* Statistics: remove random use of template function

* Use ngettext for minute/minutes and second/seconds

* Change KB/MB/GB to kB/MB/GB SI units
											
										
										
											2021-01-16 20:40:00 +00:00
+								                                util.getFriendlySize(1000*1000+1))
-												[spec] util_spec: tests for util.getFriendlySize() (#3650)


											
										
										
											2018-01-31 16:22:34 +00:00
+								            end)
-												Address assorted Weblate comments (#7154)

* Fix typo in dropbox

Reported by @lescheck

* Rephrase text justification explanation more elegantly

* CoverBrowser: fix up some plurals

* Statistics: remove random use of template function

* Use ngettext for minute/minutes and second/seconds

* Change KB/MB/GB to kB/MB/GB SI units
											
										
										
											2021-01-16 20:40:00 +00:00
+								            it("to 1.0 kB", function()
 								                assert.is_equal("1.0 kB",
 								                                util.getFriendlySize(1000+1))
-												[spec] util_spec: tests for util.getFriendlySize() (#3650)


											
										
										
											2018-01-31 16:22:34 +00:00
+								            end)
 								            it("to B", function()
-												util.getFriendlySize(): add option to right align

Left align by default, but allow right alignment by
padding left with spaces.

											
										
										
											2019-12-17 12:00:35 +00:00
+								                assert.is_equal("10 B",
 								                                util.getFriendlySize(10))
 								            end)
 								            it("to 100.0 GB with minimum field width alignment", function()
 								                assert.is_equal(" 100.0 GB",
-												Address assorted Weblate comments (#7154)

* Fix typo in dropbox

Reported by @lescheck

* Rephrase text justification explanation more elegantly

* CoverBrowser: fix up some plurals

* Statistics: remove random use of template function

* Use ngettext for minute/minutes and second/seconds

* Change KB/MB/GB to kB/MB/GB SI units
											
										
										
											2021-01-16 20:40:00 +00:00
+								                                util.getFriendlySize(100*1000*1000*1000, true))
-												util.getFriendlySize(): add option to right align

Left align by default, but allow right alignment by
padding left with spaces.

											
										
										
											2019-12-17 12:00:35 +00:00
+								            end)
 								            it("to 1.0 GB with minimum field width alignment", function()
 								                assert.is_equal("   1.0 GB",
-												Address assorted Weblate comments (#7154)

* Fix typo in dropbox

Reported by @lescheck

* Rephrase text justification explanation more elegantly

* CoverBrowser: fix up some plurals

* Statistics: remove random use of template function

* Use ngettext for minute/minutes and second/seconds

* Change KB/MB/GB to kB/MB/GB SI units
											
										
										
											2021-01-16 20:40:00 +00:00
+								                                util.getFriendlySize(1000*1000*1000+1, true))
-												util.getFriendlySize(): add option to right align

Left align by default, but allow right alignment by
padding left with spaces.

											
										
										
											2019-12-17 12:00:35 +00:00
+								            end)
 								            it("to 1.0 MB with minimum field width alignment", function()
 								                assert.is_equal("   1.0 MB",
-												Address assorted Weblate comments (#7154)

* Fix typo in dropbox

Reported by @lescheck

* Rephrase text justification explanation more elegantly

* CoverBrowser: fix up some plurals

* Statistics: remove random use of template function

* Use ngettext for minute/minutes and second/seconds

* Change KB/MB/GB to kB/MB/GB SI units
											
										
										
											2021-01-16 20:40:00 +00:00
+								                                util.getFriendlySize(1000*1000+1, true))
-												util.getFriendlySize(): add option to right align

Left align by default, but allow right alignment by
padding left with spaces.

											
										
										
											2019-12-17 12:00:35 +00:00
+								            end)
-												Address assorted Weblate comments (#7154)

* Fix typo in dropbox

Reported by @lescheck

* Rephrase text justification explanation more elegantly

* CoverBrowser: fix up some plurals

* Statistics: remove random use of template function

* Use ngettext for minute/minutes and second/seconds

* Change KB/MB/GB to kB/MB/GB SI units
											
										
										
											2021-01-16 20:40:00 +00:00
+								            it("to 1.0 kB with minimum field width alignment", function()
 								                assert.is_equal("   1.0 kB",
 								                                util.getFriendlySize(1000+1, true))
-												util.getFriendlySize(): add option to right align

Left align by default, but allow right alignment by
padding left with spaces.

											
										
										
											2019-12-17 12:00:35 +00:00
+								            end)
 								            it("to B with minimum field width alignment", function()
 								                assert.is_equal("    10 B",
 								                                util.getFriendlySize(10, true))
-												[spec] util_spec: tests for util.getFriendlySize() (#3650)


											
										
										
											2018-01-31 16:22:34 +00:00
+								            end)
 								        end)
 								        it("should return nil when input is nil or false", function()
 								            -- Both falsy inputs are expected to be rejected the same way.
 								            assert.is_nil(util.getFriendlySize(nil))
 								            assert.is_nil(util.getFriendlySize(false))
 								        end)
 								        it("should return nil when input is not a number", function()
 								            -- A string with no numeric content must not produce a size.
 								            assert.is_nil(util.getFriendlySize("a string"))
 								        end)
 								    end)
-												CloudStorage: Allow use reserved characters in FTP username and FTP password  (#3924)

Depends on RFC 3986 compliant util.urlEncode() and adds unit tests for the new functions.
											
										
										
											2018-05-04 15:06:58 +00:00
+								    describe("urlEncode() and urlDecode", function()
 								        -- The encode and decode cases mirror each other: every plain string on
 								        -- one side is paired with the same percent-encoded form on the other.
 								        it("should encode string", function()
 								            assert.is_equal("Secret_Password123", util.urlEncode("Secret_Password123"))
 								            assert.is_equal("Secret%20Password123", util.urlEncode("Secret Password123"))
 								            assert.is_equal("S*cret%3DP%40%24%24word*!%23%3F", util.urlEncode("S*cret=P@$$word*!#?"))
 								            -- Per the expected value, ~ - _ ! * ' ( ) stay literal; the rest is escaped.
 								            assert.is_equal("~%5E-_%5C%25!*'()%3B%3A%40%26%3D%2B%24%2C%2F%3F%23%5B%5D",
 								                util.urlEncode("~^-_\\%!*'();:@&=+$,/?#[]"))
 								        end)
 								        it("should decode string", function()
 								            assert.is_equal("Secret_Password123", util.urlDecode("Secret_Password123"))
 								            assert.is_equal("Secret Password123", util.urlDecode("Secret%20Password123"))
 								            assert.is_equal("S*cret=P@$$word*!#?", util.urlDecode("S*cret%3DP%40%24%24word*!%23%3F"))
 								            assert.is_equal("~^-_\\%!*'();:@&=+$,/?#[]",
 								                util.urlDecode("~%5E-_%5C%25!*'()%3B%3A%40%26%3D%2B%24%2C%2F%3F%23%5B%5D"))
 								        end)
 								        it("should encode and back decode string", function()
 								            -- Same plain strings as the one-way cases, backslash included, so the
 								            -- round trip is checked for every character those cases cover.
 								            local samples = {
 								                "Secret_Password123",
 								                "Secret Password123",
 								                "S*cret=P@$$word*!#?",
 								                "~^-_\\%!*'();:@&=+$,/?#[]",
 								            }
 								            for _, plain in ipairs(samples) do
 								                assert.is_equal(plain, util.urlDecode(util.urlEncode(plain)))
 								            end
 								        end)
 								    end)
-												Refactor out string.gsplit to util.gsplit

											
										
										
											2015-04-22 06:17:06 +00:00
+								end)