koreader/frontend/util.lua

--[[--
This module contains miscellaneous helper functions for the KOReader frontend.
]]

local BaseUtil = require("ffi/util")
local util = {}

--- Strips punctuation from a string.
-- Every 3-byte UTF-8 sequence encoding U+2000 - U+20FF (this covers the
-- General Punctuation block, U+2000 - U+206F) is removed anywhere in the
-- text; ASCII punctuation is then trimmed from the start and the end only.
-- Spaces, and ASCII punctuation inside the text, are left untouched.
---- @string text the string to be stripped
---- @treturn string stripped text (nothing is returned if text is nil or false)
function util.stripePunctuations(text)
    if not text then return end
    -- "\226[\128-\131][\128-\191]" is the UTF-8 byte form of U+2000 - U+20FF
    local stripped = text:gsub("\226[\128-\131][\128-\191]", '')
    -- trim leading, then trailing, punctuation
    stripped = stripped:gsub("^%p+", ''):gsub("%p+$", '')
    -- Return the string alone: string.gsub also yields a substitution count,
    -- which must not leak to callers as a second return value.
    return stripped
end

--- Splits a string by a pattern.
--[[--
Returns an iterator over the pieces of `str` found between matches of
`pattern`. Unlike string.gmatch(), it can also hand back the delimiters
themselves (when `capture` is true), in the order they occur, without the
caller having to track positions and substrings. Empty pieces (for example
between two adjacent delimiters) are never produced.

Raises an error, attributed to the caller, if the pattern can match the
empty string.

Author: Peter Odding
License: MIT/X11
Source: http://snippets.luacode.org/snippets/String_splitting_130
]]
----@string str string to split
----@param pattern the pattern to split against (defaults to '%s+')
----@bool capture if true, the matched delimiters are yielded as well
function util.gsplit(str, pattern, capture)
    pattern = pattern and tostring(pattern) or '%s+'
    -- a delimiter that matches nothing would never let the cursor advance
    if (''):find(pattern) then
        error('pattern matches empty string!', 2)
    end
    return coroutine.wrap(function()
        local cursor = 1
        while true do
            local match_start, match_end = str:find(pattern, cursor)
            if not (match_start and match_end) then
                -- no further delimiter: whatever remains is the last piece
                if cursor <= #str then
                    coroutine.yield(str:sub(cursor))
                end
                return
            end
            -- text between the cursor and the delimiter, if any
            if cursor < match_start then
                coroutine.yield(str:sub(cursor, match_start - 1))
            end
            if capture then
                coroutine.yield(str:sub(match_start, match_end))
            end
            cursor = match_end + 1
            if cursor > #str then
                return
            end
        end
    end)
end

--- Converts seconds to a clock string.
-- Source: https://gist.github.com/jesseadams/791673
-- Each field is truncated (floored), never rounded. Input that cannot be
-- converted to a number, as well as 0 and NaN, yields a zeroed clock.
---- @int seconds number of seconds (a numeric string is accepted too)
---- @bool withoutSeconds if true 00:00, if false 00:00:00
---- @treturn string clock string in the form of 00:00 or 00:00:00
function util.secondsToClock(seconds, withoutSeconds)
    seconds = tonumber(seconds)
    -- tonumber() gives nil for non-numeric input; `seconds ~= seconds` is
    -- only true for NaN. Neither can be turned into a meaningful clock.
    if not seconds or seconds == 0 or seconds ~= seconds then
        if withoutSeconds then
            return "00:00"
        end
        return "00:00:00"
    end
    -- Keep the fields as numbers and format them once at the end, instead
    -- of relying on implicit string -> number coercion.
    local hours = math.floor(seconds / 3600)
    local mins = math.floor(seconds / 60 - hours * 60)
    local clock = string.format("%02.f", hours) .. ":" .. string.format("%02.f", mins)
    if withoutSeconds then
        return clock
    end
    local secs = math.floor(seconds - hours * 3600 - mins * 60)
    return clock .. ":" .. string.format("%02.f", secs)
end

--- Counts the entries of a table.
-- Every key visited by pairs() is counted, so both the array part and the
-- hash part contribute (unlike the # operator).
---- @param T Lua table
---- @treturn int number of keys in table T
function util.tableSize(T)
    local n = 0
    for _ in pairs(T) do
        n = n + 1
    end
    return n
end

--- Appends all array elements of t2 to the end of t1 (t1 is modified in place).
-- Only the sequence part of t2, as seen by ipairs(), is copied.
-- Appending a table to itself is supported and doubles its content.
---- @param t1 Lua table receiving the elements
---- @param t2 Lua table whose array elements are appended
function util.arrayAppend(t1, t2)
    -- Measure the source before writing anything: when t1 and t2 are the
    -- same table, iterating with ipairs() while inserting would chase the
    -- growing array forever.
    local count = 0
    for _ in ipairs(t2) do
        count = count + 1
    end
    for i = 1, count do
        table.insert(t1, t2[i])
    end
end

--- Returns the index within a string of the last occurrence of a character,
-- or -1 if the character does not occur.
-- ch is inserted into a Lua pattern as is, so magic characters must be
-- escaped by the caller (e.g. pass "%." to look for a dot).
---- @string string the string to search in
---- @string ch the character (as a Lua pattern) to look for
---- @treturn int index of the last occurrence, or -1
function util.lastIndexOf(string, ch)
    -- the greedy ".*" pushes the match as far right as possible; the empty
    -- capture "()" reports the position just after it
    local after = string:match(".*" .. ch .. "()")
    if after then
        return after - 1
    end
    return -1
end


--- Splits string into a list of UTF-8 characters.
-- A character is taken to be one lead byte (NUL, ASCII, or \194-\244)
-- followed by any number of continuation bytes (\128-\191). Bytes that fit
-- neither role are skipped.
---- @string text the string to be split.
---- @treturn table list of UTF-8 chars (empty if text is nil)
function util.splitToChars(text)
    local tab = {}
    if text ~= nil then
        local prevcharcode, charcode = 0
        -- string.gmatch is the supported name of the iterator; string.gfind
        -- is a deprecated Lua 5.0 alias that is missing from Lua 5.2+.
        for uchar in string.gmatch(text, "([%z\1-\127\194-\244][\128-\191]*)") do
            charcode = BaseUtil.utf8charcode(uchar)
            -- NOTE(review): a char is kept only when the code returned for
            -- the *previous* char was truthy; presumably utf8charcode()
            -- returns nil for sequences it cannot decode -- confirm that
            -- testing prevcharcode (and not charcode) is intended.
            if prevcharcode then -- utf8
                table.insert(tab, uchar)
            end
            prevcharcode = charcode
        end
    end
    return tab
end

--- Tests whether c is a CJK character.
-- c qualifies when it consists of exactly three bytes: a lead byte in
-- \228-\234 (U+4000 - U+AFFF for well-formed UTF-8), a continuation byte,
-- and any third byte.
---- @string c the character to test
---- @treturn bool true if c is such a character
function util.isCJKChar(c)
    local matched = string.match(c, "[\228-\234][\128-\191].")
    -- the match must cover the whole of c, not just a part of it
    return matched == c
end

--- Tests whether str contains CJK characters.
-- Looks anywhere in str for a three-byte sequence whose lead byte is in
-- \228-\234 and whose second byte is a continuation byte.
---- @string str the string to test
---- @treturn bool true if at least one such sequence is found
function util.hasCJKChar(str)
    if string.match(str, "[\228-\234][\128-\191].") then
        return true
    end
    return false
end

--- Splits text into a list of words, spaces and punctuation.
-- The text is first cut at runs of whitespace/punctuation, which are kept
-- in the list as items of their own. Any resulting word that contains CJK
-- characters is cut further, around its multi-byte sequences.
---- @string text text to split
---- @treturn table list of words, spaces and punctuation
function util.splitToWords(text)
    local words = {}
    for token in util.gsplit(text, "[%s%p]+", true) do
        if not util.hasCJKChar(token) then
            -- plain word, or a run of separators: keep in one piece
            words[#words + 1] = token
        else
            -- isolate the multi-byte sequences found inside the token
            for piece in util.gsplit(token, "[\228-\234\192-\255][\128-\191]+", true) do
                words[#words + 1] = piece
            end
        end
    end
    return words
end

-- Characters that must not start a line when they follow a space:
-- a space is not used as a split point if the next char is one of these,
-- e.g. "word :" or "word )".
-- (In French, a space is written before a colon, and the line had better
-- not be wrapped there.)
-- The string is searched with a plain (non-pattern) find.
local non_splitable_space_tailers = ":;,.!?)]}$%=-+*/|<>»”"
-- Characters that must not end a line when they precede a space:
-- a space is not used as a split point if the previous char is one of these.
local non_splitable_space_leaders = "([{$=-+*/|<>«“"


-- Similar rules exist for CJK text. Taken from :
-- https://en.wikipedia.org/wiki/Line_breaking_rules_in_East_Asian_languages
-- Each table below is the concatenation of per-language character lists.
-- util.isSplitable() searches them with a plain (non-pattern) find, so a
-- character listed for several languages is harmless.

-- Characters checked against the char following a CJK char: no split is
-- allowed before them (they are not permitted at the start of a line).
local cjk_non_splitable_tailers = table.concat( {
    -- Simplified Chinese
    "!%),.:;?]}¢°·’\"†‡›℃∶、。〃〆〕〗〞﹚﹜！＂％＇），．：；？！］｝～",
    -- Traditional Chinese
    "!),.:;?]}¢·–—’\"•、。〆〞〕〉》」︰︱︲︳﹐﹑﹒﹓﹔﹕﹖﹘﹚﹜！），．：；？︶︸︺︼︾﹀﹂﹗］｜｝､",
    -- Japanese
    ")]｝〕〉》」』】〙〗〟’\"｠»ヽヾーァィゥェォッャュョヮヵヶぁぃぅぇぉっゃゅょゎゕゖㇰㇱㇲㇳㇴㇵㇶㇷㇸㇹㇺㇻㇼㇽㇾㇿ々〻‐゠–〜?!‼⁇⁈⁉・、:;,。.",
    -- Korean
    "!%),.:;?]}¢°’\"†‡℃〆〈《「『〕！％），．：；？］｝",
})

-- Characters checked against the char preceding a CJK char: no split is
-- allowed after them (they are not permitted at the end of a line).
local cjk_non_splitable_leaders = table.concat( {
    -- Simplified Chinese
    "$(£¥·‘\"〈《「『【〔〖〝﹙﹛＄（．［｛￡￥",
    -- Traditional Chinese
    "([{£¥‘\"‵〈《「『〔〝︴﹙﹛（｛︵︷︹︻︽︿﹁﹃﹏",
    -- Japanese
    "([｛〔〈《「『【〘〖〝‘\"｟«",
    -- Korean
    "$([{£¥‘\"々〇〉》」〔＄（［｛｠￥￦#",
})

-- Characters that are never used as a split point themselves.
local cjk_non_splitable = table.concat( {
    -- Japanese
    "—…‥〳〴〵",
})

--- Tests whether a line may be split at this char for multi-line rendering.
-- Only CJK chars and the plain space are candidates. The optional
-- neighbouring chars let the line breaking rules veto a candidate.
---- @string c the char to test
---- @string next_c (optional) the char following c
---- @string prev_c (optional) the char preceding c
---- @treturn bool true if the text can be split at c
function util.isSplitable(c, next_c, prev_c)
    if util.isCJKChar(c) then
        -- a CJK char is a word in itself, hence splitable, except...
        if cjk_non_splitable:find(c, 1, true) then
            -- ...for a few chars that never are
            return false
        end
        if next_c and cjk_non_splitable_tailers:find(next_c, 1, true) then
            -- ...when followed by a char not permitted at start of line
            return false
        end
        if prev_c and cjk_non_splitable_leaders:find(prev_c, 1, true) then
            -- ...when preceded by a char not permitted at end of line
            return false
        end
        return true
    end
    if c == " " then
        -- we only split on a space (so punctuation sticks to the previous
        -- word); next_c and prev_c, when given, refine the decision
        if next_c and non_splitable_space_tailers:find(next_c, 1, true) then
            -- the punctuation after this space is better kept with us
            return false
        end
        if prev_c and non_splitable_space_leaders:find(prev_c, 1, true) then
            -- the punctuation before this space is better kept with us
            return false
        end
        return true
    end
    -- anything else is not a split point
    return false
end

--- Gets filesystem type of a path.
-- Looks up, in /proc/mounts, the mount point that contains the path. When
-- several mount points contain it (nested mounts, or just "/"), the longest
-- one wins; for equal lengths the entry listed last wins.
-- Mount points are compared as plain text, never as Lua patterns, so names
-- such as "/mnt/base-us" are matched correctly.
----@string path an absolute path
----@treturn string filesystem type, or nil if /proc/mounts cannot be
-- opened or no mount point contains the path
function util.getFilesystemType(path)
    local mounts = io.open("/proc/mounts", "r")
    if not mounts then return nil end
    local fs_type
    local best_len = -1
    for line in mounts:lines() do
        -- fields of a line: device, mount point, filesystem type, ...
        local mount_point, mount_type = line:match("^%s*%S+%s+(%S+)%s+(%S+)")
        -- lines with fewer than three fields are ignored
        if mount_point then
            local len = #mount_point
            -- the path must start with the mount point, and the mount point
            -- must end on a path component boundary ("/mnt/us" does not
            -- contain "/mnt/usb/file")
            local contains = path:sub(1, len) == mount_point
                and (mount_point == "/"
                    or len == #path
                    or path:sub(len + 1, len + 1) == "/")
            if contains and len >= best_len then
                fs_type = mount_type
                best_len = len
            end
        end
    end
    mounts:close()
    return fs_type
end

--- Replaces characters that are invalid in file names with an underscore.
-- The characters replaced are: \ / : * ? " < > | and also the comma.
-- NOTE(review): the commas inside the character class are literal set
-- members, so commas get replaced as well; this looks unintended, but it
-- is kept because names produced so far depend on it -- confirm.
---- @string str the string to sanitize
---- @treturn string sanitized string (nothing is returned if str is nil or false)
function util.replaceInvalidChars(str)
    if not str then return end
    -- keep the string only: string.gsub also yields a substitution count,
    -- which must not leak to callers as a second return value
    local sanitized = str:gsub('[\\,%/,:,%*,%?,%",%<,%>,%|]','_')
    return sanitized
end

--- Replaces every slash in a string with an underscore.
---- @string str the string to process
---- @treturn string processed string (nothing is returned if str is nil or false)
function util.replaceSlashChar(str)
    if not str then return end
    -- keep the string only: string.gsub also yields a substitution count,
    -- which must not leak to callers as a second return value
    local replaced = str:gsub('%/','_')
    return replaced
end

--- Splits a file into its path and name.
-- The path is everything up to and including the last "/"; the name is
-- whatever follows it. Exactly two values are returned.
---- @string file the file to split
---- @treturn string path, with its trailing "/" ("" if there is none)
---- @treturn string name ("" if file is nil, empty, or ends with "/")
function util.splitFilePathName(file)
    if file == nil or file == "" then return "", "" end
    if string.find(file, "/") == nil then return "", file end
    -- A single anchored match yields both parts (the greedy ".*" runs up
    -- to the last "/") and, unlike string.gsub, no trailing match count.
    local path, name = string.match(file, "^(.*/)(.*)$")
    return path, name
end

--- Splits a file name into its pure file name and suffix.
-- The split is made at the last "."; the dot itself belongs to neither
-- part. Exactly two values are returned.
---- @string file the file name to split
---- @treturn string file name without suffix ("" if file is nil or empty)
---- @treturn string suffix ("" if there is no "." in file)
function util.splitFileNameSuffix(file)
    if file == nil or file == "" then return "", "" end
    if string.find(file, "%.") == nil then return file, "" end
    -- A single anchored match yields both parts (the greedy ".*" runs up
    -- to the last ".") and, unlike string.gsub, no trailing match count.
    local name, suffix = string.match(file, "^(.*)%.(.*)$")
    return name, suffix
end

--- Gets the suffix of a file name.
-- This is the second value returned by util.splitFileNameSuffix().
---- @string file the file name
---- @treturn string suffix
function util.getFileNameSuffix(file)
    -- the outer parentheses keep the selected value only
    return (select(2, util.splitFileNameSuffix(file)))
end

--- Gets the text to display for a menu item.
-- The text comes from item.text_func() when the item has a text_func, and
-- from item.text otherwise. Items with a sub_item_table get a space and a
-- small right-pointing triangle (U+25B8) appended.
---- @param item menu item table
---- @treturn string text of the menu item
function util.getMenuText(item)
    local label
    if not item.text_func then
        label = item.text
    else
        label = item.text_func()
    end
    if item.sub_item_table == nil then
        return label
    end
    return label .. " \226\150\184"
end

-- from http://notebook.kulchenko.com/programming/fixing-malformed-utf8-in-lua with modification
--- Replaces invalid UTF-8 characters with a replacement string.
-- The string is walked one sequence at a time. Well-formed sequences of
-- 1 to 4 bytes are kept (overlong forms, UTF-16 surrogates and code points
-- above U+10FFFF are rejected); any byte that does not start such a
-- sequence is replaced, one byte at a time.
---- @string str the string to be checked for invalid characters
---- @string replacement the string to replace invalid characters with
-- (defaults to U+FFFD, the Unicode replacement character)
---- @treturn string valid UTF-8
function util.fixUtf8(str, replacement)
    if replacement == nil then
        replacement = "\239\191\189"
    end
    local pos = 1
    local len = #str
    -- Pieces of the result are collected here and joined once at the end,
    -- so the string is not rebuilt for every invalid byte.
    local pieces = {}
    local keep_from = 1 -- start of the valid run not yet copied to pieces
    while pos <= len do
        -- Every pattern is anchored with "^", so it is tried at pos only
        -- and never scans the rest of the string.
        local size
        if str:find("^[%z\1-\127]", pos) then
            size = 1
        elseif str:find("^[\194-\223][\128-\191]", pos) then
            size = 2
        elseif str:find(       "^\224[\160-\191][\128-\191]", pos)
            or str:find("^[\225-\236][\128-\191][\128-\191]", pos)
            or str:find(       "^\237[\128-\159][\128-\191]", pos)
            or str:find("^[\238-\239][\128-\191][\128-\191]", pos) then
            size = 3
        elseif str:find(       "^\240[\144-\191][\128-\191][\128-\191]", pos)
            or str:find("^[\241-\243][\128-\191][\128-\191][\128-\191]", pos)
            or str:find(       "^\244[\128-\143][\128-\191][\128-\191]", pos) then
            size = 4
        end
        if size then
            pos = pos + size
        else
            -- invalid byte: flush the valid run before it, then substitute
            pieces[#pieces + 1] = str:sub(keep_from, pos - 1)
            pieces[#pieces + 1] = replacement
            pos = pos + 1
            keep_from = pos
        end
    end
    if #pieces == 0 then
        -- nothing had to be replaced
        return str
    end
    pieces[#pieces + 1] = str:sub(keep_from)
    return table.concat(pieces)
end

return util
doc: add documentation build infrastructure 8 years ago			`--[[--`
Doc: miscellaneous improvements. 7 years ago			`This module contains miscellaneous helper functions for the KOReader frontend.`
textboxwidget(fix): handle onHoldWord event 8 years ago			`]]`
doc: add documentation build infrastructure 8 years ago
textboxwidget(fix): handle onHoldWord event 8 years ago			`local BaseUtil = require("ffi/util")`
strip punctuations around word before searching This should fix #1337. 9 years ago			`local util = {}`

Doc: miscellaneous improvements. 7 years ago			`--- Strips all punctuation and spaces from a string.`
textboxwidget(fix): handle onHoldWord event 8 years ago			`---- @string text the string to be stripped`
			`---- @treturn string stripped text`
			`function util.stripePunctuations(text)`
			`if not text then return end`
			`-- strip ASCII punctuation characters around text`
			`-- and strip any generic punctuation (U+2000 - U+206F) in the text`
			`return text:gsub("\226[\128-\131][\128-\191]", ''):gsub("^%p+", ''):gsub("%p+$", '')`
strip punctuations around word before searching This should fix #1337. 9 years ago			`end`

util: add some LDoc descriptions 7 years ago			`--- Splits a string by a pattern`
			`--[[--`
Refactor out string.gsplit to util.gsplit 9 years ago			`Lua doesn't have a string.split() function and most of the time`
			`you don't really need it because string.gmatch() is enough.`
			`However string.gmatch() has one significant disadvantage for me:`
			`You can't split a string while matching both the delimited`
			`strings and the delimiters themselves without tracking positions`
			`and substrings. The gsplit function below takes care of`
			`this problem.`
			`Author: Peter Odding`
			`License: MIT/X11`
			`Source: http://snippets.luacode.org/snippets/String_splitting_130`
util: add some LDoc descriptions 7 years ago			`]]`
			`----@string str string to split`
			`----@param pattern the pattern to split against`
			`----@bool capture`
Refactor out string.gsplit to util.gsplit 9 years ago			`function util.gsplit(str, pattern, capture)`
			`pattern = pattern and tostring(pattern) or '%s+'`
			`if (''):find(pattern) then`
			`error('pattern matches empty string!', 2)`
			`end`
			`return coroutine.wrap(function()`
			`local index = 1`
			`repeat`
			`local first, last = str:find(pattern, index)`
			`if first and last then`
			`if index < first then`
			`coroutine.yield(str:sub(index, first - 1))`
			`end`
			`if capture then`
			`coroutine.yield(str:sub(first, last))`
			`end`
			`index = last + 1`
			`else`
			`if index <= #str then`
			`coroutine.yield(str:sub(index))`
			`end`
			`break`
			`end`
			`until index > #str`
			`end)`
			`end`

util: add some LDoc descriptions 7 years ago			`--- Converts seconds to a clock string.`
			`-- Source: https://gist.github.com/jesseadams/791673`
			`---- @int seconds number of seconds`
			`---- @bool withoutSeconds if true 00:00, if false 00:00:00`
			`---- @treturn string clock string in the form of 00:00 or 00:00:00`
minor: no need to override function arg with local 8 years ago			`function util.secondsToClock(seconds, withoutSeconds)`
			`seconds = tonumber(seconds)`
#1723 Add time to read into the status bar Add new statuses: TB - book time to read TC - chapter time to read Fix backward compatible in statistics plugin 9 years ago			`if seconds == 0 or seconds ~= seconds then`
			`if withoutSeconds then`
			`return "00:00";`
			`else`
			`return "00:00:00";`
			`end`
			`else`
			`local hours = string.format("%02.f", math.floor(seconds / 3600));`
			`local mins = string.format("%02.f", math.floor(seconds / 60 - (hours * 60)));`
			`if withoutSeconds then`
			`return hours .. ":" .. mins`
			`end`
			`local secs = string.format("%02.f", math.floor(seconds - hours * 3600 - mins * 60));`
			`return hours .. ":" .. mins .. ":" .. secs`
			`end`
			`end`

doc: add documentation build infrastructure 8 years ago			`--- Returns number of keys in a table.`
			`---- @param T Lua table`
textboxwidget(fix): handle onHoldWord event 8 years ago			`---- @treturn int number of keys in table T`
style(util): rename tablelength to tableSize 8 years ago			`function util.tableSize(T)`
#1723 Add time to read into the status bar Add new statuses: TB - book time to read TC - chapter time to read Fix backward compatible in statistics plugin 9 years ago			`local count = 0`
			`for _ in pairs(T) do count = count + 1 end`
			`return count`
			`end`

feat(util): add array.Append helper 8 years ago			`-- append all elements from t2 into t1`
			`function util.arrayAppend(t1, t2)`
#1710 FR: Add support of statistics plugin for pdf 8 years ago			`for _, v in ipairs(t2) do`
feat(util): add array.Append helper 8 years ago			`table.insert(t1, v)`
			`end`
			`end`

#1710 FR: Add support of statistics plugin for pdf 8 years ago			`-- Returns the index within this string of the last occurrence of the specified character`
			`-- or -1 if the character does not occur.`
			`-- To find . you need to escape it.`
			`function util.lastIndexOf(string, ch)`
			`local i = string:match(".*" .. ch .. "()")`
			`if i == nil then return -1 else return i - 1 end`
			`end`

add cursor functionality 8 years ago
Doc: miscellaneous improvements. 7 years ago			`--- Splits string into a list of UTF-8 characters.`
			`---- @string text the string to be split.`
textboxwidget(fix): handle onHoldWord event 8 years ago			`---- @treturn table list of UTF-8 chars`
fix function util.splitToChars in frontend/util.lua 8 years ago			`function util.splitToChars(text)`
			`local tab = {}`
			`if text ~= nil then`
			`local prevcharcode, charcode = 0`
			`for uchar in string.gfind(text, "([%z\1-\127\194-\244][\128-\191]*)") do`
			`charcode = BaseUtil.utf8charcode(uchar)`
			`if prevcharcode then -- utf8`
			`table.insert(tab, uchar)`
			`end`
			`prevcharcode = charcode`
add cursor functionality 8 years ago			`end`
			`end`
fix function util.splitToChars in frontend/util.lua 8 years ago			`return tab`
add cursor functionality 8 years ago			`end`

Doc: miscellaneous improvements. 7 years ago			`-- Tests whether c is a CJK character`
PR #2356 breaks CJK character splitting 8 years ago			`function util.isCJKChar(c)`
			`return string.match(c, "[\228-\234][\128-\191].") == c`
			`end`

			`-- Test whether str contains CJK characters`
			`function util.hasCJKChar(str)`
			`return string.match(str, "[\228-\234][\128-\191].") ~= nil`
			`end`

Doc: miscellaneous improvements. 7 years ago			`--- Split texts into a list of words, spaces and punctuation.`
textboxwidget(fix): handle onHoldWord event 8 years ago			`---- @string text text to split`
Doc: miscellaneous improvements. 7 years ago			`---- @treturn table list of words, spaces and punctuation`
textboxwidget(fix): handle onHoldWord event 8 years ago			`function util.splitToWords(text)`
			`local wlist = {}`
split accient greek words with spacing character This should fix #1705. 8 years ago			`for word in util.gsplit(text, "[%s%p]+", true) do`
			`-- if space splitted word contains CJK characters`
PR #2356 breaks CJK character splitting 8 years ago			`if util.hasCJKChar(word) then`
split accient greek words with spacing character This should fix #1705. 8 years ago			`-- split with CJK characters`
			`for char in util.gsplit(word, "[\228-\234\192-\255][\128-\191]+", true) do`
			`table.insert(wlist, char)`
			`end`
			`else`
textboxwidget(fix): handle onHoldWord event 8 years ago			`table.insert(wlist, word)`
			`end`
			`end`
			`return wlist`
			`end`

textboxwidget and scrolltextwidget enhancements (#2393) util: made isSplitable() accept an optional next_char for wiser decision textboxwidget: speed up rendering, enhanced text wrapping, allow selection of multiple words with Hold. scrolltextwidget: allow scrolling with Tap. Details in #2393 7 years ago			`-- We don't want to split on a space if it is followed by some`
			`-- specific punctuation : e.g. "word :" or "word )"`
			`-- (In french, there is a space before a colon, and it better`
			`-- not be wrapped there.)`
textboxwidget: even better text wrapping util.isSplitable() accepts now also the previous char to help decide if a space can be used to split a line. TextBoxWidget:_splitCharWidthList() : simplified logic 7 years ago			`local non_splitable_space_tailers = ":;,.!?)]}$%=-+*/\|<>»”"`
			`-- Same if a space has some specific other punctuation before it`
			`local non_splitable_space_leaders = "([{$=-+*/\|<>«“"`
textboxwidget and scrolltextwidget enhancements (#2393) util: made isSplitable() accept an optional next_char for wiser decision textboxwidget: speed up rendering, enhanced text wrapping, allow selection of multiple words with Hold. scrolltextwidget: allow scrolling with Tap. Details in #2393 7 years ago
textboxwidget: enhanced CJK text wrapping (changes only in util.isSplitable(), but used by textboxwidget) Implemented line breaking rules from : https://en.wikipedia.org/wiki/Line_breaking_rules_in_East_Asian_languages 7 years ago
			`-- Similar rules exist for CJK text. Taken from :`
			`-- https://en.wikipedia.org/wiki/Line_breaking_rules_in_East_Asian_languages`

			`local cjk_non_splitable_tailers = table.concat( {`
			`-- Simplified Chinese`
			`"!%),.:;?]}¢°·’\"†‡›℃∶、。〃〆〕〗〞﹚﹜！＂％＇），．：；？！］｝～",`
			`-- Traditional Chinese`
			`"!),.:;?]}¢·–—’\"•、。〆〞〕〉》」︰︱︲︳﹐﹑﹒﹓﹔﹕﹖﹘﹚﹜！），．：；？︶︸︺︼︾﹀﹂﹗］｜｝､",`
			`-- Japanese`
			`")]｝〕〉》」』】〙〗〟’\"｠»ヽヾーァィゥェォッャュョヮヵヶぁぃぅぇぉっゃゅょゎゕゖㇰㇱㇲㇳㇴㇵㇶㇷㇸㇹㇺㇻㇼㇽㇾㇿ々〻‐゠–〜?!‼⁇⁈⁉・、:;,。.",`
			`-- Korean`
			`"!%),.:;?]}¢°’\"†‡℃〆〈《「『〕！％），．：；？］｝",`
			`})`

			`local cjk_non_splitable_leaders = table.concat( {`
			`-- Simplified Chinese`
			`"$(£¥·‘\"〈《「『【〔〖〝﹙﹛＄（．［｛￡￥",`
			`-- Traditional Chinese`
			`"([{£¥‘\"‵〈《「『〔〝︴﹙﹛（｛︵︷︹︻︽︿﹁﹃﹏",`
			`-- Japanese`
			`"([｛〔〈《「『【〘〖〝‘\"｟«",`
			`-- Korean`
			`"$([{£¥‘\"々〇〉》」〔＄（［｛｠￥￦#",`
			`})`

			`local cjk_non_splitable = table.concat( {`
			`-- Japanese`
			`"—…‥〳〴〵",`
			`})`

textboxwidget and scrolltextwidget enhancements (#2393) util: made isSplitable() accept an optional next_char for wiser decision textboxwidget: speed up rendering, enhanced text wrapping, allow selection of multiple words with Hold. scrolltextwidget: allow scrolling with Tap. Details in #2393 7 years ago			`-- Test whether a string could be separated by this char for multi-line rendering`
textboxwidget: even better text wrapping util.isSplitable() accepts now also the previous char to help decide if a space can be used to split a line. TextBoxWidget:_splitCharWidthList() : simplified logic 7 years ago			`-- Optional next or prev chars may be provided to help make the decision`
			`function util.isSplitable(c, next_c, prev_c)`
textboxwidget and scrolltextwidget enhancements (#2393) util: made isSplitable() accept an optional next_char for wiser decision textboxwidget: speed up rendering, enhanced text wrapping, allow selection of multiple words with Hold. scrolltextwidget: allow scrolling with Tap. Details in #2393 7 years ago			`if util.isCJKChar(c) then`
			`-- a CJKChar is a word in itself, and so is splitable`
textboxwidget: enhanced CJK text wrapping (changes only in util.isSplitable(), but used by textboxwidget) Implemented line breaking rules from : https://en.wikipedia.org/wiki/Line_breaking_rules_in_East_Asian_languages 7 years ago			`if cjk_non_splitable:find(c, 1, true) then`
			`-- except a few of them`
			`return false`
			`elseif next_c and cjk_non_splitable_tailers:find(next_c, 1, true) then`
			`-- but followed by a char that is not permitted at start of line`
			`return false`
			`elseif prev_c and cjk_non_splitable_leaders:find(prev_c, 1, true) then`
			`-- but preceded by a char that is not permitted at end of line`
			`return false`
			`else`
			`-- we can split on this CJKchar`
			`return true`
			`end`
textboxwidget and scrolltextwidget enhancements (#2393) util: made isSplitable() accept an optional next_char for wiser decision textboxwidget: speed up rendering, enhanced text wrapping, allow selection of multiple words with Hold. scrolltextwidget: allow scrolling with Tap. Details in #2393 7 years ago			`elseif c == " " then`
			`-- we only split on a space (so punctuation sticks to prev word)`
textboxwidget: even better text wrapping util.isSplitable() accepts now also the previous char to help decide if a space can be used to split a line. TextBoxWidget:_splitCharWidthList() : simplified logic 7 years ago			`-- if next_c or prev_c is provided, we can make a better decision`
textboxwidget and scrolltextwidget enhancements (#2393) util: made isSplitable() accept an optional next_char for wiser decision textboxwidget: speed up rendering, enhanced text wrapping, allow selection of multiple words with Hold. scrolltextwidget: allow scrolling with Tap. Details in #2393 7 years ago			`if next_c and non_splitable_space_tailers:find(next_c, 1, true) then`
textboxwidget: even better text wrapping util.isSplitable() accepts now also the previous char to help decide if a space can be used to split a line. TextBoxWidget:_splitCharWidthList() : simplified logic 7 years ago			`-- this space is followed by some punctuation that is better kept with us`
			`return false`
			`elseif prev_c and non_splitable_space_leaders:find(prev_c, 1, true) then`
			`-- this space is lead by some punctuation that is better kept with us`
textboxwidget and scrolltextwidget enhancements (#2393) util: made isSplitable() accept an optional next_char for wiser decision textboxwidget: speed up rendering, enhanced text wrapping, allow selection of multiple words with Hold. scrolltextwidget: allow scrolling with Tap. Details in #2393 7 years ago			`return false`
			`else`
			`-- we can split on this space`
			`return true`
			`end`
			`end`
			`-- otherwise, non splitable`
			`return false`
add cursor functionality 8 years ago			`end`

util: add some LDoc descriptions 7 years ago			`--- Gets filesystem type of a path`
			`-- Checks if the path occurs in /proc/mounts`
			`----@string path an absolute path`
Sanitize filename for vfat, fix #2433 (#2464) 7 years ago			`function util.getFilesystemType(path)`
			`local mounts = io.open("/proc/mounts", "r")`
			`if not mounts then return nil end`
			`local type`
			`while true do`
			`local line`
			`local mount = {}`
			`line = mounts:read()`
			`if line == nil then`
			`break`
			`end`
			`for param in line:gmatch("%S+") do table.insert(mount, param) end`
			`if string.match(path, mount[2]) then`
			`type = mount[3]`
			`if mount[2] ~= '/' then`
			`break`
			`end`
			`end`
			`end`
			`mounts:close()`
			`return type`
			`end`

			`function util.replaceInvalidChars(str)`
Fix crash when downloading books with unknown characters in title (#2628) 7 years ago			`if str then`
Added util.fixUtf8 (#2704) * Remove invalid UTF-8 chars from OPDS * add unit tests 7 years ago			`return str:gsub('[\\,%/,:,%*,%?,%",%<,%>,%\|]','_')`
Fix crash when downloading books with unknown characters in title (#2628) 7 years ago			`end`
Sanitize filename for vfat, fix #2433 (#2464) 7 years ago			`end`

			`function util.replaceSlashChar(str)`
Fix crash when downloading books with unknown characters in title (#2628) 7 years ago			`if str then`
Added util.fixUtf8 (#2704) * Remove invalid UTF-8 chars from OPDS * add unit tests 7 years ago			`return str:gsub('%/','_')`
Fix crash when downloading books with unknown characters in title (#2628) 7 years ago			`end`
Sanitize filename for vfat, fix #2433 (#2464) 7 years ago			`end`

evernote: ReadHistory integration and text file output (#2498) 7 years ago			`-- Split a file into its path and name`
			`function util.splitFilePathName(file)`
			`if file == nil or file == "" then return "", "" end`
			`if string.find(file, "/") == nil then return "", file end`
			`return string.gsub(file, "(./)(.)", "%1"), string.gsub(file, ".*/", "")`
			`end`

			`-- Split a file name into its pure file name and suffix`
			`function util.splitFileNameSuffix(file)`
			`if file == nil or file == "" then return "", "" end`
			`if string.find(file, "%.") == nil then return file, "" end`
			`return string.gsub(file, "(.)%.(.)", "%1"), string.gsub(file, ".*%.", "")`
			`end`

More sorting orders in file manager (#2535) 7 years ago			`function util.getFileNameSuffix(file)`
			`local _, suffix = util.splitFileNameSuffix(file)`
			`return suffix`
			`end`

Resolve review comments 7 years ago			`function util.getMenuText(item)`
			`local text`
			`if item.text_func then`
			`text = item.text_func()`
			`else`
			`text = item.text`
			`end`
			`if item.sub_item_table ~= nil then`
Use small triangle 7 years ago			`text = text .. " \226\150\184"`
Resolve review comments 7 years ago			`end`
			`return text`
			`end`

Added util.fixUtf8 (#2704) * Remove invalid UTF-8 chars from OPDS * add unit tests 7 years ago			`-- from http://notebook.kulchenko.com/programming/fixing-malformed-utf8-in-lua with modification`
			`--- Replaces invalid UTF-8 characters with a replacement string.`
			`---- @string str the string to be checked for invalid characters`
			`---- @string replacement the string to replace invalid characters with`
			`---- @treturn string valid UTF-8`
			`function util.fixUtf8(str, replacement)`
			`local pos = 1`
			`local len = #str`
			`while pos <= len do`
			`if pos == str:find("[%z\1-\127]", pos) then pos = pos + 1`
			`elseif pos == str:find("[\194-\223][\128-\191]", pos) then pos = pos + 2`
			`elseif pos == str:find( "\224[\160-\191][\128-\191]", pos)`
			`or pos == str:find("[\225-\236][\128-\191][\128-\191]", pos)`
			`or pos == str:find( "\237[\128-\159][\128-\191]", pos)`
			`or pos == str:find("[\238-\239][\128-\191][\128-\191]", pos) then pos = pos + 3`
			`elseif pos == str:find( "\240[\144-\191][\128-\191][\128-\191]", pos)`
			`or pos == str:find("[\241-\243][\128-\191][\128-\191][\128-\191]", pos)`
			`or pos == str:find( "\244[\128-\143][\128-\191][\128-\191]", pos) then pos = pos + 4`
			`else`
			`str = str:sub(1, pos - 1) .. replacement .. str:sub(pos + 1)`
			`pos = pos + #replacement`
			`len = len + #replacement - 1`
			`end`
			`end`
			`return str`
			`end`

strip punctuations around word before searching This should fix #1337. 9 years ago			`return util`