rime-ice/lua/unicode.lua

-- Unicode
-- 复制自： https://github.com/shewer/librime-lua-script/blob/main/lua/component/unicode.lua
-- 示例：输入 U62fc 得到「拼」
-- 触发前缀默认为 recognizer/patterns/unicode 的第 2 个字符，即 U
-- 2024.02.26: 限定编码最大值
-- 2024.06.01: 部分变量初始化，条件语句调整。

-- Config key whose regex value carries the trigger prefix for this translator.
local path = 'recognizer/patterns/unicode'

--- Translator that turns "<prefix><hex digits>" input into Unicode candidates.
-- Example: with prefix "U", the input "U62fc" yields the character U+62FC.
-- For code points below 0x10000 it additionally yields the 16 characters
-- obtained by appending one more hex digit (code * 16 + 0 .. 15).
-- Candidates are emitted through the global `yield`; nothing is returned.
-- @param input string  the raw input text of the segment
-- @param seg   segment object; must answer has_tag() and expose start/_end
-- @param env   per-component environment; `unicode_keyword` is cached on it
local function unicode(input, seg, env)
    if not seg:has_tag("unicode") or input == '' then return end

    -- Use the 2nd character of recognizer/patterns/unicode as the trigger
    -- prefix. get_string(path) may return nil, hence the "UU" fallback
    -- (which makes the prefix "U").
    if not env.unicode_keyword then
        local pattern = env.engine.schema.config:get_string(path) or "UU"
        env.unicode_keyword = pattern:sub(2, 2)
    end

    local ucodestr = input:match(env.unicode_keyword .. "(%x+)")
    -- At least two hex digits are required before anything is offered.
    if not ucodestr or #ucodestr < 2 then return end

    -- Count the hex digits that remain after stripping leading zeros. More
    -- than 6 always exceeds 0x10FFFF. This must be checked on the string:
    -- with integer arithmetic tonumber(s, 16) can wrap around on very long
    -- inputs, producing a negative or small bogus value that would slip past
    -- a purely numeric range check and make utf8.char fail or lie.
    local significant = ucodestr:gsub("^0+", "")
    local code = #significant <= 6 and tonumber(ucodestr, 16) or nil
    if not code or code > 0x10FFFF then
        yield(Candidate("unicode", seg.start, seg._end, "数值超限！", ""))
        return
    end

    -- The exact code point that was typed.
    yield(Candidate("unicode", seg.start, seg._end, utf8.char(code), string.format("U%x", code)))

    -- Preview of every code point reachable by typing one more hex digit.
    -- code < 0x10000 keeps code * 16 + 15 at or below 0xFFFFF.
    if code < 0x10000 then
        for i = 0, 15 do
            local extended = utf8.char(code * 16 + i)
            yield(Candidate("unicode", seg.start, seg._end, extended, string.format("U%x~%x", code, i)))
        end
    end
end

-- The chunk's return value is the translator function itself.
return unicode
refactor: Lua 模块化删除 `rime.lua`，拆分到 `lua/` 文件夹内。方案中的 `- lua_xxx@xxx` 修改为 `- lua_xxx@*xxx`（加一个星号）。 2023-05-04 19:41:21 +02:00			`-- Unicode`
			`-- 复制自： https://github.com/shewer/librime-lua-script/blob/main/lua/component/unicode.lua`
feat: translator 改成自动读取 recognizer/patterns 配置来获取触发前缀 close #615 2024-01-14 16:58:37 +01:00			`-- 示例：输入 U62fc 得到「拼」`
			`-- 触发前缀默认为 recognizer/patterns/unicode 的第 2 个字符，即 U`
dict: 槛（jian 栏杆、圈） (#705) lua：Unicode.lua 添加数值超限警告，防止 error 产生 2024-02-26 16:53:18 +01:00			`-- 2024.02.26: 限定编码最大值`
chore: some adjustments for unicode.lua (#898) * Update unicode.lua 1. config:get_string() 可能取得 nil , 增加預設字串 2. seg:has_tag() , input == "" 提前判斷，可以避免 patterns 未設定的問題 * trim and add change log --------- Co-authored-by: mirtlecn <mirtle.cn+github@outlook.com> 2024-06-01 15:29:27 +02:00			`-- 2024.06.01: 部分变量初始化，条件语句调整。`

			`local path = 'recognizer/patterns/unicode'`
refactor: Lua 模块化删除 `rime.lua`，拆分到 `lua/` 文件夹内。方案中的 `- lua_xxx@xxx` 修改为 `- lua_xxx@*xxx`（加一个星号）。 2023-05-04 19:41:21 +02:00			`local function unicode(input, seg, env)`
chore: some adjustments for unicode.lua (#898) * Update unicode.lua 1. config:get_string() 可能取得 nil , 增加預設字串 2. seg:has_tag() , input == "" 提前判斷，可以避免 patterns 未設定的問題 * trim and add change log --------- Co-authored-by: mirtlecn <mirtle.cn+github@outlook.com> 2024-06-01 15:29:27 +02:00			`if not seg:has_tag("unicode") or input == '' then return end`
style: Lua 统一缩进 4 空格 2024-02-08 11:39:49 +01:00			`-- 获取 recognizer/patterns/unicode 的第 2 个字符作为触发前缀`
chore: some adjustments for unicode.lua (#898) * Update unicode.lua 1. config:get_string() 可能取得 nil , 增加預設字串 2. seg:has_tag() , input == "" 提前判斷，可以避免 patterns 未設定的問題 * trim and add change log --------- Co-authored-by: mirtlecn <mirtle.cn+github@outlook.com> 2024-06-01 15:29:27 +02:00			`-- config:get_string(path) 可能取得 nil 造成error`
			`if not env.unicode_keyword then`
			`local pattern = env.engine.schema.config:get_string(path) or "UU"`
			`env.unicode_keyword = pattern:sub(2,2)`
			`end`

			`local ucodestr = input:match(env.unicode_keyword .. "(%x+)")`
			`if ucodestr and #ucodestr > 1 then`
			`local code = tonumber(ucodestr, 16)`
			`if code > 0x10FFFF then`
			`yield(Candidate("unicode", seg.start, seg._end, "数值超限！", ""))`
			`return`
			`end`
			`local text = utf8.char(code)`
			`yield(Candidate("unicode", seg.start, seg._end, text, string.format("U%x", code)))`
			`if code < 0x10000 then`
			`for i = 0, 15 do`
			`local text = utf8.char(code * 16 + i)`
			`yield(Candidate("unicode", seg.start, seg._end, text, string.format("U%x~%x", code, i)))`
			`end`
style: Lua 统一缩进 4 空格 2024-02-08 11:39:49 +01:00			`end`
			`end`
refactor: Lua 模块化删除 `rime.lua`，拆分到 `lua/` 文件夹内。方案中的 `- lua_xxx@xxx` 修改为 `- lua_xxx@*xxx`（加一个星号）。 2023-05-04 19:41:21 +02:00			`end`

			`return unicode`