X-Git-Url: http://git.osdn.jp/view?a=blobdiff_plain;f=src%2Fltj-inputbuf.lua;h=f97f966039b45ca90cad037765bfae36b2e27801;hb=cf51a2259a27eeed9a3d5d0c40c767a5e6bc403e;hp=6032b5067bf43228f043cf86da6c203eda769adf;hpb=09c86f04a588a4a2b50d8c86868e8ed7d834f53c;p=luatex-ja%2Fluatexja.git diff --git a/src/ltj-inputbuf.lua b/src/ltj-inputbuf.lua index 6032b50..f97f966 100644 --- a/src/ltj-inputbuf.lua +++ b/src/ltj-inputbuf.lua @@ -1,24 +1,18 @@ -- --- luatexja/inputbuf.lua +-- luatexja/ltj-inputbuf.lua -- -luatexbase.provides_module({ - name = 'luatexja.inputbuf', - date = '2011/04/01', - version = '0.1', - description = 'Supressing a space by newline after Japanese characters', -}) -module('luatexja.inputbuf', package.seeall) -local err, warn, info, log = luatexbase.errwarinf(_NAME) luatexja.load_module('charrange'); local ltjc = luatexja.charrange +local utf = unicode.utf8 local node_new = node.new local id_glyph = node.id('glyph') local getcatcode = tex.getcatcode +local ltjc_is_ucs_in_japanese_char = ltjc.is_ucs_in_japanese_char --- the following function is modified from jafontspec.lua (by K. Maeda). --- Instead of "%", we use U+FFFFF for suppressing spaces. -function add_comment(buffer) +local function add_comment(buffer) local i = utf.len(buffer) while (i>0) and (getcatcode(utf.byte(buffer, i))==1 or getcatcode(utf.byte(buffer, i))==2) do @@ -26,18 +20,20 @@ function add_comment(buffer) end if i>0 then local c = utf.byte(buffer, i) - local ct = getcatcode(c) - local te = tex.endlinechar - local ctl = (te ~= -1) and (getcatcode(te)==5) and (getcatcode(0xFFFFF)==14) - -- Is the catcode of endline character is 5 (end-of-line)? - -- Is the catcode of U+FFFFF (new comment char) is 14 (comment)? - if ((ct==11) or (ct==12)) and ctl then - local p = node_new(id_glyph) - p.char = c - if ltjc.is_ucs_in_japanese_char(p) then - buffer = buffer .. string.char(0xF3,0xBF,0xBF,0xBF) -- U+FFFFF + if c>0x80 then + local ct = getcatcode(c) + local te = tex.endlinechar + local ctl = (te ~= -1) and (getcatcode(te)==5) and (getcatcode(0xFFFFF)==14) + -- Is the catcode of endline character is 5 (end-of-line)? + -- Is the catcode of U+FFFFF (new comment char) is 14 (comment)? + if ((ct==11) or (ct==12)) and ctl then + local p = node_new(id_glyph) + p.char = c + if ltjc_is_ucs_in_japanese_char(p) then + buffer = buffer .. string.char(0xF3,0xBF,0xBF,0xBF) -- U+FFFFF + end + node.free(p) end - node.free(p) end end return buffer