Hi folks !
I have just finished a first draft of pret-xml.lua:
- I need to improve its coverage (html);
- DTD declaration is not yet managed;
- I do nothing about re-indentation since I prefer to format my xml
sample by myself (by hand or using xmllint);
- That's my first try to lua/luatex (after several months of Java...) so
my definitions (esp. for functions) is not clean at all (you have been
warned);
I have done it the "trial/error" way without much design reflexion just
for fun (I'm on vacation)... I'm not sure it will be reusable...
Take all your test files and please report issues (or give me advices)! ;)
Thank you Matthijs!
Regards,
Renaud
Matthijs Kooijman a écrit :
Hey all,
./tex/texmf-context/tex/context/base/verb-.*\.lua !
Actually, in newer versions (since a month or so), that's pret-*.lua.
Where to start with this topic (current state in Mark IV, roadmap, ...) ?
I've been struggling with this a bit as well lately and found there was next
to no documentation. I've managed to create my own pretty printer, and tried
to update the docs a bit. See [1] and [2] on the wiki for more info. There are
still some details I don't get (why is there a line() hook, what is all this
nesting stuff, etc.), so feel free to find out more and improve these pages!
Gr.
Matthijs
[1]: http://wiki.contextgarden.net/Verbatim_text#Your_own_formatter
[2]: http://wiki.contextgarden.net/Custom_pretty_printer
------------------------------------------------------------------------
___________________________________________________________________________________
If your question is of interest to others as well, please add an entry to the
Wiki!
maillist : ntg-context@ntg.nl / http://www.ntg.nl/mailman/listinfo/ntg-context
webpage : http://www.pragma-ade.nl / http://tex.aanhet.net
archive : https://foundry.supelec.fr/projects/contextrev/
wiki : http://contextgarden.net
___________________________________________________________________________________
if not modules then modules = { } end modules ['pret-xml'] = {
version = 1.001,
comment = "from pret-.*\.lua, http://wiki.contextgarden.net/Verbatim_text#Your_own_formatter and http://wiki.contextgarden.net/Custom_pretty_printer",
author = "Renaud AUBIN",
copyright = "to be defined",
license = "to be defined"
}
local utf = unicode.utf8
local utfcharacters, utfvalues = string.utfcharacters, string.utfvalues
local utfbyte, utffind = utf.byte, utf.find
local byte, sub, find, gfind, match = string.byte, string.sub, string.find, string.gfind, string.match
local texsprint, texwrite = tex.sprint, tex.write
local ctxcatcodes = tex.ctxcatcodes
local change_state, finish_state = buffers.change_state, buffers.finish_state
buffers.visualizers.xml = buffers.visualizers.xml or { }
buffers.visualizers.xml.identifiers = buffers.visualizers.xml.identifiers or { }
incomment = false
local colors = {
"prettyone",
"prettytwo",
"prettythree",
"prettyfour",
"prettyfive",
"prettysix",
"prettyseven"
}
local states = {
['namespace'] = 1,
['element'] = 2,
['attrname'] = 3,
['attrvalue'] = 4,
['prolog'] = 5,
['comment'] = 6,
['pi'] = 7
}
local function flush_text(str)
for c in utfcharacters(str) do
if c == " " then texsprint(ctxcatcodes,"\\obs") else texwrite(c) end
end
end
local function process_attribute(str)
local name, value, state = "", "", 0
buffers.currentcolors = colors
local name,value = match(str,"^(.-)=(\".-\")$")
state = change_state(states['attrname'], state)
flush_text(name)
state = finish_state(state)
texwrite("=")
state = change_state(states['attrvalue'], state)
flush_text(value)
state = finish_state(state)
end
local function process_namespace(str)
local state = 0
buffers.currentcolors = colors
state = change_state(states['namespace'], state)
flush_text(str)
state = finish_state(state)
texwrite(":")
end
local function process_element(str)
local state = 0
buffers.currentcolors = colors
state = change_state(states['element'], state)
flush_text(str)
state = finish_state(state)
end
local function process_comment(str)
local state = 0
buffers.currentcolors = colors
state = change_state(states['comment'], state)
flush_text(str)
state = finish_state(state)
end
function process_tag(str)
local name, value, state = "", "", 0
buffers.currentcolors = colors
if match(str,"^<%?xml.-%?>$") then
local prolog = match(str,"^<%?xml(.-)%?>$")
state = change_state(states['pi'], state)
texwrite("<?")
state = finish_state(state)
state = change_state(states['prolog'], state)
texwrite("xml")
state = finish_state(state)
repeat prolog=recursive_processing(prolog) until prolog==nil
state = change_state(states['pi'], state)
texwrite("?>")
state = finish_state(state)
elseif match(str,"^<!%-%-.-%-%->$") then
process_comment(str)
elseif match(str,"^<[%a_]%w-%s*/?>$") or match(str,"^</?[%a_]%w-%s*>$") then
local btag, name, etag = match(str,"^(</?)([%a_]%w-%s*)(/?>)$")
texwrite(btag)
process_element(name)
texwrite(etag)
elseif match(str,"^<%a%w-:[%a_]%w-%s*/?>$") or match(str,"^</?%a%w-:[%a_]%w-%s*>$") then
local btag, ns, name, etag = match(str,"^(</?)(%a%w-):([%a_]%w-%s*)(/?>)$")
texwrite(btag)
process_namespace(ns)
process_element(name)
texwrite(etag)
elseif match(str,"^<%a%w-:[%a_][%w%-]-%s.*/?>$") or match(str,"^</?%a%w-:[%a_][%w%-]-%s.*>$") then
local btag, ns, name, attributes, etag = match(str,"^(</?)(%a%w-):([%a_][%w%-]-%s)(.*)(/?>)$")
texwrite(btag)
process_namespace(ns)
process_element(name)
repeat attributes=recursive_processing(attributes) until attributes==nil
texwrite(etag)
elseif match(str,"^<[%a_]%w-%s.*/?>$") or match(str,"^</?[%a_]%w-%s.*>$") then
local btag, name, attributes, etag = match(str,"^(</?)([%a_]%w-%s)(.*)(/?>)$")
texwrite(btag)
process_element(name)
repeat attributes=recursive_processing(attributes) until attributes==nil
texwrite(etag)
end
end
function process_uncomplete_starttag(str)
local name, value, state = "", "", 0
buffers.currentcolors = colors
if match(str,"^<%a%w-:[%a_]%w-%s.*$") then
local btag, ns, name, attributes = match(str,"^(<)(%a%w-):([%a_]%w-%s)(.*)$")
texwrite(btag)
process_namespace(ns)
process_element(name)
repeat attributes=recursive_processing(attributes) until attributes==nil
elseif match(str,"^<[%a_]%w-%s.*$") then
local btag, name, attributes = match(str,"^(<)([%a_]%w-%s)(.*)$")
texwrite(btag)
process_element(name)
repeat attributes=recursive_processing(attributes) until attributes==nil
end
end
function recursive_processing(str)
local first, second, third, attribute = "", "", "", ""
if match(str, "^(.-)(%-%->)(.*)$") then
-- stop multiline comment
first, second, third = match(str, "^(.-)(%-%->)(.*)$")
process_comment(first..second)
incomment = false
return third
elseif incomment then
process_comment(str)
elseif match(str, "^(.-)(%b<>)(.*)$") then
-- standard tag
first, second, third = match(str, "^(.-)(%b<>)(.*)$")
repeat first=recursive_processing(first) until first==nil
process_tag(second)
return third
elseif match(str, "^(.-)(<[%a_]%w-:?%w-[%s%c])(.*)$") then
-- multiline starttag
first, second, third = match(str, "^(.-)(<[%a_]%w-:?%w-[%s%c])(.*)$")
repeat first=recursive_processing(first) until first==nil
process_uncomplete_starttag(second)
return third
-- elseif match(str, "^(.-)(<%?xml)(.*)$") then
-- TODO manage multiline prolog
-- first, second, third = match(str, "^(.-)(<%?xml)(.*)$")
-- return third
elseif match(str, "^(.-)(<!%-%-)(.*)$") then
-- start multiline comment
first, second, third = match(str, "^(.-)(<!%-%-)(.*)$")
repeat first=recursive_processing(first) until first==nil
process_comment(second..third)
incomment = true
return nil
elseif match(str, "^(.-=\".-\")(.*)$") then
-- attribute
local attribute, after = match(str, "^(.-=\".-\")(.*)$")
process_attribute(attribute)
return after
elseif match(str, "^(.*)$") then
-- other
first = match(str, "^(.*)$")
flush_text(str)
end
return nil
end
function buffers.visualizers.xml.flush_line(str,nested)
repeat str=recursive_processing(str) until str==nil
end
___________________________________________________________________________________
If your question is of interest to others as well, please add an entry to the
Wiki!
maillist : ntg-context@ntg.nl / http://www.ntg.nl/mailman/listinfo/ntg-context
webpage : http://www.pragma-ade.nl / http://tex.aanhet.net
archive : https://foundry.supelec.fr/projects/contextrev/
wiki : http://contextgarden.net
___________________________________________________________________________________