Hi folks !

I have just finished a first draft of pret-xml.lua:
- I need to improve its coverage (html);
- DTD declaration is not yet managed;
- I do nothing about re-indentation since I prefer to format my xml sample by myself (by hand or using xmllint); - That's my first try to lua/luatex (after several months of Java...) so my definitions (esp. for functions) is not clean at all (you have been warned);

I have done it the "trial/error" way without much design reflexion just for fun (I'm on vacation)... I'm not sure it will be reusable...

Take all your test files and please report issues (or give me advices)! ;)

Thank you Matthijs!

Regards,

Renaud

Matthijs Kooijman a écrit :
Hey all,

./tex/texmf-context/tex/context/base/verb-.*\.lua !
Actually, in newer versions (since a month or so), that's pret-*.lua.

Where to start with this topic (current state in Mark IV, roadmap, ...) ?
I've been struggling with this a bit as well lately and found there was next
to no documentation. I've managed to create my own pretty printer, and tried
to update the docs a bit. See [1] and [2] on the wiki for more info. There are
still some details I don't get (why is there a line() hook, what is all this
nesting stuff, etc.), so feel free to find out more and improve these pages!

Gr.

Matthijs

[1]: http://wiki.contextgarden.net/Verbatim_text#Your_own_formatter
[2]: http://wiki.contextgarden.net/Custom_pretty_printer

------------------------------------------------------------------------

___________________________________________________________________________________
If your question is of interest to others as well, please add an entry to the 
Wiki!

maillist : ntg-context@ntg.nl / http://www.ntg.nl/mailman/listinfo/ntg-context
webpage  : http://www.pragma-ade.nl / http://tex.aanhet.net
archive  : https://foundry.supelec.fr/projects/contextrev/
wiki     : http://contextgarden.net
___________________________________________________________________________________

if not modules then modules = { } end modules ['pret-xml'] = {
    version   = 1.001,
    comment   = "from pret-.*\.lua, http://wiki.contextgarden.net/Verbatim_text#Your_own_formatter and http://wiki.contextgarden.net/Custom_pretty_printer";,
    author    = "Renaud AUBIN",
    copyright = "to be defined",
    license   = "to be defined"
}

local utf = unicode.utf8

local utfcharacters, utfvalues = string.utfcharacters, string.utfvalues
local utfbyte, utffind = utf.byte, utf.find
local byte, sub, find, gfind, match = string.byte, string.sub, string.find, string.gfind, string.match
local texsprint, texwrite = tex.sprint, tex.write
local ctxcatcodes = tex.ctxcatcodes

local change_state, finish_state = buffers.change_state, buffers.finish_state

buffers.visualizers.xml             = buffers.visualizers.xml             or { }
buffers.visualizers.xml.identifiers = buffers.visualizers.xml.identifiers or { }

incomment = false

local colors = {
   "prettyone",
   "prettytwo",
   "prettythree",
   "prettyfour",
   "prettyfive",
   "prettysix",
   "prettyseven"
}

local states = {
   ['namespace']        =  1,
   ['element']          =  2,
   ['attrname']         =  3,
   ['attrvalue']        =  4,
   ['prolog']           =  5,
   ['comment']          =  6,
   ['pi']               =  7
}

local function flush_text(str)
   for c in utfcharacters(str) do
      if c == " " then texsprint(ctxcatcodes,"\\obs") else texwrite(c) end
   end
end

local function process_attribute(str)
   local name, value, state = "", "", 0
   buffers.currentcolors = colors
   local name,value = match(str,"^(.-)=(\".-\")$")

   state = change_state(states['attrname'], state)
   flush_text(name)
   state = finish_state(state)
   texwrite("=")
   state = change_state(states['attrvalue'], state)
   flush_text(value)
   state = finish_state(state)
end

local function process_namespace(str)
   local state = 0
   buffers.currentcolors = colors
   
   state = change_state(states['namespace'], state)
   flush_text(str)
   state = finish_state(state)
   texwrite(":")
end

local function process_element(str)
   local state = 0
   buffers.currentcolors = colors
   
   state = change_state(states['element'], state)
   flush_text(str)
   state = finish_state(state)
end

local function process_comment(str)
   local state = 0
   buffers.currentcolors = colors
   
   state = change_state(states['comment'], state)
   flush_text(str)
   state = finish_state(state)
end

function process_tag(str)
   local name, value, state = "", "", 0
   buffers.currentcolors = colors

   if match(str,"^<%?xml.-%?>$") then
      local prolog = match(str,"^<%?xml(.-)%?>$")      
      state = change_state(states['pi'], state)
      texwrite("<?")
      state = finish_state(state)
      state = change_state(states['prolog'], state)
      texwrite("xml")
      state = finish_state(state)
      repeat prolog=recursive_processing(prolog) until prolog==nil
      state = change_state(states['pi'], state)
      texwrite("?>")
      state = finish_state(state)
   elseif match(str,"^<!%-%-.-%-%->$") then
      process_comment(str)
   elseif match(str,"^<[%a_]%w-%s*/?>$") or match(str,"^</?[%a_]%w-%s*>$") then
      local btag, name, etag = match(str,"^(</?)([%a_]%w-%s*)(/?>)$")
      texwrite(btag)
      process_element(name)
      texwrite(etag) 
   elseif match(str,"^<%a%w-:[%a_]%w-%s*/?>$") or match(str,"^</?%a%w-:[%a_]%w-%s*>$") then
      local btag, ns, name, etag = match(str,"^(</?)(%a%w-):([%a_]%w-%s*)(/?>)$")
      texwrite(btag)
      process_namespace(ns)
      process_element(name)
      texwrite(etag)
   elseif match(str,"^<%a%w-:[%a_][%w%-]-%s.*/?>$") or match(str,"^</?%a%w-:[%a_][%w%-]-%s.*>$") then
      local btag, ns, name, attributes, etag = match(str,"^(</?)(%a%w-):([%a_][%w%-]-%s)(.*)(/?>)$")
      texwrite(btag)
      process_namespace(ns)
      process_element(name)
      repeat attributes=recursive_processing(attributes) until attributes==nil
      texwrite(etag)
   elseif match(str,"^<[%a_]%w-%s.*/?>$") or match(str,"^</?[%a_]%w-%s.*>$") then
      local btag, name, attributes, etag = match(str,"^(</?)([%a_]%w-%s)(.*)(/?>)$")
      texwrite(btag)
      process_element(name)
      repeat attributes=recursive_processing(attributes) until attributes==nil
      texwrite(etag)
   end
end

function process_uncomplete_starttag(str)
   local name, value, state = "", "", 0
   buffers.currentcolors = colors

   if match(str,"^<%a%w-:[%a_]%w-%s.*$") then
      local btag, ns, name, attributes = match(str,"^(<)(%a%w-):([%a_]%w-%s)(.*)$")
      texwrite(btag)
      process_namespace(ns)
      process_element(name)
      repeat attributes=recursive_processing(attributes) until attributes==nil
   elseif match(str,"^<[%a_]%w-%s.*$") then
      local btag, name, attributes = match(str,"^(<)([%a_]%w-%s)(.*)$")
      texwrite(btag)
      process_element(name)
      repeat attributes=recursive_processing(attributes) until attributes==nil
   end
end

function recursive_processing(str)
   local first, second, third, attribute = "", "", "", ""
   
   if match(str, "^(.-)(%-%->)(.*)$") then
      -- stop multiline comment
      first, second, third = match(str, "^(.-)(%-%->)(.*)$")
      process_comment(first..second)
      incomment = false
      return third
   elseif incomment then
      process_comment(str)
   elseif match(str, "^(.-)(%b<>)(.*)$") then
      -- standard tag
      first, second, third = match(str, "^(.-)(%b<>)(.*)$")
      repeat first=recursive_processing(first) until first==nil
      process_tag(second)
      return third
   elseif match(str, "^(.-)(<[%a_]%w-:?%w-[%s%c])(.*)$") then
      -- multiline starttag
      first, second, third = match(str, "^(.-)(<[%a_]%w-:?%w-[%s%c])(.*)$")
      repeat first=recursive_processing(first) until first==nil
      process_uncomplete_starttag(second)
      return third
   -- elseif match(str, "^(.-)(<%?xml)(.*)$") then
   -- TODO manage multiline prolog
   -- first, second, third = match(str, "^(.-)(<%?xml)(.*)$")
   -- return third
   elseif match(str, "^(.-)(<!%-%-)(.*)$") then
      -- start multiline comment
      first, second, third = match(str, "^(.-)(<!%-%-)(.*)$")
      repeat first=recursive_processing(first) until first==nil
      process_comment(second..third)
      incomment = true
      return nil
   elseif match(str, "^(.-=\".-\")(.*)$") then
      -- attribute
      local attribute, after = match(str, "^(.-=\".-\")(.*)$")
      process_attribute(attribute)
      return after
   elseif match(str, "^(.*)$") then
      -- other
      first = match(str, "^(.*)$")
      flush_text(str)
   end
   return nil
end

function buffers.visualizers.xml.flush_line(str,nested)

   repeat str=recursive_processing(str) until str==nil
end
___________________________________________________________________________________
If your question is of interest to others as well, please add an entry to the 
Wiki!

maillist : ntg-context@ntg.nl / http://www.ntg.nl/mailman/listinfo/ntg-context
webpage  : http://www.pragma-ade.nl / http://tex.aanhet.net
archive  : https://foundry.supelec.fr/projects/contextrev/
wiki     : http://contextgarden.net
___________________________________________________________________________________

Reply via email to