# HG changeset patch # User Matthew Wild # Date 1294093249 0 # Node ID b3dffb6bc1aae31d8059dec029cb07c4622117a8 # Parent cbfa0ea6668b325709c27645a30e0b478cbb44ca# Parent de77ec2b49bc1d759dba0995750cfde52d8af760 Merge diff -r cbfa0ea6668b -r b3dffb6bc1aa util/xmllex.lua --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/util/xmllex.lua Mon Jan 03 22:20:49 2011 +0000 @@ -0,0 +1,187 @@ +local assert, ipairs , pairs , setmetatable , rawget , rawset , tostring = + assert, ipairs , pairs , setmetatable , rawget , rawset , tostring +local strsub = string.sub +local tblconcat = table.concat +local tblinsert = table.insert + +local function getstring ( msgs , startpos , finishpos ) + if #msgs == 1 then --All originated in same string + return strsub ( msgs[1] , startpos , finishpos ) + else -- Over multiple source strings + return strsub ( msgs[1] , startpos , -1 ) + .. tblconcat ( msgs , "" , 2 , #msgs - 1 ) + .. strsub ( msgs[#msgs] , 1 , finishpos ) + end +end + +local m_mt = { + __tostring = function ( v ) + local str = v.stringform + if str then + return str + else + str = getstring ( v.msgs , v.start , v.finish ) + v.stringform = str + return str + end + end +} + +local function handleoutside ( str , r , initial ) + local a , b , close = str:find ( "<(/?)" , initial ) + if not a then + r.state = "outside" + return false + end + + --Finalise text object + local m = r[#r] + m.finish = a - 1 + m.type = "text" + + local m = setmetatable ( { + msgs = { str } ; + start = a ; + starte = b + 1 ; + } , m_mt ) + + if close ~= "/" then + r.depth = r.depth + 1 + m.type = "open" + else + r.depth = r.depth - 1 + m.type = "close" + end + + tblinsert ( r , m ) + + r.state = "inside" + return true +end + +local function handleinside ( str, r , initial ) + local c , d , selfclosing = str:find ( "(/?)>" , initial ) + if not c then + r.state = "inside" + return false + end + + local m = r[#r] + m.finish = d + m.finishs = c - 1 + if selfclosing == "/" then + m.type = "selfclosing" + r.depth = r.depth - 1 + end + + local m = setmetatable ( { + msgs = { str } ; + start = d + 1 ; + type = "text" ; + } , m_mt ) + tblinsert ( r , m ) + + r.state = "outside" + return true +end + +local function index ( str , r ) + r = r or { depth = 0, state = "outside" } + + if not r[#r] then + r[1] = setmetatable ( { + msgs = { str } ; + type = "text" ; + start = 1 ; + } , m_mt ) + else + tblinsert ( r[#r].msgs , str ) + end + + repeat + if r.state == "outside" then + if not handleoutside ( str , r , r[#r].start ) then + break + end + else + if not handleinside ( str , r , r[#r].start ) then + break + end + end + until false + + return r +end + +local function process_starttag ( starttag ) + local str = tostring ( starttag ) + local attr = { } + + local elem = str:match ( "[^%s=> 0 then - -- We have some character data in the buffer - t_insert(stanza, t_concat(chardata)); - chardata = {}; - end - local curr_ns,name = tagname:match(ns_pattern); - if name == "" then - curr_ns, name = "", curr_ns; - end - - if curr_ns ~= stream_default_ns or non_streamns_depth > 0 then - attr.xmlns = curr_ns; - non_streamns_depth = non_streamns_depth + 1; - end - - -- FIXME !!!!! - for i=1,#attr do - local k = attr[i]; - attr[i] = nil; - local ns, nm = k:match(ns_pattern); - if nm ~= "" then - ns = ns_prefixes[ns]; - if ns then - attr[ns..":"..nm] = attr[k]; - attr[k] = nil; - end - end - end - - if not stanza then --if we are not currently inside a stanza - if session.notopen then - if tagname == stream_tag then - non_streamns_depth = 0; - if cb_streamopened then - cb_streamopened(session, attr); - end - else - -- Garbage before stream? - cb_error(session, "no-stream"); - end - return; - end - if curr_ns == "jabber:client" and name ~= "iq" and name ~= "presence" and name ~= "message" then - cb_error(session, "invalid-top-level-element"); - end - - stanza = setmetatable({ name = name, attr = attr, tags = {} }, stanza_mt); - else -- we are inside a stanza, so add a tag - t_insert(stack, stanza); - local oldstanza = stanza; - stanza = setmetatable({ name = name, attr = attr, tags = {} }, stanza_mt); - t_insert(oldstanza, stanza); - t_insert(oldstanza.tags, stanza); - end + local function feed(stream, data) + index(data, end - function xml_handlers:CharacterData(data) - if stanza then - t_insert(chardata, data); - end - end - function xml_handlers:EndElement(tagname) - if non_streamns_depth > 0 then - non_streamns_depth = non_streamns_depth - 1; - end - if stanza then - if #chardata > 0 then - -- We have some character data in the buffer - t_insert(stanza, t_concat(chardata)); - chardata = {}; - end - -- Complete stanza - if #stack == 0 then - if tagname ~= stream_error_tag then - cb_handlestanza(session, stanza); - else - cb_error(session, "stream-error", stanza); - end - stanza = nil; - else - stanza = t_remove(stack); - end - else - if tagname == stream_tag then - if cb_streamclosed then - cb_streamclosed(session); - end - else - local curr_ns,name = tagname:match(ns_pattern); - if name == "" then - curr_ns, name = "", curr_ns; - end - cb_error(session, "parse-error", "unexpected-element-close", name); - end - stanza, chardata = nil, {}; - stack = {}; - end - end - - local function reset() - stanza, chardata = nil, {}; - stack = {}; - end - - local function set_session(stream, new_session) - session = new_session; - log = new_session.log or default_log; - end - - return xml_handlers, { reset = reset, set_session = set_session }; -end - -function new(session, stream_callbacks) - local handlers, meta = new_sax_handlers(session, stream_callbacks); - local parser = new_parser(handlers, ns_separator); - local parse = parser.parse; return { reset = function ()