Created
May 2, 2010 18:29
-
-
Save zeen/387337 to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
local st = require "util.stanza"; | |
local lxp = require "lxp"; | |
-- XML parser | |
local parse_xml = (function() | |
local ns_prefixes = { | |
["http://www.w3.org/XML/1998/namespace"] = "xml"; | |
}; | |
local ns_separator = "\1"; | |
local ns_pattern = "^([^"..ns_separator.."]*)"..ns_separator.."?(.*)$"; | |
return function(xml) | |
local handler = {}; | |
local stanza = st.stanza("root"); | |
function handler:StartElement(tagname, attr) | |
local curr_ns,name = tagname:match(ns_pattern); | |
if name == "" then | |
curr_ns, name = "", curr_ns; | |
end | |
attr.xmlns = curr_ns; | |
for i=1,#attr do | |
local k = attr[i]; | |
attr[i] = nil; | |
local ns, nm = k:match(ns_pattern); | |
if nm ~= "" then | |
ns = ns_prefixes[ns]; | |
if ns then | |
attr[ns..":"..nm] = attr[k]; | |
attr[k] = nil; | |
end | |
end | |
end | |
stanza:tag(name, attr); | |
end | |
function handler:CharacterData(data) | |
stanza:text(data); | |
end | |
function handler:EndElement(tagname) | |
stanza:up(); | |
end | |
local parser = lxp.new(handler, "\1"); | |
local ok, err = parser:parse(xml); | |
if ok then | |
return stanza.tags[1]; | |
else | |
return ok, err; | |
end | |
end; | |
end)(); | |
-- end of XML parser |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment