2010-01-01 06:57:36 -05:00
|
|
|
require 'libxml'
|
2010-03-28 08:15:02 -04:00
|
|
|
require 'active_support/core_ext/object/blank'
|
2011-01-18 14:45:52 -05:00
|
|
|
require 'stringio'
|
2010-01-01 06:57:36 -05:00
|
|
|
|
|
|
|
# = XmlMini LibXML implementation using a SAX-based parser
|
|
|
|
module ActiveSupport
|
|
|
|
module XmlMini_LibXMLSAX
|
|
|
|
extend self
|
|
|
|
|
|
|
|
# SAX callback handler that assembles a nested Hash while LibXML walks
# through the XML document. Once parsing has finished, the result is
# exposed through +hash+.
class HashBuilder
  include LibXML::XML::SaxParser::Callbacks

  # Key under which an element's accumulated character data is kept.
  CONTENT_KEY = '__content__'.freeze
  # Temporary bookkeeping key written when an element opens and removed
  # again when it closes.
  HASH_SIZE_KEY = '__hash_size__'.freeze

  # The hash built from the document. Note that this reader takes the
  # place of Object#hash on instances of this class.
  attr_reader :hash

  # Hash of the innermost element that is still open.
  def current_hash
    @hash_stack[-1]
  end

  # Creates the root hash and makes it the sole entry on the stack.
  def on_start_document
    root = { CONTENT_KEY => '' }
    @hash = root
    @hash_stack = [root]
  end

  # Takes the last hash off the stack as the final result and removes
  # its content placeholder.
  def on_end_document
    @hash = @hash_stack.pop
    @hash.delete(CONTENT_KEY)
  end

  # Opens a new element: builds its hash from the attributes, attaches it
  # to the enclosing element's hash under +name+, and pushes it on the stack.
  def on_start_element(name, attrs = {})
    element = { CONTENT_KEY => '' }.merge(attrs)
    # Entry count the hash will have once this marker itself is stored;
    # any growth beyond it is detected when the element closes.
    element[HASH_SIZE_KEY] = element.size + 1

    parent = current_hash
    existing = parent[name]
    case existing
    when Array
      # Third or later sibling with this name: extend the list.
      existing << element
    when Hash
      # Second sibling with this name: promote the entry to a list.
      parent[name] = [existing, element]
    when nil
      parent[name] = element
    end
    # NOTE(review): any other existing value (presumably an attribute of
    # the parent sharing this element's name) matches no branch, so the
    # element is not attached to its parent -- confirm this is intended.

    @hash_stack.push(element)
  end

  # Closes the current element: removes the size marker, drops the content
  # entry when it carries nothing worth keeping, and pops the stack.
  def on_end_element(name)
    element = current_hash
    # Measure before removing the marker so the stored count is comparable.
    size_at_close = element.length
    size_at_open = element.delete(HASH_SIZE_KEY)
    gained_entries = size_at_close > size_at_open

    text = element[CONTENT_KEY]
    # Blank text is discarded only if entries were added after opening;
    # completely empty text is always discarded.
    if (gained_entries && text.blank?) || text == ''
      element.delete(CONTENT_KEY)
    end

    @hash_stack.pop
  end

  # Appends character data to the content of the current element.
  def on_characters(string)
    current_hash[CONTENT_KEY] << string
  end

  # CDATA sections are accumulated exactly like ordinary character data.
  alias on_cdata_block on_characters
end
|
|
|
|
|
|
|
|
# Class that +parse+ instantiates to receive the SAX callbacks; the writer
# lets callers substitute a different one.
attr_accessor :document_class
|
|
|
|
# HashBuilder is the callback class used unless another one is assigned.
self.document_class = HashBuilder
|
|
|
|
|
|
|
|
# Parses XML into a Hash using LibXML's SAX parser.
#
# data:: The XML to parse: a String, +nil+ (treated as an empty document),
#        or an IO-like object responding to +read+ and +eof?+.
#
# Returns an empty Hash when there is nothing to read; otherwise returns
# whatever the callback object's +hash+ method yields after parsing.
def parse(data)
  data = StringIO.new(data || '') unless data.respond_to?(:read)

  # Probe for emptiness with eof? instead of reading a character and
  # pushing it back: the stream is left untouched, and no ungetc support
  # is needed (StringIO is understood to reject ungetc when it wraps a
  # frozen String).
  return {} if data.eof?

  # Install LibXML's quiet handler before parsing.
  # NOTE(review): set_handler presumably applies process-wide -- confirm.
  LibXML::XML::Error.set_handler(&LibXML::XML::Error::QUIET_HANDLER)

  parser = LibXML::XML::SaxParser.io(data)
  document = document_class.new
  parser.callbacks = document
  parser.parse
  document.hash
end
|
|
|
|
end
|
|
|
|
end
|
2011-01-18 14:45:52 -05:00
|
|
|
end
|