2003-06-09 21:31:01 -04:00
|
|
|
require 'rexml/parsers/streamparser'
|
|
|
|
require 'rexml/parsers/baseparser'
|
|
|
|
|
|
|
|
module REXML
|
2008-10-01 09:46:53 -04:00
|
|
|
module Parsers
|
|
|
|
class UltraLightParser
|
|
|
|
def initialize stream
|
|
|
|
@stream = stream
|
|
|
|
@parser = REXML::Parsers::BaseParser.new( stream )
|
|
|
|
end
|
2003-06-09 21:31:01 -04:00
|
|
|
|
2004-06-09 22:01:04 -04:00
|
|
|
def add_listener( listener )
|
|
|
|
@parser.add_listener( listener )
|
|
|
|
end
|
|
|
|
|
2003-06-09 21:31:01 -04:00
|
|
|
def rewind
|
|
|
|
@stream.rewind
|
|
|
|
@parser.stream = @stream
|
|
|
|
end
|
|
|
|
|
2008-10-01 09:46:53 -04:00
|
|
|
def parse
|
|
|
|
root = context = []
|
|
|
|
while true
|
|
|
|
event = @parser.pull
|
|
|
|
case event[0]
|
|
|
|
when :end_document
|
|
|
|
break
|
|
|
|
when :end_doctype
|
|
|
|
context = context[1]
|
|
|
|
when :start_element, :doctype
|
|
|
|
context << event
|
|
|
|
event[1,0] = [context]
|
|
|
|
context = event
|
|
|
|
when :end_element
|
|
|
|
context = context[1]
|
|
|
|
else
|
|
|
|
context << event
|
|
|
|
end
|
|
|
|
end
|
|
|
|
root
|
|
|
|
end
|
|
|
|
end
|
2003-06-09 21:31:01 -04:00
|
|
|
|
2008-10-01 09:46:53 -04:00
|
|
|
# An element is an array. The array contains:
|
2011-05-18 20:07:25 -04:00
|
|
|
# 0 The parent element
|
|
|
|
# 1 The tag name
|
|
|
|
# 2 A hash of attributes
|
|
|
|
# 3..-1 The child elements
|
2008-10-01 09:46:53 -04:00
|
|
|
# An element is an array of size > 3
|
|
|
|
# Text is a String
|
|
|
|
# PIs are [ :processing_instruction, target, data ]
|
|
|
|
# Comments are [ :comment, data ]
|
|
|
|
# DocTypes are DocType structs
|
|
|
|
# The root is an array with XMLDecls, Text, DocType, Array, Text
|
|
|
|
end
|
2003-06-09 21:31:01 -04:00
|
|
|
end
|