mirror of
https://github.com/ruby/ruby.git
synced 2022-11-09 12:17:21 -05:00
7d21c237cc
for encoding changes. This should be the case on all 1.8 installations. When it isn't found (<1.6), the native REXML encoding mechanism is used. This cleaned out some files, and tightened up the code a bit; and iconv should be faster than the pure Ruby code. * Changed deprecated assert_not_nil to assert throughout the tests. * Parse exceptions are a little more verbose, and extend RuntimeError. * Bug fixes to XPathParser * The Light API is still shifting, like the sands of the desert. * Fixed a new Ruby 1.8.0 warning, added some speed optimizations, and tightened error reporting in the base parser git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@4737 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
56 lines
1.3 KiB
Ruby
56 lines
1.3 KiB
Ruby
require 'rexml/parsers/streamparser'
|
|
require 'rexml/parsers/baseparser'
|
|
require 'rexml/light/node'
|
|
|
|
module REXML
|
|
module Parsers
|
|
class LightParser
|
|
def initialize stream
|
|
@stream = stream
|
|
@parser = REXML::Parsers::BaseParser.new( stream )
|
|
end
|
|
|
|
def rewind
|
|
@stream.rewind
|
|
@parser.stream = @stream
|
|
end
|
|
|
|
def parse
|
|
root = context = [ :document ]
|
|
while true
|
|
event = @parser.pull
|
|
case event[0]
|
|
when :end_document
|
|
break
|
|
when :end_doctype
|
|
context = context[1]
|
|
when :start_element, :start_doctype
|
|
new_node = event
|
|
context << new_node
|
|
new_node[1,0] = [context]
|
|
context = new_node
|
|
when :end_element, :end_doctype
|
|
context = context[1]
|
|
else
|
|
new_node = event
|
|
context << new_node
|
|
new_node[1,0] = [context]
|
|
end
|
|
end
|
|
root
|
|
end
|
|
end
|
|
|
|
# An element is an array. The array contains:
|
|
# 0 The parent element
|
|
# 1 The tag name
|
|
# 2 A hash of attributes
|
|
# 3..-1 The child elements
|
|
# An element is an array of size > 3
|
|
# Text is a String
|
|
# PIs are [ :processing_instruction, target, data ]
|
|
# Comments are [ :comment, data ]
|
|
# DocTypes are DocType structs
|
|
# The root is an array with XMLDecls, Text, DocType, Array, Text
|
|
end
|
|
end
|