diff options
Diffstat (limited to 'trunk/lib/rss/rexmlparser.rb')
-rw-r--r-- | trunk/lib/rss/rexmlparser.rb | 54 |
1 files changed, 54 insertions, 0 deletions
diff --git a/trunk/lib/rss/rexmlparser.rb b/trunk/lib/rss/rexmlparser.rb new file mode 100644 index 0000000000..4dabf59199 --- /dev/null +++ b/trunk/lib/rss/rexmlparser.rb @@ -0,0 +1,54 @@ +require "rexml/document" +require "rexml/streamlistener" + +/\A(\d+)\.(\d+)(?:\.\d+)+\z/ =~ REXML::Version +if ([$1.to_i, $2.to_i] <=> [2, 5]) < 0 + raise LoadError, "needs REXML 2.5 or later (#{REXML::Version})" +end + +module RSS + + class REXMLParser < BaseParser + + class << self + def listener + REXMLListener + end + end + + private + def _parse + begin + REXML::Document.parse_stream(@rss, @listener) + rescue RuntimeError => e + raise NotWellFormedError.new{e.message} + rescue REXML::ParseException => e + context = e.context + line = context[0] if context + raise NotWellFormedError.new(line){e.message} + end + end + + end + + class REXMLListener < BaseListener + + include REXML::StreamListener + include ListenerMixin + + class << self + def raise_for_undefined_entity? + false + end + end + + def xmldecl(version, encoding, standalone) + super(version, encoding, standalone == "yes") + # Encoding is converted to UTF-8 when REXML parse XML. + @encoding = 'UTF-8' + end + + alias_method(:cdata, :text) + end + +end |