diff options
Diffstat (limited to 'lib/rss/rexmlparser.rb')
-rw-r--r-- | lib/rss/rexmlparser.rb | 47 |
1 files changed, 47 insertions, 0 deletions
diff --git a/lib/rss/rexmlparser.rb b/lib/rss/rexmlparser.rb new file mode 100644 index 0000000000..13ab0e277b --- /dev/null +++ b/lib/rss/rexmlparser.rb @@ -0,0 +1,47 @@ +require "rexml/document" +require "rexml/streamlistener" + +/\A(\d+)\.(\d+)(?:\.\d+)+\z/ =~ REXML::Version +if ([$1.to_i, $2.to_i] <=> [2, 5]) < 0 + raise LoadError, "needs REXML 2.5 or later (#{REXML::Version})" +end + +module RSS + + class REXMLParser < BaseParser + + private + + def listener + REXMLListener + end + + def _parse + begin + REXML::Document.parse_stream(@rss, @listener) + rescue RuntimeError => e + raise NotWellFormedError.new{e.message} + rescue REXML::ParseException => e + context = e.context + line = context[0] if context + raise NotWellFormedError.new(line){e.message} + end + end + + end + + class REXMLListener < BaseListener + + include REXML::StreamListener + include ListenerMixin + + def xmldecl(version, encoding, standalone) + super + # Encoding is converted to UTF-8 when REXML parse XML. + @encoding = 'UTF-8' + end + + alias_method(:cdata, :text) + end + +end |