summaryrefslogtreecommitdiff
path: root/lib/rexml/source.rb
diff options
context:
space:
mode:
Diffstat (limited to 'lib/rexml/source.rb')
-rw-r--r--lib/rexml/source.rb25
1 files changed, 18 insertions, 7 deletions
diff --git a/lib/rexml/source.rb b/lib/rexml/source.rb
index c51f504811..2fee99c0e9 100644
--- a/lib/rexml/source.rb
+++ b/lib/rexml/source.rb
@@ -6,7 +6,7 @@ module REXML
# Generates a Source object
# @param arg Either a String, or an IO
# @return a Source, or nil if a bad argument was given
- def SourceFactory::create_from arg#, slurp=true
+ def SourceFactory::create_from(arg)
if arg.kind_of? String
Source.new(arg)
elsif arg.respond_to? :read and
@@ -35,16 +35,23 @@ module REXML
# Constructor
# @param arg must be a String, and should be a valid XML document
- def initialize(arg)
+ # @param encoding if non-null, sets the encoding of the source to this
+ # value, overriding all encoding detection
+ def initialize(arg, encoding=nil)
@orig = @buffer = arg
- self.encoding = check_encoding( @buffer )
+ if encoding
+ self.encoding = encoding
+ else
+ self.encoding = check_encoding( @buffer )
+ end
@line = 0
end
+
# Inherited from Encoding
# Overridden to support optimized en/decoding
def encoding=(enc)
- super
+ return unless super
@line_break = encode( '>' )
if enc != UTF_8
@buffer = decode(@buffer)
@@ -124,7 +131,7 @@ module REXML
#attr_reader :block_size
# block_size has been deprecated
- def initialize(arg, block_size=500)
+ def initialize(arg, block_size=500, encoding=nil)
@er_source = @source = arg
@to_utf = false
# Determining the encoding is a deceptively difficult issue to resolve.
@@ -134,10 +141,12 @@ module REXML
# if there is one. If there isn't one, the file MUST be UTF-8, as per
# the XML spec. If there is one, we can determine the encoding from
# it.
+ @buffer = ""
str = @source.read( 2 )
- if /\A(?:\xfe\xff|\xff\xfe)/n =~ str
+ if encoding
+ self.encoding = encoding
+ elsif /\A(?:\xfe\xff|\xff\xfe)/n =~ str
self.encoding = check_encoding( str )
- @line_break = encode( '>' )
else
@line_break = '>'
end
@@ -159,6 +168,8 @@ module REXML
str = @source.readline(@line_break)
str = decode(str) if @to_utf and str
@buffer << str
+ rescue Iconv::IllegalSequence
+ raise
rescue
@source = nil
end