diff options
Diffstat (limited to 'ruby_1_9_3/lib/rexml/encoding.rb')
-rw-r--r-- | ruby_1_9_3/lib/rexml/encoding.rb | 62 |
1 files changed, 62 insertions, 0 deletions
diff --git a/ruby_1_9_3/lib/rexml/encoding.rb b/ruby_1_9_3/lib/rexml/encoding.rb new file mode 100644 index 0000000000..d1d5172841 --- /dev/null +++ b/ruby_1_9_3/lib/rexml/encoding.rb @@ -0,0 +1,62 @@ +module REXML + module Encoding + # ID ---> Encoding name + attr_reader :encoding + def encoding=(encoding) + encoding = encoding.name if encoding.is_a?(Encoding) + if encoding.is_a?(String) + original_encoding = encoding + encoding = find_encoding(encoding) + unless encoding + raise ArgumentError, "Bad encoding name #{original_encoding}" + end + end + return false if defined?(@encoding) and encoding == @encoding + if encoding + @encoding = encoding.upcase + else + @encoding = 'UTF-8' + end + true + end + + def check_encoding(xml) + # We have to recognize UTF-16BE, UTF-16LE, and UTF-8 + if xml[0, 2] == "\xfe\xff" + xml[0, 2] = "" + return 'UTF-16BE' + elsif xml[0, 2] == "\xff\xfe" + xml[0, 2] = "" + return 'UTF-16LE' + end + xml =~ /^\s*<\?xml\s+version\s*=\s*(['"]).*?\1\s+encoding\s*=\s*(["'])(.*?)\2/m + return $3 ? $3.upcase : 'UTF-8' + end + + def encode(string) + string.encode(@encoding) + end + + def decode(string) + string.encode(::Encoding::UTF_8, @encoding) + end + + private + def find_encoding(name) + case name + when /\Ashift-jis\z/i + return "SHIFT_JIS" + when /\ACP-(\d+)\z/ + name = "CP#{$1}" + when /\AUTF-8\z/i + return name + end + begin + ::Encoding::Converter.search_convpath(name, 'UTF-8') + rescue ::Encoding::ConverterNotFoundError + return nil + end + name + end + end +end |