summaryrefslogtreecommitdiff
path: root/trunk/enc/make_encdb.rb
diff options
context:
space:
mode:
Diffstat (limited to 'trunk/enc/make_encdb.rb')
-rwxr-xr-xtrunk/enc/make_encdb.rb77
1 files changed, 77 insertions, 0 deletions
diff --git a/trunk/enc/make_encdb.rb b/trunk/enc/make_encdb.rb
new file mode 100755
index 0000000000..5a420aed32
--- /dev/null
+++ b/trunk/enc/make_encdb.rb
@@ -0,0 +1,77 @@
+#
+# OnigEncodingDefine(foo, Foo) = {
+# ..
+# "Shift_JIS", /* Canonical Name */
+# ..
+# };
+# ENC_ALIAS("SJIS", "Shift_JIS")
+# ENC_REPLICATE("Windows-31J", "Shift_JIS")
+# ENC_ALIAS("CP932", "Windows-31J")
+#
+
+def check_duplication(defs, name, fn, line)
+ if defs[name]
+ raise ArgumentError, "%s:%d: encoding %s is already registered(%s:%d)" %
+ [fn, line, name, *defs[name]]
+ else
+ defs[name.upcase] = [fn,line]
+ end
+end
+
+count = 0
+lines = []
+encodings = []
+defs = {}
+encdirs = ARGV.dup
+outhdr = encdirs.shift || 'encdb.h'
+encdirs << 'enc' if encdirs.empty?
+files = {}
+encdirs.each do |encdir|
+ next unless File.directory?(encdir)
+ Dir.open(encdir) {|d| d.grep(/.+\.[ch]\z/)}.sort_by {|e|
+ e.scan(/(\d+)|(\D+)/).map {|n,a| a||[n.size,n.to_i]}.flatten
+ }.each do |fn|
+ next if files[fn]
+ files[fn] = true
+ open(File.join(encdir,fn)) do |f|
+ orig = nil
+ name = nil
+ f.each_line do |line|
+ if (/^OnigEncodingDefine/ =~ line)..(/"(.*?)"/ =~ line)
+ if $1
+ check_duplication(defs, $1, fn, $.)
+ encodings << $1
+ count += 1
+ end
+ else
+ case line
+ when /^\s*rb_enc_register\(\s*"([^"]+)"/
+ count += 1
+ line = nil
+ when /^ENC_REPLICATE\(\s*"([^"]+)"\s*,\s*"([^"]+)"/
+ raise ArgumentError,
+ '%s:%d: ENC_REPLICATE: %s is not defined yet. (replica %s)' %
+ [fn, $., $2, $1] unless defs[$2.upcase]
+ count += 1
+ when /^ENC_ALIAS\(\s*"([^"]+)"\s*,\s*"([^"]+)"/
+ raise ArgumentError,
+ '%s:%d: ENC_ALIAS: %s is not defined yet. (alias %s)' %
+ [fn, $., $2, $1] unless defs[$2.upcase]
+ when /^ENC_DUMMY\(\s*"([^"]+)"/
+ count += 1
+ else
+ next
+ end
+ check_duplication(defs, $1, fn, $.)
+ lines << line.sub(/;.*/m, "").chomp + ";\n" if line
+ end
+ end
+ end
+ end
+end
+
+result = encodings.map {|e| %[ENC_DEFINE("#{e}");\n]}.join + lines.join +
+ "\n#define ENCODING_COUNT #{count}\n"
+open(outhdr, 'wb') do |f|
+ f.print result
+end