summaryrefslogtreecommitdiff
path: root/enc/make_encdb.rb
blob: 2cd76999442ee70db63b2d7a250020ff3d0d9242 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
#! ./miniruby

#
# OnigEncodingDefine(foo, Foo) = {
#   ..
#   "Shift_JIS", /* Canonical Name */
#   ..
# };
# ENC_ALIAS("SJIS", "Shift_JIS")
# ENC_REPLICATE("Windows-31J", "Shift_JIS")
# ENC_ALIAS("CP932", "Windows-31J")
#

require 'mkmf'

encodings = []
replicas = {}
aliases = {}
Dir.open($srcdir) {|d| d.grep(/.+\.c\z/)}.each do |fn|
  open(File.join($srcdir,fn)) do |f|
    orig = nil
    name = nil
    f.each_line do |line|
      break if /^OnigEncodingDefine/o =~ line
    end
    f.each_line do |line|
      break if /"(.*?)"/ =~ line
    end
    encodings << $1 if $1
    f.each_line do |line|
      if /^ENC_REPLICATE\(\s*"([^"]+)"\s*,\s*"([^"]+)"/o =~ line
	replicas[$1] = $2
      elsif /^ENC_ALIAS\(\s*"([^"]+)"\s*,\s*"([^"]+)"/o =~ line
	aliases[$1] = $2
      end
    end
  end
end
open('encdb.h', 'wb') do |f|
  f.puts 'static const char *enc_name_list[] = {'
  encodings.each {|name| f.puts'    "%s",' % name}
  replicas.each_key {|name| f.puts'    "%s",' % name}
  f.puts(<<"_TEXT_")
    NULL
};
static const int enc_name_list_size = #{encodings.length + replicas.length};
static const int enc_aliases_size = #{aliases.length};
static st_table *enc_table_replica_name;
static st_table *enc_table_alias_name;

static void enc_init_db(void)
{
    if (!enc_table_replica_name) {
	enc_table_replica_name = st_init_strcasetable();
    }
    if (!enc_table_alias_name) {
	enc_table_alias_name = st_init_strcasetable();
    }
_TEXT_
  replicas.each_pair {|name, orig|
    f.puts'    st_insert(enc_table_replica_name, (st_data_t)"%s", (st_data_t)"%s");' % [name, orig]}
  aliases.each_pair {|name, orig|
    f.puts'    st_insert(enc_table_alias_name, (st_data_t)"%s", (st_data_t)"%s");' % [name, orig]}
  f.puts '}'
end