aboutsummaryrefslogtreecommitdiffstats
path: root/enc/make_encdb.rb
blob: c140007f677d2e9a1e77b7a4315f4a75ebf97b53 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
#
# OnigEncodingDefine(foo, Foo) = {
#   ..
#   "Shift_JIS", /* Canonical Name */
#   ..
# };
# ENC_ALIAS("SJIS", "Shift_JIS")
# ENC_REPLICATE("Windows-31J", "Shift_JIS")
# ENC_ALIAS("CP932", "Windows-31J")
#

def check_duplication(encs, name, fn, line)
  if encs.include?(name)
    raise ArgumentError, "%s:%d: encoding %s is already registered" % [fn, line, name]
  end
end

encodings = []
replicas = {}
aliases = {}
encdir = ARGV[0]
Dir.open(encdir) {|d| d.grep(/.+\.c\z/)}.sort.each do |fn|
  open(File.join(encdir,fn)) do |f|
    orig = nil
    name = nil
    encs = []
    f.each_line do |line|
      break if /^OnigEncodingDefine/o =~ line
    end
    f.each_line do |line|
      break if /"(.*?)"/ =~ line
    end
    if $1
      check_duplication(encs, $1, fn, $.)
      encs << $1.upcase
      encodings << $1 
      f.each_line do |line|
	if /^ENC_REPLICATE\(\s*"([^"]+)"\s*,\s*"([^"]+)"/o =~ line
	  raise ArgumentError,
	    '%s:%d: ENC_REPLICATE: %s is not defined yet. (replica %s)' %
	    [fn, $., $2, $1] unless encs.include?($2.upcase)
	  check_duplication(encs, $1, fn, $.)
	  encs << $1.upcase
	  encodings << $1
	  replicas[$1] = $2
	elsif /^ENC_ALIAS\(\s*"([^"]+)"\s*,\s*"([^"]+)"/o =~ line
	  raise ArgumentError,
	    '%s:%d: ENC_ALIAS: %s is not defined yet. (alias %s)' %
	    [fn, $., $2, $1] unless encs.include?($2.upcase)
	  check_duplication(encs, $1, fn, $.)
	  encodings << $1
	  aliases[$1] = $2
	end
      end
    end
  end
end

open('encdb.h', 'wb') do |f|
  f.puts 'static const char *const enc_name_list[] = {'
  encodings.each {|name| f.puts'    "%s",' % name}
  f.puts('};', '', 'static void', 'enc_init_db(void)', '{')
  replicas.each_pair {|name, orig|
    f.puts '    ENC_REPLICATE("%s", "%s");' % [name, orig]
  }
  aliases.each_pair {|name, orig|
    f.puts '    ENC_ALIAS("%s", "%s");' % [name, orig]
  }
  f.puts '}'
end