-
Notifications
You must be signed in to change notification settings - Fork 28
/
Copy pathmkxref.pl
32 lines (28 loc) · 981 Bytes
/
mkxref.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
use strict;
use utf8;
open IN, '<:utf8', 'x-華語對照表.csv';
binmode IN, ':utf8';
<IN>;
my %a2t = qw( 萌 發穎 );
my %t2a = qw( 發穎 萌 );
# TODO: Add everything in ext, at least 臺華共同詞
my $moedict_basedir = shift || "../moedict-webkit";
die "Usage: $0 /path/to/moedict-webkit
Please checkout $moedict_basedir and have /a/*.json ready." unless -d $moedict_basedir;
my %seen;
while (<IN>) {
chomp;
my ($m, undef, $t) = split /,/, $_;
next unless -e $moedict_basedir . "/a/$m.json";
next if $seen{$m,$t}++;
next if $t =~ /\d/;
$a2t{$m} .= "," if $a2t{$m};
$a2t{$m} .= ($t eq $m) ? '' : $t;
$t2a{$t} .= "," if $t2a{$t};
$t2a{$t} .= ($t eq $m) ? '' : $m;
}
use JSON;
use File::Slurp 'write_file';
mkdir $moedict_basedir . '/a' unless -e $moedict_basedir . '/a';
write_file $moedict_basedir . '/a/xref.json' => encode_json({ t => \%a2t })."\n";
write_file $moedict_basedir . '/t/xref.json' => encode_json({ a => \%t2a })."\n";