aboutsummaryrefslogtreecommitdiff
path: root/libjava/scripts/blocks.pl
blob: 9142a49f87a302439598e9d34a80566d0eccdb6d (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
#! /usr/bin/perl

if ($ARGV[0] eq '')
{
    $file = 'Blocks.txt';
    if (! -f $file)
    {
	# Too painful to figure out how to get Perl to do it.
	system 'wget -o .wget-log http://www.unicode.org/Public/UNIDATA/Blocks.txt';
    }
}
else
{
    $file = $ARGV[0];
}

open (INPUT, "< $file") || die "couldn't open $file: $!";

@array = ();
while (<INPUT>)
{
    next if /^#/;
    chop;
    next if /^$/;

    ($start, $to, $text) = split (/; /);
    ($symbol = $text) =~ tr/a-z/A-Z/;
    $symbol =~ s/[- ]/_/g;

    # Special case for one of the SPECIALS.
    next if $start eq 'FEFF';

    # Special case some areas that our heuristic mishandles.
    if ($symbol eq 'HIGH_SURROGATES')
    {
	$symbol = 'SURROGATES_AREA';
	$text = 'Surrogates Area';
	$to = 'DFFF';
    }
    elsif ($symbol =~ /SURROGATES/)
    {
	next;
    }
    elsif ($symbol eq 'PRIVATE_USE')
    {
	$symbol .= '_AREA';
	$text = 'Private Use Area';
    }

    printf "    public static final UnicodeBlock %s = new UnicodeBlock (\"%s\", '\\u%s', '\\u%s');\n",
           $symbol, $text, $start, $to;

    push (@array, $symbol);
}

printf "    private static final UnicodeBlock[] blocks = {\n";
foreach (@array)
{
    printf "      %s", $_;
    printf "," unless $_ eq 'SPECIALS';
    printf "\n";
}
printf "    };\n";

close (INPUT);