1 #!/usr/local/bin/perl -wC
3 # SPDX-License-Identifier: BSD-2-Clause-FreeBSD
5 # Copyright 2009 Edwin Groothuis <edwin@FreeBSD.org>
6 # Copyright 2015 John Marino <draco@marino.st>
8 # Redistribution and use in source and binary forms, with or without
9 # modification, are permitted provided that the following conditions
11 # 1. Redistributions of source code must retain the above copyright
12 # notice, this list of conditions and the following disclaimer.
13 # 2. Redistributions in binary form must reproduce the above copyright
14 # notice, this list of conditions and the following disclaimer in the
15 # documentation and/or other materials provided with the distribution.
17 # THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18 # ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 # ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21 # FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 # DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 # OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 # HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 # LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 # OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
38 use Digest::SHA qw(sha1_hex);
39 require "charmaps.pm";
43 print "Usage: $0 --unidir=<unidir> --etc=<etcdir> --type=<type>\n";
47 my $DEFENCODING = "UTF-8";
53 my $result = GetOptions (
54 "unidir=s" => \$UNIDIR,
65 my %translations = ();
67 my %alternativemonths = ();
73 get_utf8map("$UNIDIR/posix/$DEFENCODING.cm");
74 get_encodings("$ETCDIR/charmaps");
77 tie(%keys, "Tie::IxHash");
78 tie(%hashtable, "Tie::IxHash");
81 "monetdef" => "LC_MONETARY",
82 "timedef" => "LC_TIME",
83 "msgdef" => "LC_MESSAGES",
84 "numericdef" => "LC_NUMERIC",
85 "colldef" => "LC_COLLATE",
86 "ctypedef" => "LC_CTYPE"
90 mdorder => \&callback_mdorder,
91 altmon => \&callback_altmon,
92 cformat => \&callback_cformat,
93 dformat => \&callback_dformat,
94 dtformat => \&callback_dtformat,
95 cbabmon => \&callback_abmon,
96 cbampm => \&callback_ampm,
103 "decimal_point" => "decimal_point",
104 "thousands_sep" => "thousands_sep",
105 "grouping" => "grouping",
108 "int_curr_symbol" => "int_curr_symbol (last character always " .
110 "currency_symbol" => "currency_symbol",
111 "mon_decimal_point" => "mon_decimal_point",
112 "mon_thousands_sep" => "mon_thousands_sep",
113 "mon_grouping" => "mon_grouping",
114 "positive_sign" => "positive_sign",
115 "negative_sign" => "negative_sign",
116 "int_frac_digits" => "int_frac_digits",
117 "frac_digits" => "frac_digits",
118 "p_cs_precedes" => "p_cs_precedes",
119 "p_sep_by_space" => "p_sep_by_space",
120 "n_cs_precedes" => "n_cs_precedes",
121 "n_sep_by_space" => "n_sep_by_space",
122 "p_sign_posn" => "p_sign_posn",
123 "n_sign_posn" => "n_sign_posn",
126 "yesexpr" => "yesexpr",
127 "noexpr" => "noexpr",
128 "yesstr" => "yesstr",
132 "abmon" => "Short month names",
133 "mon" => "Long month names (as in a date)",
134 "abday" => "Short weekday names",
135 "day" => "Long weekday names",
140 "d_t_fmt" => "date_fmt",
141 "altmon" => "Long month names (without case ending)",
142 "md_order" => "md_order",
143 "t_fmt_ampm" => "ampm_fmt",
146 if ($TYPE eq "colldef") {
147 transform_collation();
151 if ($TYPE eq "ctypedef") {
156 if ($TYPE eq "numericdef") {
158 "decimal_point" => "s",
159 "thousands_sep" => "s",
167 if ($TYPE eq "monetdef") {
169 "int_curr_symbol" => "s",
170 "currency_symbol" => "s",
171 "mon_decimal_point" => "s",
172 "mon_thousands_sep" => "s",
173 "mon_grouping" => "ai",
174 "positive_sign" => "s",
175 "negative_sign" => "s",
176 "int_frac_digits" => "i",
177 "frac_digits" => "i",
178 "p_cs_precedes" => "i",
179 "p_sep_by_space" => "i",
180 "n_cs_precedes" => "i",
181 "n_sep_by_space" => "i",
182 "p_sign_posn" => "i",
190 if ($TYPE eq "msgdef") {
202 if ($TYPE eq "timedef") {
204 "abmon" => "<cbabmon<abmon<as",
209 "d_fmt" => "<dformat<d_fmt<s",
210 "c_fmt" => "<cformat<d_t_fmt<s",
211 "am_pm" => "<cbampm<am_pm<as",
212 "d_t_fmt" => "<dtformat<d_t_fmt<s",
213 "altmon" => "<altmon<mon<as",
214 "md_order" => "<mdorder<d_fmt<s",
224 my $nl = $callback{data}{l} . "_" . $callback{data}{c};
225 my $enc = $callback{data}{e};
227 if ($nl eq 'ru_RU') {
228 if ($enc eq 'UTF-8') {
231 my $converter = Text::Iconv->new("utf-8", "$enc");
232 $s = $converter->convert("дп;пп");
# callback_cformat: rewrites the date/time format string held in $s so that
# it carries the weekday name (%A).  It is listed as
# cformat => \&callback_cformat among the callback entries, and the timedef
# spec for "c_fmt" ("<cformat<d_t_fmt<s") names it.
# NOTE(review): this listing is sparse -- the declaration of $s, the end of
# the ko_KR branch and the return statement are not shown here.
238 sub callback_cformat {
# Locale identifier built as "<language>_<country>" from the callback data.
240 my $nl = $callback{data}{l} . "_" . $callback{data}{c};
242 if ($nl eq 'ko_KR') {
# Insert "%A " in front of a %p that directly follows "> ".
243 $s =~ s/(> )(%p)/$1%A $2/;
# Put %A in front of formats that start with the day of the month or with
# the month name.
# NOTE(review): unlike the two substitutions after it, the first replacement
# does not put back the leading double quote or the period it matched --
# confirm that this is intended.
248 $s =~ s/^"%e\./%A %e/;
249 $s =~ s/^"(%B %e, )/"%A, $1/;
250 $s =~ s/^"(%e %B )/"%A $1/;
# callback_dformat: adjusts the day-of-month conversion in the date format
# held in $s.  It is listed as dformat => \&callback_dformat, and the timedef
# spec for "d_fmt" ("<dformat<d_fmt<s") names it.
# NOTE(review): sparse listing -- the declaration of $s and the return
# statement are not shown here.
254 sub callback_dformat {
# Where %e sits directly next to %m, separated by <SOLIDUS>, "-" or ".",
# replace %e with %d: first for month-then-day, then for day-then-month.
257 $s =~ s/(%m(<SOLIDUS>|[-.]))%e/$1%d/;
258 $s =~ s/%e((<SOLIDUS>|[-.])%m)/%d$1/;
# callback_dtformat: rewrites the date/time format string held in $s so that
# it carries the weekday name (%A), with locale-specific handling for
# ja_JP, ko_KR, zh_CN and zh_TW.  It is listed as
# dtformat => \&callback_dtformat, and the timedef spec for "d_t_fmt"
# ("<dtformat<d_t_fmt<s") names it.
# NOTE(review): sparse listing -- the declaration of $s, several branch
# bodies/closing braces and the return statement are not shown here.
262 sub callback_dtformat {
# Locale identifier built as "<language>_<country>" from the callback data.
264 my $nl = $callback{data}{l} . "_" . $callback{data}{c};
266 if ($nl eq 'ja_JP') {
# Insert "%A " in front of a %H that directly follows "> ".
267 $s =~ s/(> )(%H)/$1%A $2/;
268 } elsif ($nl eq 'ko_KR' || $nl eq 'zh_CN' || $nl eq 'zh_TW') {
# Extra step for zh_CN and zh_TW only; its body is not visible here.
269 if ($nl ne 'ko_KR') {
# Insert "%A " in front of a %p that directly follows "> ".
# NOTE(review): whether this line is inside or after the zh-only branch
# cannot be told from this listing -- confirm against the full file.
272 $s =~ s/(> )(%p)/$1%A $2/;
# Put %A in front of formats that start with the day of the month or with
# the month name.
# NOTE(review): unlike the two substitutions after it, the first replacement
# does not put back the leading double quote or the period it matched --
# confirm that this is intended.
275 $s =~ s/^"%e\./%A %e/;
276 $s =~ s/^"(%B %e, )/"%A, $1/;
277 $s =~ s/^"(%e %B )/"%A $1/;
# callback_mdorder: listed as mdorder => \&callback_mdorder; the timedef spec
# for "md_order" ("<mdorder<d_fmt<s") names it.
# NOTE(review): only the undef guard is visible in this sparse listing; the
# declaration of $s and the rest of the body are not shown here.
281 sub callback_mdorder {
# An undefined input is passed straight through as undef.
283 return undef if (!defined $s);
# callback_altmon: listed as altmon => \&callback_altmon; the timedef spec
# for "altmon" ("<altmon<mon<as") names it.
# NOTE(review): sparse listing -- the code that fills @cleaned and the
# path taken when no alternative names exist are not shown here.
289 sub callback_altmon {
290 # if the language/country pair is known in %alternativemonths then
291 # return that, otherwise repeat mon
# The lookup is keyed by language, then country, taken from the callback data.
294 if (defined $alternativemonths{$callback{data}{l}}{$callback{data}{c}}) {
# The stored value is one string of names separated by ";".
295 my @altnames = split(";",$alternativemonths{$callback{data}{l}}{$callback{data}{c}});
# The result is handed back in the same ";"-separated form.
303 return join(";",@cleaned);
310 # for specified CJK locales, pad result with a space to enable
311 # columns to line up (style established in FreeBSD in 2001)
313 my $nl = $callback{data}{l} . "_" . $callback{data}{c};
315 if ($nl eq 'ja_JP' || $nl eq 'ko_KR' || $nl eq 'zh_CN' ||
316 $nl eq 'zh_HK' || $nl eq 'zh_TW') {
317 my @monthnames = split(";", $s);
319 foreach (@monthnames)
321 if ($_ =~ /^"<(two|three|four|five|six|seven|eight|nine)>/ ||
322 ($_ =~ /^"<one>/ && $_ !~ /^"<one>(<zero>|<one>|<two>)/))
324 $_ =~ s/^"/"<space>/;
328 return join(";",@cleaned);
333 ############################
336 my $directory = shift;
338 open(FIN, "$directory/UnicodeData.txt")
339 or die("Cannot open $directory/UnicodeData.txt");;
344 foreach my $l (@lines) {
345 my @a = split(/;/, $l);
347 $ucd{code2name}{"$a[0]"} = $a[1]; # Unicode name
348 $ucd{name2code}{"$a[1]"} = $a[0]; # Unicode code
363 foreach my $l (@lines) {
365 next if ($l =~ /^\#/);
368 if ($l eq "CHARMAP") {
373 next if (!$incharmap);
374 last if ($l eq "END CHARMAP");
376 $l =~ /^<([^\s]+)>\s+(.*)/;
379 $k =~ s/_/ /g; # unicode char string
380 $v =~ s/\\x//g; # UTF-8 char code
383 $utf8aliases{$k} = $prev_k if ($prev_v eq $v);
392 foreach my $e (sort(keys(%encodings))) {
393 if (!open(FIN, "$dir/$e.TXT")) {
394 print "Cannot open charmap for $e\n";
402 foreach my $l (@lines) {
404 next if ($l =~ /^\#/);
407 my @a = split(" ", $l);
409 $a[0] =~ s/^0[xX]//; # local char code
410 $a[1] =~ s/^0[xX]//; # unicode char code
411 $convertors{$e}{uc($a[1])} = uc($a[0]);
417 my %data = get_xmldata($ETCDIR);
418 %languages = %{$data{L}};
419 %translations = %{$data{T}};
420 %alternativemonths = %{$data{AM}};
421 %encodings = %{$data{E}};
# transform_ctypes: walks %languages (language -> family -> country) and, for
# each entry that applies to $TYPE, reads a source file from $UNIDIR/posix,
# records a SHA-1 digest of the collected lines in %languages and %hashtable,
# and opens draft files under "$TYPE.draft/" for the default encoding and for
# every other encoding listed for the entry.
# NOTE(review): this listing is sparse -- the declarations of $file,
# $actfile, @lines, $shex and $uhex, the read loops, the writes to FOUT and
# all closing braces are not shown here.
424 sub transform_ctypes {
# Create a "C" entry (family "x", country "x") for the default encoding so
# that the loops over %languages below also visit it.
426 $languages{"C"}{"x"}{data}{"x"}{$DEFENCODING} = undef;
428 foreach my $l (sort keys(%languages)) {
429 foreach my $f (sort keys(%{$languages{$l}})) {
430 foreach my $c (sort keys(%{$languages{$l}{$f}{data}})) {
# Skip entries whose "definitions" value is set and does not match $TYPE.
431 next if (defined $languages{$l}{$f}{definitions}
432 && $languages{$l}{$f}{definitions} !~ /$TYPE/);
433 $languages{$l}{$f}{data}{$c}{$DEFENCODING} = 0; # unread
# The placeholder value "x" means "no family" / "no country" and is left
# out of the file name.
435 $file .= "_" . $f if ($f ne "x");
436 $file .= "_" . $c if ($c ne "x");
# The default-encoding input is this one fixed file, whatever the locale.
439 my $filename = "$UNIDIR/posix/xx_Comm_C.UTF-8.src";
440 if (! -f $filename) {
441 print STDERR "Cannot open $filename\n";
# NOTE(review): the result of open() is not checked on this line; the -f
# test above is the only guard visible here.
444 open(FIN, "$filename");
445 print "Reading from $filename for ${l}_${f}_${c}\n";
446 $languages{$l}{$f}{data}{$c}{$DEFENCODING} = 1; # read
# The digest of the collected lines replaces the read/unread marker and
# becomes the %hashtable key under which this locale name is recorded.
454 $shex = sha1_hex(join("\n", @lines));
455 $languages{$l}{$f}{data}{$c}{$DEFENCODING} = $shex;
456 $hashtable{$shex}{"${l}_${f}_${c}.$DEFENCODING"} = 1;
457 open(FOUT, ">$TYPE.draft/$actfile.$DEFENCODING.src");
460 foreach my $enc (sort keys(%{$languages{$l}{$f}{data}{$c}})) {
# The default encoding was handled above; only the others are processed here.
461 next if ($enc eq $DEFENCODING);
462 $filename = "$UNIDIR/posix/$file.$DEFENCODING.src";
463 if (! -f $filename) {
464 print STDERR "Cannot open $filename\n";
468 open(FIN, "$filename");
# The comment_char/escape_char lines and the LC_CTYPE ... END LC_CTYPE
# section are singled out; what is done with them is not visible here.
470 if ((/^comment_char\s/) || (/^escape_char\s/)){
473 if (/^LC_CTYPE/../^END LC_CTYPE/) {
# The encoding name is part of the hashed text for the non-default encodings.
478 $uhex = sha1_hex(join("\n", @lines) . $enc);
479 $languages{$l}{$f}{data}{$c}{$enc} = $uhex;
480 $hashtable{$uhex}{"${l}_${f}_${c}.$enc"} = 1;
481 open(FOUT, ">$TYPE.draft/$actfile.$enc.src");
483 # Warning: Do not edit. This file is automatically extracted from the
484 # tools in /usr/src/tools/tools/locale. The data is obtained from the
485 # CLDR project, obtained from http://cldr.unicode.org/
486 # -----------------------------------------------------------------------------
# transform_collation: walks %languages (language -> family -> country) and,
# for each entry that applies to $TYPE, picks a default-encoding source file,
# records a SHA-1 digest of the collected lines in %languages and %hashtable,
# opens a draft file under "$TYPE.draft/", and then copies that draft to one
# file per additional encoding, recording the same digest for each.
# NOTE(review): this listing is sparse -- the declarations of $file,
# $actfile, @lines and $shex, the read loop, the writes to FOUT, parts of
# the file-selection conditions and all closing braces are not shown here.
497 sub transform_collation {
498 foreach my $l (sort keys(%languages)) {
499 foreach my $f (sort keys(%{$languages{$l}})) {
500 foreach my $c (sort keys(%{$languages{$l}{$f}{data}})) {
# Skip entries whose "definitions" value is set and does not match $TYPE.
501 next if (defined $languages{$l}{$f}{definitions}
502 && $languages{$l}{$f}{definitions} !~ /$TYPE/);
503 $languages{$l}{$f}{data}{$c}{$DEFENCODING} = 0; # unread
# The placeholder family "x" means "no family" and is left out of the name.
506 $file .= $f . "_" if ($f ne "x");
# Candidate inputs seen below: $UNIDIR/posix, $ETCDIR, and the name given by
# the family's "fallback" value.  The conditions that choose between them
# are only partly visible here.
510 my $filename = "$UNIDIR/posix/$file.$DEFENCODING.src";
511 $filename = "$ETCDIR/$file.$DEFENCODING.src"
514 && defined $languages{$l}{$f}{fallback}) {
515 $file = $languages{$l}{$f}{fallback};
516 $filename = "$UNIDIR/posix/$file.$DEFENCODING.src";
518 $filename = "$UNIDIR/posix/$file.$DEFENCODING.src"
520 if (! -f $filename) {
522 "Cannot open $file.$DEFENCODING.src or fallback\n";
# NOTE(review): the result of open() is not checked on this line; the -f
# test above is the only guard visible here.
525 open(FIN, "$filename");
526 print "Reading from $filename for ${l}_${f}_${c}\n";
527 $languages{$l}{$f}{data}{$c}{$DEFENCODING} = 1; # read
# The comment_char/escape_char lines and the LC_COLLATE ... END LC_COLLATE
# section are singled out; what is done with them is not visible here.
531 if ((/^comment_char\s/) || (/^escape_char\s/)){
534 if (/^LC_COLLATE/../^END LC_COLLATE/) {
# The digest of the collected lines replaces the read/unread marker and
# becomes the %hashtable key under which this locale name is recorded.
540 $shex = sha1_hex(join("\n", @lines));
541 $languages{$l}{$f}{data}{$c}{$DEFENCODING} = $shex;
542 $hashtable{$shex}{"${l}_${f}_${c}.$DEFENCODING"} = 1;
543 open(FOUT, ">$TYPE.draft/$actfile.$DEFENCODING.src");
545 # Warning: Do not edit. This file is automatically extracted from the
546 # tools in /usr/src/tools/tools/locale. The data is obtained from the
547 # CLDR project, obtained from http://cldr.unicode.org/
548 # -----------------------------------------------------------------------------
553 foreach my $enc (sort keys(%{$languages{$l}{$f}{data}{$c}})) {
# Every other encoding gets a copy of the default-encoding draft and is
# recorded under the same digest.
554 next if ($enc eq $DEFENCODING);
555 copy ("$TYPE.draft/$actfile.$DEFENCODING.src",
556 "$TYPE.draft/$actfile.$enc.src");
557 $languages{$l}{$f}{data}{$c}{$enc} = $shex;
558 $hashtable{$shex}{"${l}_${f}_${c}.$enc"} = 1;
566 foreach my $l (sort keys(%languages)) {
567 foreach my $f (sort keys(%{$languages{$l}})) {
568 foreach my $c (sort keys(%{$languages{$l}{$f}{data}})) {
569 next if (defined $languages{$l}{$f}{definitions}
570 && $languages{$l}{$f}{definitions} !~ /$TYPE/);
572 $languages{$l}{$f}{data}{$c}{$DEFENCODING} = 0; # unread
575 $file .= $f . "_" if ($f ne "x");
578 my $filename = "$UNIDIR/posix/$file.$DEFENCODING.src";
579 $filename = "$ETCDIR/$file.$DEFENCODING.src"
582 && defined $languages{$l}{$f}{fallback}) {
583 $file = $languages{$l}{$f}{fallback};
584 $filename = "$UNIDIR/posix/$file.$DEFENCODING.src";
586 $filename = "$UNIDIR/posix/$file.$DEFENCODING.src"
588 if (! -f $filename) {
590 "Cannot open $file.$DEFENCODING.src or fallback\n";
593 open(FIN, "$filename");
594 print "Reading from $filename for ${l}_${f}_${c}\n";
595 $languages{$l}{$f}{data}{$c}{$DEFENCODING} = 1; # read
600 foreach my $k (keys(%keys)) {
601 foreach my $line (@lines) {
603 next if (!$continue && $line !~ /^$k\s/);
610 $values{$l}{$f}{$c}{$k} = ""
611 if (!defined $values{$l}{$f}{$c}{$k});
613 $continue = ($line =~ /\/$/);
614 $line =~ s/\/$// if ($continue);
616 while ($line =~ /_/) {
618 s/\<([^>_]+)_([^>]+)\>/<$1 $2>/;
620 die "_ in data - $line" if ($line =~ /_/);
621 $values{$l}{$f}{$c}{$k} .= $line;
623 last if (!$continue);
639 # Conversion to UTF-8 can be done from the Unicode name to
640 # the UTF-8 character code.
643 die "Cannot convert $s in $e (charmap)" if (!defined $v);
646 # Conversion to these encodings can be done from the Unicode
647 # name to the Unicode code to the encoding's code.
650 $ucc = $ucd{name2code}{$s} if (defined $ucd{name2code}{$s});
651 $ucc = $ucd{name2code}{$utf8aliases{$s}}
654 && defined $ucd{name2code}{$utf8aliases{$s}});
657 if (defined $translations{$e}{$s}{hex}) {
658 $v = $translations{$e}{$s}{hex};
660 } elsif (defined $translations{$e}{$s}{ucc}) {
661 $ucc = $translations{$e}{$s}{ucc};
665 die "Cannot convert $s in $e (ucd string)" if (!defined $ucc);
666 $v = $convertors{$e}{$ucc} if (!defined $v);
668 $v = $translations{$e}{$s}{hex}
669 if (!defined $v && defined $translations{$e}{$s}{hex});
671 if (!defined $v && defined $translations{$e}{$s}{unicode}) {
672 my $ucn = $translations{$e}{$s}{unicode};
673 $ucc = $ucd{name2code}{$ucn}
674 if (defined $ucd{name2code}{$ucn});
675 $ucc = $ucd{name2code}{$utf8aliases{$ucn}}
677 && defined $ucd{name2code}{$utf8aliases{$ucn}});
678 $v = $convertors{$e}{$ucc};
681 die "Cannot convert $s in $e (charmap)" if (!defined $v);
684 return pack("C", hex($v)) if (length($v) == 2);
685 return pack("CC", hex(substr($v, 0, 2)), hex(substr($v, 2, 2)))
686 if (length($v) == 4);
687 return pack("CCC", hex(substr($v, 0, 2)), hex(substr($v, 2, 2)),
688 hex(substr($v, 4, 2))) if (length($v) == 6);
689 print STDERR "Cannot convert $e $s\n";
690 return "length = " . length($v);
698 return $translations{$enc}{$v} if (defined $translations{$enc}{$v});
703 foreach my $l (sort keys(%languages)) {
704 foreach my $f (sort keys(%{$languages{$l}})) {
705 foreach my $c (sort keys(%{$languages{$l}{$f}{data}})) {
706 next if (defined $languages{$l}{$f}{definitions}
707 && $languages{$l}{$f}{definitions} !~ /$TYPE/);
708 foreach my $enc (sort keys(%{$languages{$l}{$f}{data}{$c}})) {
709 if ($languages{$l}{$f}{data}{$c}{$DEFENCODING} eq "0") {
710 print "Skipping ${l}_" .
711 ($f eq "x" ? "" : "${f}_") .
716 $file .= "_" . $f if ($f ne "x");
718 print "Writing to $file in $enc\n";
720 if ($enc ne $DEFENCODING &&
721 !defined $convertors{$enc}) {
722 print "Failed! Cannot convert to $enc.\n";
726 open(FOUT, ">$TYPE.draft/$file.$enc.new");
730 # Warning: Do not edit. This file is automatically generated from the
731 # tools in /usr/src/tools/tools/locale. The data is obtained from the
732 # CLDR project, obtained from http://cldr.unicode.org/
733 # -----------------------------------------------------------------------------
735 foreach my $k (keys(%keys)) {
738 die("Unknown $k in \%DESC")
739 if (!defined $DESC{$k});
741 $output .= "#\n# $DESC{$k}\n";
743 # Replace one row with another
751 $callback{data}{c} = $c;
752 $callback{data}{k} = $k;
753 $callback{data}{f} = $f;
754 $callback{data}{l} = $l;
755 $callback{data}{e} = $enc;
756 my @a = split(/\</, substr($g, 1));
758 &{$callback{$a[0]}}($values{$l}{$f}{$c}{$a[1]});
759 $values{$l}{$f}{$c}{$k} = $rv;
761 $callback{data} = ();
764 my $v = $values{$l}{$f}{$c}{$k};
765 $v = "undef" if (!defined $v);
779 while ($v =~ /^(.*?)<(.*?)>(.*)/) {
784 my $rv = decodecldr($enc, $cm);
785 # $rv = translate($enc, $cm)
789 "Could not convert $k ($cm) from $DEFENCODING to $enc\n";
794 $v = $p1 . $rv . $p3;
800 foreach my $v (split(/;/, $v)) {
804 while ($v =~ /^(.*?)<(.*?)>(.*)/) {
812 # $rv = translate($enc,
817 "Could not convert $k ($cm) from $DEFENCODING to $enc\n";
833 $languages{$l}{$f}{data}{$c}{$enc} = sha1_hex($output);
834 $hashtable{sha1_hex($output)}{"${l}_${f}_${c}.$enc"} = 1;
835 print FOUT "$output# EOF\n";
839 rename("$TYPE.draft/$file.$enc.new",
840 "$TYPE.draft/$file.$enc.src");
842 rename("$TYPE.draft/$file.$enc.new",
843 "$TYPE.draft/$file.$enc.failed");
852 print "Creating Makefile for $TYPE\n";
858 if ($TYPE eq "colldef") {
859 $SRCOUT = "localedef \${LOCALEDEF_ENDIAN} -D -U " .
860 "-i \${.IMPSRC} \\\n" .
861 "\t-f \${MAPLOC}/map.\${.TARGET:T:R:E:C/@.*//} " .
862 "\${.OBJDIR}/\${.IMPSRC:T:R}";
863 $MAPLOC = "MAPLOC=\t\t\${.CURDIR}/../../tools/tools/" .
864 "locale/etc/final-maps\n";
865 $SRCOUT2 = "LC_COLLATE";
867 ".for f t in \${LOCALES_MAPPED}\n" .
868 "FILES+=\t\$t.LC_COLLATE\n" .
869 "FILESDIR_\$t.LC_COLLATE=\t\${LOCALEDIR}/\$t\n" .
870 "\$t.LC_COLLATE: \${.CURDIR}/\$f.src\n" .
871 "\tlocaledef \${LOCALEDEF_ENDIAN} -D -U " .
872 "-i \${.ALLSRC} \\\n" .
873 "\t\t-f \${MAPLOC}/map.\${.TARGET:T:R:E:C/@.*//} \\\n" .
874 "\t\t\${.OBJDIR}/\${.TARGET:T:R}\n" .
876 $SRCOUT4 = "## LOCALES_MAPPED\n";
878 elsif ($TYPE eq "ctypedef") {
879 $SRCOUT = "localedef \${LOCALEDEF_ENDIAN} -D -U -c " .
880 "-w \${MAPLOC}/widths.txt \\\n" .
881 "\t-f \${MAPLOC}/map.\${.IMPSRC:T:R:E} " .
882 "\\\n\t-i \${.IMPSRC} \${.OBJDIR}/\${.IMPSRC:T:R} " .
884 $SRCOUT2 = "LC_CTYPE";
885 $MAPLOC = "MAPLOC=\t\t\${.CURDIR}/../../tools/tools/" .
886 "locale/etc/final-maps\n";
887 $SRCOUT3 = "## SYMPAIRS\n\n" .
888 ".for s t in \${SYMPAIRS}\n" .
889 "\${t:S/src\$/LC_CTYPE/}: " .
891 "\tlocaledef \${LOCALEDEF_ENDIAN} -D -U -c " .
892 "-w \${MAPLOC}/widths.txt \\\n" .
893 "\t-f \${MAPLOC}/map.\${.TARGET:T:R:C/^.*\\.//} " .
894 "\\\n\t-i \${.ALLSRC} \${.OBJDIR}/\${.TARGET:T:R} " .
899 $SRCOUT = "grep -v -E '^(\#\$\$|\#[ ])' < \${.IMPSRC} > \${.TARGET}";
903 open(FOUT, ">$TYPE.draft/Makefile");
906 # Warning: Do not edit. This file is automatically generated from the
907 # tools in /usr/src/tools/tools/locale.
909 LOCALEDIR= \${SHAREDIR}/locale
910 FILESNAME= $FILESNAMES{$TYPE}
911 .SUFFIXES: .src .${SRCOUT2}
915 if ($TYPE eq "colldef" || $TYPE eq "ctypedef") {
917 .include <bsd.endian.mk>
932 foreach my $hash (keys(%hashtable)) {
933 # For colldef, weight LOCALES to UTF-8
934 # Sort as upper-case and reverse to achieve it
935 # Make en_US, ru_RU, and ca_AD preferred
937 if ($TYPE eq "colldef") {
939 if ($a eq 'en_x_US.UTF-8' ||
940 $a eq 'ru_x_RU.UTF-8' ||
941 $a eq 'ca_x_AD.UTF-8') { return -1; }
942 elsif ($b eq 'en_x_US.UTF-8' ||
943 $b eq 'ru_x_RU.UTF-8' ||
944 $b eq 'ca_x_AD.UTF-8') { return 1; }
945 else { return uc($b) cmp uc($a); }
946 } keys(%{$hashtable{$hash}});
947 } elsif ($TYPE eq "ctypedef") {
949 if ($a eq 'C_x_x.UTF-8') { return -1; }
950 elsif ($b eq 'C_x_x.UTF-8') { return 1; }
951 if ($a =~ /^en_x_US/) { return -1; }
952 elsif ($b =~ /^en_x_US/) { return 1; }
954 if ($a =~ /^en_x_GB.ISO8859-15/ ||
955 $a =~ /^ru_x_RU/) { return -1; }
956 elsif ($b =~ /^en_x_GB.ISO8859-15/ ||
957 $b =~ /ru_x_RU/) { return 1; }
958 else { return uc($b) cmp uc($a); }
960 } keys(%{$hashtable{$hash}});
963 if ($a =~ /_Comm_/ ||
964 $b eq 'en_x_US.UTF-8') { return 1; }
965 elsif ($b =~ /_Comm_/ ||
966 $a eq 'en_x_US.UTF-8') { return -1; }
967 else { return uc($b) cmp uc($a); }
968 } keys(%{$hashtable{$hash}});
971 my $link = shift(@files);
972 $link =~ s/_x_x//; # special case for C
973 $link =~ s/_x_/_/; # strip family if none there
974 foreach my $file (@files) {
975 my @a = split(/_/, $file);
976 my @b = split(/\./, $a[-1]);
978 print FOUT "SAME+=\t\t$link $file\n";
979 undef($languages{$a[0]}{$a[1]}{data}{$b[0]}{$b[1]});
984 foreach my $l (sort keys(%languages)) {
985 foreach my $f (sort keys(%{$languages{$l}})) {
986 foreach my $c (sort keys(%{$languages{$l}{$f}{data}})) {
987 next if (defined $languages{$l}{$f}{definitions}
988 && $languages{$l}{$f}{definitions} !~ /$TYPE/);
989 if (defined $languages{$l}{$f}{data}{$c}{$DEFENCODING}
990 && $languages{$l}{$f}{data}{$c}{$DEFENCODING} eq "0") {
991 print "Skipping ${l}_" . ($f eq "x" ? "" : "${f}_") .
995 foreach my $e (sort keys(%{$languages{$l}{$f}{data}{$c}})) {
997 $file .= "_" . $f if ($f ne "x");
998 $file .= "_" . $c if ($c ne "x");
999 next if (!defined $languages{$l}{$f}{data}{$c}{$e});
1000 print FOUT "LOCALES+=\t$file.$e\n";
1003 if (defined $languages{$l}{$f}{nc_link}) {
1004 foreach my $e (sort keys(%{$languages{$l}{$f}{data}{$c}})) {
1005 my $file = $l . "_";
1006 $file .= $f . "_" if ($f ne "x");
1008 print FOUT "SAME+=\t\t$file.$e $languages{$l}{$f}{nc_link}.$e\t# legacy (lang/country change)\n";
1012 if (defined $languages{$l}{$f}{e_link}) {
1013 foreach my $el (split(" ", $languages{$l}{$f}{e_link})) {
1014 my @a = split(/:/, $el);
1015 my $file = $l . "_";
1016 $file .= $f . "_" if ($f ne "x");
1018 print FOUT "SAME+=\t\t$file.$a[0] $file.$a[1]\t# legacy (same charset)\n";
1028 FILES= \${LOCALES:S/\$/.${SRCOUT2}/}
1029 CLEANFILES= \${FILES}
1031 .for f t in \${SAME}
1032 SYMLINKS+= ../\$f/\${FILESNAME} \\
1033 \${LOCALEDIR}/\$t/\${FILESNAME}
1036 .for f in \${LOCALES}
1037 FILESDIR_\${f}.${SRCOUT2}= \${LOCALEDIR}/\${f}
1040 ${SRCOUT3}.include <bsd.prog.mk>