rockbox/tools/updatelang

#!/usr/bin/perl -s -w
#             __________               __   ___.
#   Open      \______   \ ____   ____ |  | _\_ |__   _______  ___
#   Source     |       _//  _ \_/ ___\|  |/ /| __ \ /  _ \  \/  /
#   Jukebox    |    |   (  <_> )  \___|    < | \_\ (  <_> > <  <
#   Firmware   |____|_  /\____/ \___  >__|_ \|___  /\____/__/\_ \
#                     \/            \/     \/    \/            \/
#
# Copyright (C) 2020 Solomon Peachy
#

use utf8;
use File::Basename;

sub trim {
    my ($string) = @_;
    $string =~ s/^\s+//;
    $string =~ s/\s+$//;
    return $string;
}

sub parselangfile {
    my ($filename) = @_;
    my %phrases;
    my @order;
    my %empty = ( #'phrase' => {},
		  #'source' => {},
		  #'dest' => {},
		  #'voice' => {},
		  'notes' => "",
		  'new' => 0
	);
    my %thisphrase = %empty;

    open(FH, "<$filename") || die ("Can't open $filename");
    my @lines = <FH>;
    close(FH);

    my $pos = 'lang';
    my $id = '';
    my @comments;

    foreach my $line (@lines) {
	$line = trim($line);
        if($line =~ /^ *###/) {
	    # Filter out warnings from prior runs
	    next;
        } elsif($line =~ /^ *#/) {
	    push(@comments, "$line\n") if ($pos eq 'lang');
            # comments are ignored!
            next;
        } elsif ($pos eq 'phrase' && $line =~ /^([^:]+): ?(.*)$/) {
	    $thisphrase{$pos}->{$1} = $2;
	    if ($1 eq 'id') {
		push(@order, $2);
		$id = $2;
	    }
	} elsif ($pos ne 'phrase' && $line =~ /^([^:]+): ?\"?([^\"]*)\"?$/) {
	    my @targets = split(',', $1);
	    my $w = $2;

	    foreach (@targets) {
		my $l = trim($_);
		# Convert some obsolete keys
		if ($l eq "swcodec") {
		    $l = "*";
		} elsif ($l eq "lcd_bitmap") {
		    $l = "*";
		} elsif ($l eq "recording_swcodec") {
		    $l = "recording";
#		} elsif ($id =~ /USB_MODE/ && $l =~ /ibassodx/) {
#		    $l = "*";
		}

		$thisphrase{$pos}->{$l} = $w;
	    }
	}
	if ($line eq '</voice>' ||
	    $line eq '</dest>' ||
	    $line eq '</source>' ||
	    $line eq '<phrase>') {
	    $pos = 'phrase';
	} elsif ($line eq '</phrase>') {
	    my %copy = %thisphrase;
	    $phrases{$id} = \%copy;
	    %thisphrase = %empty;
	    $pos = 'lang';
	    $id = '';
	} elsif ($line eq '<source>') {
	    $pos = 'source';
	} elsif ($line eq '<dest>') {
	    $pos = 'dest';
	} elsif ($line eq '<voice>') {
	    $pos = 'voice';
	}
    }
    $phrases{'HEADER'} = \@comments;
    $phrases{'ORDER'} = \@order;
    return %phrases;
}

sub combinetgts {
    my (%tgtmap) = (@_);
    my %strmap;
    my %combined;

    # Reverse-map things
    foreach my $tgt (sort(keys(%tgtmap))) {
	next if ($tgt eq '*');  # Do not combine anything with fallback
	if (defined($strmap{$tgtmap{$tgt}})) {
	    $strmap{$tgtmap{$tgt}} .= ",$tgt";
	} else {
	    $strmap{$tgtmap{$tgt}} = "$tgt";
	}
    }

    # Copy over default/fallback as it was skipped
    $combined{'*'} = $tgtmap{'*'};

    foreach my $str (keys(%strmap)) {
	$combined{$strmap{$str}} = $str;
    }

    return %combined;
}

##################

if($#ARGV != 2) {
    print "Usage: updatelang <english.lang> <otherlang> <outfile|->\n";
    exit;
}

# Parse master file
my %english = parselangfile($ARGV[0]);
my @englishorder = @{$english{'ORDER'}};

# Parse secondary file
my %lang = parselangfile($ARGV[1]);
my @langorder = @{$lang{'ORDER'}};
my @langheader = @{$lang{'HEADER'}};

# Clean up
delete $english{'ORDER'};
delete $english{'HEADER'};
delete $lang{'ORDER'};
delete $lang{'HEADER'};

# Extract language names
my @tmp = split(/\./, basename($ARGV[0]));
my $f1 = $tmp[0];
@tmp = split(/\./, basename($ARGV[1]));
my $f2 = $tmp[0];
undef @tmp;

# Read in ignore list
my $igname = dirname($0) . "/langignorelist.txt";
open (FH, "<$igname") || die ("Can't open $igname!");
my @ignorelist = <FH>;
close (FH);
sub not_ignorelist {
    my ($key) = @_;
    foreach (@ignorelist) {
	chomp;
	if ($_ eq $key) {
	    return 0;
	}
    }
    return 1;
}
undef $igname;

# Do we care about notes?
my $printnotes = 1;
my $ignoredups = 0;

if ($f1 eq $f2) {
    # Ignore all notes for master language
    $printnotes = 0;
}

if (index($f2, $f1) > -1) {
    # Ignore duplicates for sub-languages
    $ignoredups = 1;
}

# work out the missing phrases
my %missing;
my @missingorder;

foreach (@englishorder) {
    $missing{$_} = 1;
}
foreach (@langorder) {
    if (!defined($english{$_})) {
	delete($lang{$_});
#	print "#!! '$_' no longer needed\n";
	next;
    }
    delete $missing{$_};
}
foreach (@englishorder) {
    push(@missingorder, $_) if defined($missing{$_});
}
# And add them to the phrase list.
foreach (@missingorder) {
#    print "#!! '$_' missing\n";
    push(@langorder, $_);
    $lang{$_} = $english{$_};
    $lang{$_}{'notes'} .= "### This phrase is missing entirely, copying from english!\n";
    $lang{$_}{'new'} = 1;
}
undef @missingorder;
undef %missing;

# Sanity-check a few things
foreach my $id (@langorder) {
    if (!defined($english{$id})) {
	next;
    }
    my %ep = %{$english{$id}{'phrase'}};
    my %lp = %{$lang{$id}{'phrase'}};

    if ($lp{'desc'} ne $ep{'desc'} || $ep{'desc'} eq 'deprecated') {
	if ($ep{'desc'} eq 'deprecated') {
	    # Nuke all deprecated targets; just copy from English
#	    print "#!! '$id' deprecated, deleting\n";
	    $lang{$id} = $english{$id};
	} else {
	    $lang{$id}{'notes'} .= "### The 'desc' field for '$id' differs from the english!\n### the previously used desc is commented below:\n### desc: $lp{desc}\n";
	    $lang{$id}{'phrase'}{'desc'} = 	$english{$id}{'phrase'}{'desc'};
	    #	print "#!! '$id' changed description\n";
	}
    }

    if (!defined($ep{'user'}) || length($ep{'user'}) == 0) {
	$lp{'user'} = 'core';
    }

    if (!defined($lp{'user'}) || $lp{'user'} ne $ep{'user'}) {
	$lang{$id}{'notes'} .= "### The 'user' field for '$id' differs from the english!\n### the previously used desc is commented below:\n### desc: $lp{user}\n";
	if (!defined($lp{'user'}) || length($lp{'user'}) == 0) {
	    $lp{'user'} = $ep{'user'};
	}
	$lang{$id}{'phrase'}{'user'} = $english{$id}{'phrase'}{'user'};
#	print "#!! '$id' changed user\n";
    }
}

# Check sources
foreach my $id (@langorder) {
    if (!defined($english{$id})) {
	next;
    }
    my %ep = %{$english{$id}{'source'}};
    my %lp;

    if (defined($lang{$id}{'source'})) {
	%lp = %{$lang{$id}{'source'}};
    } else {
	%lp = ();
    }

    foreach my $tgt (keys(%lp)) {
	if (!defined($ep{$tgt})) {
	    # Delete any targets that have been nuked in master
	    delete($lang{$id}{'source'}{$tgt});
	}
    }
    foreach my $tgt (keys(%ep)) {
	if (!defined($lp{$tgt})) {
	    # If it doesn't exist in the language, copy it from English
	    if ($ep{$tgt} ne 'none' && $ep{$tgt} ne '' ) {
		$lang{$id}{'notes'} .= "### The <source> section for '$id:$tgt' is missing! Copying from english!\n";
#		print "#!! '$id:$tgt' source missing\n";
	    }
	    $lang{$id}{'source'}{$tgt} = $english{$id}{'source'}{$tgt};
	} elsif ($lp{$tgt} ne $ep{$tgt}) {
	    # If the source string differs, complain, and copy from English
	    $lang{$id}{'notes'} .= "### The <source> section for '$id:$tgt' differs from the english!\n";
	    $lang{$id}{'notes'} .= "### the previously used one is commented below:\n";
            $lang{$id}{'notes'} .= "### $english{$id}{source}{$tgt}\n";
#	    print "#!! '$id:$tgt' source changed ('$lp{$tgt}' vs '$ep{$tgt}')\n";
	    $lang{$id}{'source'}{$tgt} = $english{$id}{'source'}{$tgt};
	}
    }
}

# Check dests
foreach my $id (@langorder) {
    if (!defined($english{$id})) {
	next;
    }
    my %ep = %{$english{$id}{'dest'}};
    my %lp;

    if (defined($lang{$id}{'dest'})) {
	%lp = %{$lang{$id}{'dest'}};
    } else {
	%lp = ();
    }

    foreach my $tgt (keys(%lp)) {
	if (!defined($ep{$tgt})) {
	    # Delete any targets that have been nuked in master
	    delete($lang{$id}{'dest'}{$tgt});
	}
    }
    foreach my $tgt (keys(%ep)) {
	if (!defined($lp{$tgt}) || ($lp{$tgt} eq 'none')) {
	    # If it doesn't exist in the language, copy it from English
	    if ($ep{$tgt} ne 'none' && $ep{$tgt} ne '' ) {
		$lang{$id}{'notes'} .= "### The <dest> section for '$id:$tgt' is missing! Copying from english!\n";
#		print "#!! '$id:$tgt' dest missing\n";
	    }
	    $lang{$id}{'dest'}{$tgt} = $english{$id}{'dest'}{$tgt};
	} elsif ($lp{$tgt} ne $ep{$tgt}) {
	    # If the source string differs, complain, and copy from English
	    if ($lp{$tgt} eq '' && $ep{$tgt} ne '') {
		$lang{$id}{'notes'} .= "### The <dest> section for '$id:$tgt' is blank! Copying from english!\n";
#		print "#!! '$id:$tgt' dest is blank ('$lp{$tgt}' vs '$ep{$tgt}')\n";
		$lang{$id}{'dest'}{$tgt} = $english{$id}{'dest'}{$tgt};
	    } elsif ($lp{$tgt} ne '' && $ep{$tgt} eq '') {
		# It should be kept blank!
		$lang{$id}{'notes'} .= "### The <dest> section for '$id:$tgt' is not blank!\n";
		$lang{$id}{'notes'} .= "### the previously used one is commented below:\n";
		$lang{$id}{'notes'} .= "### $english{$id}{dest}{$tgt}\n";
#		print "#!! '$id:$tgt' dest not blank ('$lp{$tgt}' vs '$ep{$tgt}')\n";
		$lang{$id}{'dest'}{$tgt} = $english{$id}{'dest'}{$tgt};
	    }
	} elsif ($lp{$tgt} ne 'none' && $lp{$tgt} ne '' && not_ignorelist($id) && !$lang{$id}{'new'} && !$ignoredups) {
	    $lang{$id}{'notes'} .= "### The <dest> section for '$id:$tgt' is identical to english!\n";
#	    print "#!! '$id:$tgt' dest identical ('$lp{$tgt}')\n";
	}
    }
}

# Check voices
foreach my $id (@langorder) {
    if (!defined($english{$id})) {
	next;
    }
    my %ep = %{$english{$id}{'voice'}};
    my %lp;

    if (defined($lang{$id}{'voice'})) {
	%lp = %{$lang{$id}{'voice'}};
    } else {
	%lp = ();
    }

    foreach my $tgt (keys(%lp)) {
	if (!defined($ep{$tgt})) {
	    # Delete any targets that have been nuked in master
	    delete($lang{$id}{'voice'}{$tgt});
	}
    }
    foreach my $tgt (keys(%ep)) {
	if (!defined($lp{$tgt}) || ($lp{$tgt} eq 'none')) {
	    # If it doesn't exist in the language, copy it from English
	    if ($ep{$tgt} ne 'none' && $ep{$tgt} ne '' ) {
		$lang{$id}{'notes'} .= "### The <voice> section for '$id:$tgt' is missing! Copying from english!\n";
#		print "#!! '$id:$tgt' voice missing\n";
	    }
	    $lang{$id}{'voice'}{$tgt} = $english{$id}{'voice'}{$tgt};
	} elsif ($lp{$tgt} ne $ep{$tgt}) {
	    if ($lp{$tgt} eq '' && $ep{$tgt} ne '') {
		# If the lang voice string is blank, complain, and copy from English
		$lang{$id}{'notes'} .= "### The <voice> section for '$id:$tgt' is blank! Copying from english!\n";
#		print "#!! '$id:$tgt' voice is blank ('$lp{$tgt}' vs '$ep{$tgt}')\n";
		$lang{$id}{'voice'}{$tgt} = $english{$id}{'voice'}{$tgt};
	    } elsif ($lp{$tgt} ne '' && $ep{$tgt} eq '') {
		if ($id ne 'VOICE_NUMERIC_TENS_SWAP_SEPARATOR') {
		    # If it's not blank, clear it and complain!
		    $lang{$id}{'notes'} .= "### The <voice> section for '$id:$tgt' is not blank!\n";
		    $lang{$id}{'notes'} .= "### the previously used one is commented below:\n";
		    $lang{$id}{'notes'} .= "### $english{$id}{voice}{$tgt}\n";
		    #		print "#!! '$id:$tgt' voice not blank ('$lp{$tgt}' vs '$ep{$tgt}')\n";
		    $lang{$id}{'voice'}{$tgt} = $english{$id}{'voice'}{$tgt};
		}
	    }
	} elsif ($lp{$tgt} ne 'none' && $lp{$tgt} ne '' && not_ignorelist($id) && !$lang{$id}{'new'} && !$ignoredups) {
	    $lang{$id}{'notes'} .= "### The <voice> section for '$id:$tgt' is identical to english!\n";
#	    print "#!! '$id:$tgt' voice identical ('$lp{$tgt}')\n";
	}
    }
}

########## Write new language file
my $fh;
if ($ARGV[2] ne '-') {
    open(FH, ">$ARGV[2]") || die ("Can't open $ARGV[2]");
    $fh = *FH;
} else {
    $fh = *STDOUT;
}

foreach (@langheader) {
    print $fh $_;
}

my @finalorder = @langorder;  # TODO make configurable vs @englishorder
foreach my $id (@finalorder) {
    if (!defined($english{$id})) {
	next;
    }
    my %lp;

    # phrase
    %lp = %{$lang{$id}{'phrase'}};

    # Drop all deprecated phrases?
#    next if ($lp{'desc'} eq 'deprecated');

    if (length($lang{$id}{'notes'}) && $printnotes) {
	print $fh "$lang{$id}{notes}";
    }
    print $fh "<phrase>\n";
    print $fh "  id: $lp{id}\n";
    if ($lp{'desc'} ne '') {
	print $fh "  desc: $lp{desc}\n";
    } else {
	print $fh "  desc:\n";
    }
    print $fh "  user: $lp{user}\n";

    # source
    %lp = combinetgts(%{$lang{$id}{'source'}});
    print $fh "  <source>\n";
    foreach my $tgt (sort(keys(%lp))) {
	if ($lp{$tgt} eq 'none') {
	    print $fh "    $tgt: $lp{$tgt}\n";
	} else {
	    print $fh "    $tgt: \"$lp{$tgt}\"\n";
	}
    }
    print $fh "  </source>\n";

    # dest
    %lp = combinetgts(%{$lang{$id}{'dest'}});
    print $fh "  <dest>\n";
    foreach my $tgt (sort(keys(%lp))) {
	if ($lp{$tgt} eq 'none') {
	    print $fh "    $tgt: $lp{$tgt}\n";
	} else {
	    print $fh "    $tgt: \"$lp{$tgt}\"\n";
	}
    }
    print $fh "  </dest>\n";

    # voice
    %lp = combinetgts(%{$lang{$id}{'voice'}});
    print $fh "  <voice>\n";
    foreach my $tgt (sort(keys(%lp))) {
	if ($lp{$tgt} eq 'none') {
	    print $fh "    $tgt: $lp{$tgt}\n";
	} else {
	    print $fh "    $tgt: \"$lp{$tgt}\"\n";
	}
    }
    print $fh "  </voice>\n";

    # FiN
    print $fh "</phrase>\n";
}

if ($ARGV[2] ne '-') {
    close(FH);
}
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`#!/usr/bin/perl -s -w`
			`# __________ __ ___.`
			`# Open \______ \ ____ ____ \| \| _\_ \|__ _______ ___`
			`# Source \| _// _ \_/ ___\\| \|/ /\| __ \ / _ \ \/ /`
			`# Jukebox \| \| ( <_> ) \___\| < \| \_\ ( <_> > < <`
			`# Firmware \|____\|_ /\____/ \___ >__\|_ \\|___ /\____/__/\_ \`
			`# \/ \/ \/ \/ \/`
			`#`
			`# Copyright (C) 2020 Solomon Peachy`
			`#`

			`use utf8;`
			`use File::Basename;`

			`sub trim {`
			`my ($string) = @_;`
			`$string =~ s/^\s+//;`
			`$string =~ s/\s+$//;`
			`return $string;`
			`}`

			`sub parselangfile {`
			`my ($filename) = @_;`
			`my %phrases;`
			`my @order;`
			`my %empty = ( #'phrase' => {},`
			`#'source' => {},`
			`#'dest' => {},`
			`#'voice' => {},`
			`'notes' => "",`
			`'new' => 0`
			`);`
			`my %thisphrase = %empty;`

			`open(FH, "<$filename") \|\| die ("Can't open $filename");`
			`my @lines = <FH>;`
			`close(FH);`

			`my $pos = 'lang';`
			`my $id = '';`
			`my @comments;`

			`foreach my $line (@lines) {`
			`$line = trim($line);`
updatelang: Fix false warnings about deprecated strings Change-Id: Ia208909ed42dc7f9b8bd7d22ca88f1a1e47d0576 2020-07-28 13:14:56 +00:00			`if($line =~ /^ *###/) {`
			`# Filter out warnings from prior runs`
			`next;`
			`} elsif($line =~ /^ *#/) {`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`push(@comments, "$line\n") if ($pos eq 'lang');`
			`# comments are ignored!`
			`next;`
			`} elsif ($pos eq 'phrase' && $line =~ /^([^:]+): ?(.*)$/) {`
			`$thisphrase{$pos}->{$1} = $2;`
			`if ($1 eq 'id') {`
			`push(@order, $2);`
			`$id = $2;`
			`}`
			`} elsif ($pos ne 'phrase' && $line =~ /^([^:]+): ?\"?([^\"]*)\"?$/) {`
			`my @targets = split(',', $1);`
lang: More automated rejiggering, USB_MODE_* is no longer ibasso-specific Change-Id: I8e7eb3bb3c5ed61572c0ade4059c3e3527558932 2020-11-22 14:43:39 +00:00			`my $w = $2;`

updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`foreach (@targets) {`
			`my $l = trim($_);`
languages: convert recording_swcodec -> recording Change-Id: I481a53284d63457717f4a6524edc5b477f29a20a 2020-11-19 14:51:23 +00:00			`# Convert some obsolete keys`
			`if ($l eq "swcodec") {`
			`$l = "*";`
			`} elsif ($l eq "lcd_bitmap") {`
			`$l = "*";`
			`} elsif ($l eq "recording_swcodec") {`
			`$l = "recording";`
lang: More automated rejiggering, USB_MODE_* is no longer ibasso-specific Change-Id: I8e7eb3bb3c5ed61572c0ade4059c3e3527558932 2020-11-22 14:43:39 +00:00			`# } elsif ($id =~ /USB_MODE/ && $l =~ /ibassodx/) {`
			`# $l = "*";`
languages: convert recording_swcodec -> recording Change-Id: I481a53284d63457717f4a6524edc5b477f29a20a 2020-11-19 14:51:23 +00:00			`}`
lang: Make all swcodec &\| lcd_bitmap strings default. Change-Id: Id0a3282884c3e258c5b2f24b35aa7e618a8e8bbe 2020-11-17 15:02:11 +00:00
lang: More automated rejiggering, USB_MODE_* is no longer ibasso-specific Change-Id: I8e7eb3bb3c5ed61572c0ade4059c3e3527558932 2020-11-22 14:43:39 +00:00			`$thisphrase{$pos}->{$l} = $w;`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`}`
			`}`
			`if ($line eq '</voice>' \|\|`
			`$line eq '</dest>' \|\|`
			`$line eq '</source>' \|\|`
			`$line eq '<phrase>') {`
			`$pos = 'phrase';`
			`} elsif ($line eq '</phrase>') {`
updatelang: Don't rely on non-core modules Change-Id: I262f47e10aee51116375238b458270e92e25154d 2020-07-27 19:18:21 +00:00			`my %copy = %thisphrase;`
			`$phrases{$id} = \%copy;`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`%thisphrase = %empty;`
			`$pos = 'lang';`
			`$id = '';`
			`} elsif ($line eq '<source>') {`
			`$pos = 'source';`
			`} elsif ($line eq '<dest>') {`
			`$pos = 'dest';`
			`} elsif ($line eq '<voice>') {`
			`$pos = 'voice';`
			`}`
			`}`
			`$phrases{'HEADER'} = \@comments;`
			`$phrases{'ORDER'} = \@order;`
			`return %phrases;`
			`}`

			`sub combinetgts {`
			`my (%tgtmap) = (@_);`
			`my %strmap;`
			`my %combined;`

			`# Reverse-map things`
			`foreach my $tgt (sort(keys(%tgtmap))) {`
			`next if ($tgt eq '*'); # Do not combine anything with fallback`
			`if (defined($strmap{$tgtmap{$tgt}})) {`
			`$strmap{$tgtmap{$tgt}} .= ",$tgt";`
			`} else {`
			`$strmap{$tgtmap{$tgt}} = "$tgt";`
			`}`
			`}`

			`# Copy over default/fallback as it was skipped`
			`$combined{''} = $tgtmap{''};`

			`foreach my $str (keys(%strmap)) {`
			`$combined{$strmap{$str}} = $str;`
			`}`

			`return %combined;`
			`}`

			`##################`

			`if($#ARGV != 2) {`
updatelang: Extract langstr ignore list into a separate file so it can be shared Change-Id: I4b77e1fe435e1f02df665f18e69b5c1db0a2e0b5 2020-07-28 15:11:30 +00:00			`print "Usage: updatelang <english.lang> <otherlang> <outfile\|->\n";`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`exit;`
			`}`

			`# Parse master file`
			`my %english = parselangfile($ARGV[0]);`
			`my @englishorder = @{$english{'ORDER'}};`

			`# Parse secondary file`
			`my %lang = parselangfile($ARGV[1]);`
			`my @langorder = @{$lang{'ORDER'}};`
			`my @langheader = @{$lang{'HEADER'}};`

			`# Clean up`
			`delete $english{'ORDER'};`
			`delete $english{'HEADER'};`
			`delete $lang{'ORDER'};`
			`delete $lang{'HEADER'};`

updatelang: more tweaks for master language and sub-languages Change-Id: I5af62b2f03bb4ee34518592e14c6ded3ccfea4e3 2020-07-28 04:12:23 +00:00			`# Extract language names`
			`my @tmp = split(/\./, basename($ARGV[0]));`
			`my $f1 = $tmp[0];`
			`@tmp = split(/\./, basename($ARGV[1]));`
			`my $f2 = $tmp[0];`
			`undef @tmp;`

updatelang: Extract langstr ignore list into a separate file so it can be shared Change-Id: I4b77e1fe435e1f02df665f18e69b5c1db0a2e0b5 2020-07-28 15:11:30 +00:00			`# Read in ignore list`
			`my $igname = dirname($0) . "/langignorelist.txt";`
			`open (FH, "<$igname") \|\| die ("Can't open $igname!");`
			`my @ignorelist = <FH>;`
			`close (FH);`
			`sub not_ignorelist {`
			`my ($key) = @_;`
			`foreach (@ignorelist) {`
updatelang: Fix the ignore list having issues with line endings. Change-Id: Ib4add14ff7415c42d0cc2ec11ec918ec02fac72d 2020-07-28 22:55:16 +00:00			`chomp;`
updatelang: Extract langstr ignore list into a separate file so it can be shared Change-Id: I4b77e1fe435e1f02df665f18e69b5c1db0a2e0b5 2020-07-28 15:11:30 +00:00			`if ($_ eq $key) {`
			`return 0;`
			`}`
			`}`
			`return 1;`
			`}`
			`undef $igname;`

updatelang: more tweaks for master language and sub-languages Change-Id: I5af62b2f03bb4ee34518592e14c6ded3ccfea4e3 2020-07-28 04:12:23 +00:00			`# Do we care about notes?`
			`my $printnotes = 1;`
			`my $ignoredups = 0;`

			`if ($f1 eq $f2) {`
			`# Ignore all notes for master language`
			`$printnotes = 0;`
			`}`

			`if (index($f2, $f1) > -1) {`
			`# Ignore duplicates for sub-languages`
			`$ignoredups = 1;`
			`}`

			`# work out the missing phrases`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`my %missing;`
			`my @missingorder;`

			`foreach (@englishorder) {`
			`$missing{$_} = 1;`
			`}`
			`foreach (@langorder) {`
			`if (!defined($english{$_})) {`
			`delete($lang{$_});`
			`# print "#!! '$_' no longer needed\n";`
			`next;`
			`}`
			`delete $missing{$_};`
			`}`
			`foreach (@englishorder) {`
			`push(@missingorder, $_) if defined($missing{$_});`
			`}`
			`# And add them to the phrase list.`
			`foreach (@missingorder) {`
			`# print "#!! '$_' missing\n";`
			`push(@langorder, $_);`
			`$lang{$_} = $english{$_};`
			`$lang{$_}{'notes'} .= "### This phrase is missing entirely, copying from english!\n";`
			`$lang{$_}{'new'} = 1;`
			`}`
			`undef @missingorder;`
			`undef %missing;`

			`# Sanity-check a few things`
			`foreach my $id (@langorder) {`
			`if (!defined($english{$id})) {`
			`next;`
			`}`
			`my %ep = %{$english{$id}{'phrase'}};`
			`my %lp = %{$lang{$id}{'phrase'}};`

updatelang: Fix false warnings about deprecated strings Change-Id: Ia208909ed42dc7f9b8bd7d22ca88f1a1e47d0576 2020-07-28 13:14:56 +00:00			`if ($lp{'desc'} ne $ep{'desc'} \|\| $ep{'desc'} eq 'deprecated') {`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`if ($ep{'desc'} eq 'deprecated') {`
			`# Nuke all deprecated targets; just copy from English`
			`# print "#!! '$id' deprecated, deleting\n";`
			`$lang{$id} = $english{$id};`
			`} else {`
			`$lang{$id}{'notes'} .= "### The 'desc' field for '$id' differs from the english!\n### the previously used desc is commented below:\n### desc: $lp{desc}\n";`
			`$lang{$id}{'phrase'}{'desc'} = $english{$id}{'phrase'}{'desc'};`
			`# print "#!! '$id' changed description\n";`
			`}`
			`}`

lang: Make all swcodec &\| lcd_bitmap strings default. Change-Id: Id0a3282884c3e258c5b2f24b35aa7e618a8e8bbe 2020-11-17 15:02:11 +00:00			`if (!defined($ep{'user'}) \|\| length($ep{'user'}) == 0) {`
			`$lp{'user'} = 'core';`
			`}`

updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`if (!defined($lp{'user'}) \|\| $lp{'user'} ne $ep{'user'}) {`
lang: Make all swcodec &\| lcd_bitmap strings default. Change-Id: Id0a3282884c3e258c5b2f24b35aa7e618a8e8bbe 2020-11-17 15:02:11 +00:00			`$lang{$id}{'notes'} .= "### The 'user' field for '$id' differs from the english!\n### the previously used desc is commented below:\n### desc: $lp{user}\n";`
			`if (!defined($lp{'user'}) \|\| length($lp{'user'}) == 0) {`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`$lp{'user'} = $ep{'user'};`
			`}`
			`$lang{$id}{'phrase'}{'user'} = $english{$id}{'phrase'}{'user'};`
			`# print "#!! '$id' changed user\n";`
			`}`
			`}`

			`# Check sources`
			`foreach my $id (@langorder) {`
			`if (!defined($english{$id})) {`
			`next;`
			`}`
			`my %ep = %{$english{$id}{'source'}};`
			`my %lp;`

			`if (defined($lang{$id}{'source'})) {`
			`%lp = %{$lang{$id}{'source'}};`
			`} else {`
			`%lp = ();`
			`}`

			`foreach my $tgt (keys(%lp)) {`
			`if (!defined($ep{$tgt})) {`
			`# Delete any targets that have been nuked in master`
			`delete($lang{$id}{'source'}{$tgt});`
			`}`
			`}`
			`foreach my $tgt (keys(%ep)) {`
			`if (!defined($lp{$tgt})) {`
			`# If it doesn't exist in the language, copy it from English`
updatelang: Fix a few straggling issues Change-Id: I549a33c94c339151cf5a74f13a8ecb73454bbfd4 2020-07-27 20:17:33 +00:00			`if ($ep{$tgt} ne 'none' && $ep{$tgt} ne '' ) {`
			`$lang{$id}{'notes'} .= "### The <source> section for '$id:$tgt' is missing! Copying from english!\n";`
			`# print "#!! '$id:$tgt' source missing\n";`
			`}`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`$lang{$id}{'source'}{$tgt} = $english{$id}{'source'}{$tgt};`
			`} elsif ($lp{$tgt} ne $ep{$tgt}) {`
			`# If the source string differs, complain, and copy from English`
			`$lang{$id}{'notes'} .= "### The <source> section for '$id:$tgt' differs from the english!\n";`
			`$lang{$id}{'notes'} .= "### the previously used one is commented below:\n";`
			`$lang{$id}{'notes'} .= "### $english{$id}{source}{$tgt}\n";`
			`# print "#!! '$id:$tgt' source changed ('$lp{$tgt}' vs '$ep{$tgt}')\n";`
			`$lang{$id}{'source'}{$tgt} = $english{$id}{'source'}{$tgt};`
			`}`
			`}`
			`}`

			`# Check dests`
			`foreach my $id (@langorder) {`
			`if (!defined($english{$id})) {`
			`next;`
			`}`
			`my %ep = %{$english{$id}{'dest'}};`
			`my %lp;`

			`if (defined($lang{$id}{'dest'})) {`
			`%lp = %{$lang{$id}{'dest'}};`
			`} else {`
			`%lp = ();`
			`}`

			`foreach my $tgt (keys(%lp)) {`
			`if (!defined($ep{$tgt})) {`
			`# Delete any targets that have been nuked in master`
			`delete($lang{$id}{'dest'}{$tgt});`
			`}`
			`}`
			`foreach my $tgt (keys(%ep)) {`
updatelang: Handle/flag the bad data that led to english-us breaking Change-Id: Ifffea9557d50ab5a103e13473ebe074ae1aa7b6d 2021-03-05 17:42:23 +00:00			`if (!defined($lp{$tgt}) \|\| ($lp{$tgt} eq 'none')) {`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`# If it doesn't exist in the language, copy it from English`
updatelang: Fix a few straggling issues Change-Id: I549a33c94c339151cf5a74f13a8ecb73454bbfd4 2020-07-27 20:17:33 +00:00			`if ($ep{$tgt} ne 'none' && $ep{$tgt} ne '' ) {`
updatelang: Fix a couple of typos in the output used by the translate site Change-Id: I13fe3e106c128dbc646906b5cb2c9702feb6bda2 2020-12-13 03:26:35 +00:00			`$lang{$id}{'notes'} .= "### The <dest> section for '$id:$tgt' is missing! Copying from english!\n";`
updatelang: Fix a few straggling issues Change-Id: I549a33c94c339151cf5a74f13a8ecb73454bbfd4 2020-07-27 20:17:33 +00:00			`# print "#!! '$id:$tgt' dest missing\n";`
			`}`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`$lang{$id}{'dest'}{$tgt} = $english{$id}{'dest'}{$tgt};`
			`} elsif ($lp{$tgt} ne $ep{$tgt}) {`
			`# If the source string differs, complain, and copy from English`
			`if ($lp{$tgt} eq '' && $ep{$tgt} ne '') {`
			`$lang{$id}{'notes'} .= "### The <dest> section for '$id:$tgt' is blank! Copying from english!\n";`
			`# print "#!! '$id:$tgt' dest is blank ('$lp{$tgt}' vs '$ep{$tgt}')\n";`
updatelang: Fix a few straggling issues Change-Id: I549a33c94c339151cf5a74f13a8ecb73454bbfd4 2020-07-27 20:17:33 +00:00			`$lang{$id}{'dest'}{$tgt} = $english{$id}{'dest'}{$tgt};`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`} elsif ($lp{$tgt} ne '' && $ep{$tgt} eq '') {`
			`# It should be kept blank!`
			`$lang{$id}{'notes'} .= "### The <dest> section for '$id:$tgt' is not blank!\n";`
			`$lang{$id}{'notes'} .= "### the previously used one is commented below:\n";`
			`$lang{$id}{'notes'} .= "### $english{$id}{dest}{$tgt}\n";`
			`# print "#!! '$id:$tgt' dest not blank ('$lp{$tgt}' vs '$ep{$tgt}')\n";`
updatelang: Fix a few straggling issues Change-Id: I549a33c94c339151cf5a74f13a8ecb73454bbfd4 2020-07-27 20:17:33 +00:00			`$lang{$id}{'dest'}{$tgt} = $english{$id}{'dest'}{$tgt};`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`}`
updatelang: more tweaks for master language and sub-languages Change-Id: I5af62b2f03bb4ee34518592e14c6ded3ccfea4e3 2020-07-28 04:12:23 +00:00			`} elsif ($lp{$tgt} ne 'none' && $lp{$tgt} ne '' && not_ignorelist($id) && !$lang{$id}{'new'} && !$ignoredups) {`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`$lang{$id}{'notes'} .= "### The <dest> section for '$id:$tgt' is identical to english!\n";`
			`# print "#!! '$id:$tgt' dest identical ('$lp{$tgt}')\n";`
			`}`
			`}`
			`}`

			`# Check voices`
			`foreach my $id (@langorder) {`
			`if (!defined($english{$id})) {`
			`next;`
			`}`
			`my %ep = %{$english{$id}{'voice'}};`
			`my %lp;`

			`if (defined($lang{$id}{'voice'})) {`
			`%lp = %{$lang{$id}{'voice'}};`
			`} else {`
			`%lp = ();`
			`}`

			`foreach my $tgt (keys(%lp)) {`
			`if (!defined($ep{$tgt})) {`
			`# Delete any targets that have been nuked in master`
			`delete($lang{$id}{'voice'}{$tgt});`
			`}`
			`}`
			`foreach my $tgt (keys(%ep)) {`
updatelang: Handle/flag the bad data that led to english-us breaking Change-Id: Ifffea9557d50ab5a103e13473ebe074ae1aa7b6d 2021-03-05 17:42:23 +00:00			`if (!defined($lp{$tgt}) \|\| ($lp{$tgt} eq 'none')) {`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`# If it doesn't exist in the language, copy it from English`
updatelang: Fix a few straggling issues Change-Id: I549a33c94c339151cf5a74f13a8ecb73454bbfd4 2020-07-27 20:17:33 +00:00			`if ($ep{$tgt} ne 'none' && $ep{$tgt} ne '' ) {`
updatelang: Fix a couple of typos in the output used by the translate site Change-Id: I13fe3e106c128dbc646906b5cb2c9702feb6bda2 2020-12-13 03:26:35 +00:00			`$lang{$id}{'notes'} .= "### The <voice> section for '$id:$tgt' is missing! Copying from english!\n";`
updatelang: Fix a few straggling issues Change-Id: I549a33c94c339151cf5a74f13a8ecb73454bbfd4 2020-07-27 20:17:33 +00:00			`# print "#!! '$id:$tgt' voice missing\n";`
			`}`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`$lang{$id}{'voice'}{$tgt} = $english{$id}{'voice'}{$tgt};`
			`} elsif ($lp{$tgt} ne $ep{$tgt}) {`
			`if ($lp{$tgt} eq '' && $ep{$tgt} ne '') {`
			`# If the lang voice string is blank, complain, and copy from English`
			`$lang{$id}{'notes'} .= "### The <voice> section for '$id:$tgt' is blank! Copying from english!\n";`
			`# print "#!! '$id:$tgt' voice is blank ('$lp{$tgt}' vs '$ep{$tgt}')\n";`
updatelang: Fix a few straggling issues Change-Id: I549a33c94c339151cf5a74f13a8ecb73454bbfd4 2020-07-27 20:17:33 +00:00			`$lang{$id}{'voice'}{$tgt} = $english{$id}{'voice'}{$tgt};`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`} elsif ($lp{$tgt} ne '' && $ep{$tgt} eq '') {`
talk: Add support for languages that swap the tens position in numbers For example, English would say "231" as "two hundred thirty one" but many other languages would say "two hundred one and thirty" So, if VOICE_NUMERIC_TENS_SWAP_SEPARATOR is not an empty string, swap the tens and ones position and use that string ("and" in the above example) as the voiced separator. Change-Id: I69f8064d44b3995827327cabae6ad352bf257d04 2021-09-21 23:16:23 +00:00			`if ($id ne 'VOICE_NUMERIC_TENS_SWAP_SEPARATOR') {`
			`# If it's not blank, clear it and complain!`
			`$lang{$id}{'notes'} .= "### The <voice> section for '$id:$tgt' is not blank!\n";`
			`$lang{$id}{'notes'} .= "### the previously used one is commented below:\n";`
			`$lang{$id}{'notes'} .= "### $english{$id}{voice}{$tgt}\n";`
			`# print "#!! '$id:$tgt' voice not blank ('$lp{$tgt}' vs '$ep{$tgt}')\n";`
			`$lang{$id}{'voice'}{$tgt} = $english{$id}{'voice'}{$tgt};`
			`}`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`}`
updatelang: more tweaks for master language and sub-languages Change-Id: I5af62b2f03bb4ee34518592e14c6ded3ccfea4e3 2020-07-28 04:12:23 +00:00			`} elsif ($lp{$tgt} ne 'none' && $lp{$tgt} ne '' && not_ignorelist($id) && !$lang{$id}{'new'} && !$ignoredups) {`
updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`$lang{$id}{'notes'} .= "### The <voice> section for '$id:$tgt' is identical to english!\n";`
			`# print "#!! '$id:$tgt' voice identical ('$lp{$tgt}')\n";`
			`}`
			`}`
			`}`

			`########## Write new language file`
			`my $fh;`
			`if ($ARGV[2] ne '-') {`
			`open(FH, ">$ARGV[2]") \|\| die ("Can't open $ARGV[2]");`
			`$fh = *FH;`
			`} else {`
			`$fh = *STDOUT;`
			`}`

			`foreach (@langheader) {`
			`print $fh $_;`
			`}`

			`my @finalorder = @langorder; # TODO make configurable vs @englishorder`
			`foreach my $id (@finalorder) {`
			`if (!defined($english{$id})) {`
			`next;`
			`}`
			`my %lp;`

			`# phrase`
			`%lp = %{$lang{$id}{'phrase'}};`
lang: Make all swcodec &\| lcd_bitmap strings default. Change-Id: Id0a3282884c3e258c5b2f24b35aa7e618a8e8bbe 2020-11-17 15:02:11 +00:00
			`# Drop all deprecated phrases?`
			`# next if ($lp{'desc'} eq 'deprecated');`

updatelang: New tool to update language files. Change-Id: I3c18bb34770b4b4b321199149a2ea693dfbdb7f4 2020-07-27 05:10:34 +00:00			`if (length($lang{$id}{'notes'}) && $printnotes) {`
			`print $fh "$lang{$id}{notes}";`
			`}`
			`print $fh "<phrase>\n";`
			`print $fh " id: $lp{id}\n";`
			`if ($lp{'desc'} ne '') {`
			`print $fh " desc: $lp{desc}\n";`
			`} else {`
			`print $fh " desc:\n";`
			`}`
			`print $fh " user: $lp{user}\n";`

			`# source`
			`%lp = combinetgts(%{$lang{$id}{'source'}});`
			`print $fh " <source>\n";`
			`foreach my $tgt (sort(keys(%lp))) {`
			`if ($lp{$tgt} eq 'none') {`
			`print $fh " $tgt: $lp{$tgt}\n";`
			`} else {`
			`print $fh " $tgt: \"$lp{$tgt}\"\n";`
			`}`
			`}`
			`print $fh " </source>\n";`

			`# dest`
			`%lp = combinetgts(%{$lang{$id}{'dest'}});`
			`print $fh " <dest>\n";`
			`foreach my $tgt (sort(keys(%lp))) {`
			`if ($lp{$tgt} eq 'none') {`
			`print $fh " $tgt: $lp{$tgt}\n";`
			`} else {`
			`print $fh " $tgt: \"$lp{$tgt}\"\n";`
			`}`
			`}`
			`print $fh " </dest>\n";`

			`# voice`
			`%lp = combinetgts(%{$lang{$id}{'voice'}});`
			`print $fh " <voice>\n";`
			`foreach my $tgt (sort(keys(%lp))) {`
			`if ($lp{$tgt} eq 'none') {`
			`print $fh " $tgt: $lp{$tgt}\n";`
			`} else {`
			`print $fh " $tgt: \"$lp{$tgt}\"\n";`
			`}`
			`}`
			`print $fh " </voice>\n";`

			`# FiN`
			`print $fh "</phrase>\n";`
			`}`

			`if ($ARGV[2] ne '-') {`
			`close(FH);`
			`}`