build: i18n-scan.pl: support extracting translations from menu json
authorJo-Philipp Wich <jo@mein.io>
Fri, 6 Dec 2019 13:54:45 +0000 (14:54 +0100)
committerJo-Philipp Wich <jo@mein.io>
Mon, 16 Dec 2019 17:07:17 +0000 (18:07 +0100)
Signed-off-by: Jo-Philipp Wich <jo@mein.io>
build/i18n-scan.pl

index c19a4386ce5652e09a9baec206bcc0bbb44d71cd..5ac1cb77d4986854051cb39b5adb51e83da4afcc 100755 (executable)
@@ -1,5 +1,6 @@
 #!/usr/bin/perl
 
+use utf8;
 use strict;
 use warnings;
 use Text::Balanced qw(extract_tagged gen_delimited_pat);
@@ -15,12 +16,49 @@ my %stringtable;
 sub dec_lua_str
 {
        my $s = shift;
-       $s =~ s/\\n/\n/g;
-       $s =~ s/\\t/\t/g;
-       $s =~ s/\\(.)/$1/sg;
+       my %rep = (
+               'a' => "\x07",
+               'b' => "\x08",
+               'f' => "\x0c",
+               'n' => "\n",
+               'r' => "\r",
+               't' => "\t",
+               'v' => "\x76"
+       );
+
+       $s =~ s!\\(?:([0-9]{1,2})|(.))!
+               $1 ? chr(int($1)) : ($rep{$2} || $2)
+       !segx;
+
+       $s =~ s/[\s\n]+/ /g;
+       $s =~ s/^ //;
+       $s =~ s/ $//;
+
+       return $s;
+}
+
+sub dec_json_str
+{
+       my $s = shift;
+       my %rep = (
+               '"' => '"',
+               '/' => '/',
+               'b' => "\x08",
+               'f' => "\x0c",
+               'n' => "\n",
+               'r' => "\r",
+               't' => "\t",
+               '\\' => '\\'
+       );
+
+       $s =~ s!\\([\\/"bfnrt]|u([0-9a-fA-F]{4}))!
+               $2 ? chr(hex($2)) : $rep{$1}
+       !egx;
+
        $s =~ s/[\s\n]+/ /g;
        $s =~ s/^ //;
        $s =~ s/ $//;
+
        return $s;
 }
 
@@ -43,6 +81,8 @@ if( open F, "find @ARGV -type f '(' -name '*.htm' -o -name '*.lua' -o -name '*.j
 
                if( open S, "< $file" )
                {
+                       binmode S, ':utf8';
+
                        local $/ = undef;
                        my $raw = <S>;
                        close S;
@@ -148,9 +188,84 @@ if( open F, "find @ARGV -type f '(' -name '*.htm' -o -name '*.lua' -o -name '*.j
        close F;
 }
 
+if( open F, "find @ARGV -type f -path '*/menu.d/*.json' | sort |" )
+{
+       while( defined( my $file = readline F ) )
+       {
+               chomp $file;
+
+               if( open S, "< $file" )
+               {
+                       binmode S, ':utf8';
+
+                       local $/ = undef;
+                       my $raw = <S>;
+                       close S;
+
+                       my $text = $raw;
+                       my $line = 1;
+
+                       while ($text =~ s/ ^ (.*?) "title" ([\n\s]*) : //sgx)
+                       {
+                               my ($prefix, $suffix) = ($1, $2);
+                               my $code;
+                               my $res = "";
+                               my $sub = "";
+
+                               $line += () = $prefix =~ /\n/g;
+
+                               my $position = "$file:$line";
+
+                               $line += () = $suffix =~ /\n/g;
+
+                               while (defined $sub)
+                               {
+                                       undef $sub;
+
+                                       if ($text =~ /^ ([\n\s]*) " /sx)
+                                       {
+                                               my $ws = $1;
+                                               my $re = gen_delimited_pat('"', '\\');
+
+                                               if ($text =~ m/\G\s*($re)/gcs)
+                                               {
+                                                       $sub = $1;
+                                                       $text = substr $text, pos $text;
+                                               }
+
+                                               $line += () = $ws =~ /\n/g;
+
+                                               if (defined($sub) && length($sub)) {
+                                                       $line += () = $sub =~ /\n/g;
+
+                                                       $sub =~ s/^"//;
+                                                       $sub =~ s/"$//;
+                                                       $res .= $sub;
+                                               }
+                                       }
+                               }
+
+                               if (defined($res))
+                               {
+                                       $res = dec_json_str($res);
+
+                                       if ($res) {
+                                               $stringtable{$res} ||= [ ];
+                                               push @{$stringtable{$res}}, $position;
+                                       }
+                               }
+                       }
+               }
+       }
+
+       close F;
+}
+
 
 if( open C, "| msgcat -" )
 {
+       binmode C, ':utf8';
+
        printf C "msgid \"\"\nmsgstr \"Content-Type: text/plain; charset=UTF-8\"\n\n";
 
        foreach my $key ( sort keys %stringtable )