luci/build/i18n-scan.pl

289 lines
4.8 KiB
Perl
Raw Normal View History

#!/usr/bin/perl
use utf8;
use strict;
use warnings;
use Text::Balanced qw(extract_tagged gen_delimited_pat);
use POSIX;
POSIX::setlocale(POSIX::LC_ALL, "C");
@ARGV >= 1 || die "Usage: $0 <source directory>\n";
my %stringtable;
sub dec_lua_str
{
my $s = shift;
my %rep = (
'a' => "\x07",
'b' => "\x08",
'f' => "\x0c",
'n' => "\n",
'r' => "\r",
't' => "\t",
'v' => "\x76"
);
$s =~ s!\\(?:([0-9]{1,2})|(.))!
$1 ? chr(int($1)) : ($rep{$2} || $2)
!segx;
$s =~ s/[\s\n]+/ /g;
$s =~ s/^ //;
$s =~ s/ $//;
return $s;
}
sub dec_json_str
{
my $s = shift;
my %rep = (
'"' => '"',
'/' => '/',
'b' => "\x08",
'f' => "\x0c",
'n' => "\n",
'r' => "\r",
't' => "\t",
'\\' => '\\'
);
$s =~ s!\\([\\/"bfnrt]|u([0-9a-fA-F]{4}))!
$2 ? chr(hex($2)) : $rep{$1}
!egx;
$s =~ s/[\s\n]+/ /g;
$s =~ s/^ //;
$s =~ s/ $//;
return $s;
}
sub dec_tpl_str
{
my $s = shift;
$s =~ s/-$//;
$s =~ s/[\s\n]+/ /g;
$s =~ s/^ //;
$s =~ s/ $//;
$s =~ s/\\/\\\\/g;
return $s;
}
if( open F, "find @ARGV -type f '(' -name '*.htm' -o -name '*.lua' -o -name '*.js' ')' | sort |" )
{
while( defined( my $file = readline F ) )
{
chomp $file;
if( open S, "< $file" )
{
binmode S, ':utf8';
local $/ = undef;
my $raw = <S>;
close S;
my $text = $raw;
my $line = 1;
while ($text =~ s/ ^ (.*?) (?:translate|translatef|i18n|_) ([\n\s]*) \( //sgx)
{
my ($prefix, $suffix) = ($1, $2);
my $code;
my $res = "";
my $sub = "";
$line += () = $prefix =~ /\n/g;
my $position = "$file:$line";
$line += () = $suffix =~ /\n/g;
while (defined $sub)
{
undef $sub;
if ($text =~ /^ ([\n\s]*(?:\.\.[\n\s]*)?) (\[=*\[) /sx)
{
my $ws = $1;
my $stag = quotemeta $2;
(my $etag = $stag) =~ y/[/]/;
($sub, $text) = extract_tagged($text, $stag, $etag, q{\s*(?:\.\.\s*)?});
$line += () = $ws =~ /\n/g;
if (defined($sub) && length($sub)) {
$line += () = $sub =~ /\n/g;
$sub =~ s/^$stag//;
$sub =~ s/$etag$//;
$res .= $sub;
}
}
elsif ($text =~ /^ ([\n\s]*(?:\.\.[\n\s]*)?) (['"]) /sx)
{
my $ws = $1;
my $quote = $2;
my $re = gen_delimited_pat($quote, '\\');
if ($text =~ m/\G\s*(?:\.\.\s*)?($re)/gcs)
2012-04-03 00:35:54 +00:00
{
$sub = $1;
$text = substr $text, pos $text;
2012-04-03 00:35:54 +00:00
}
$line += () = $ws =~ /\n/g;
if (defined($sub) && length($sub)) {
$line += () = $sub =~ /\n/g;
$sub =~ s/^$quote//;
$sub =~ s/$quote$//;
$res .= $sub;
}
}
}
if (defined($res))
{
$res = dec_lua_str($res);
if ($res) {
$stringtable{$res} ||= [ ];
push @{$stringtable{$res}}, $position;
}
}
}
$text = $raw;
$line = 1;
while( $text =~ s/ ^ (.*?) <% -? [:_] /<%/sgx )
{
$line += () = $1 =~ /\n/g;
( my $code, $text ) = extract_tagged($text, '<%', '%>');
if( defined $code )
{
my $position = "$file:$line";
$line += () = $code =~ /\n/g;
$code = dec_tpl_str(substr $code, 2, length($code) - 4);
$stringtable{$code} ||= [];
push @{$stringtable{$code}}, $position;
}
}
}
}
close F;
}
if( open F, "find @ARGV -type f -path '*/menu.d/*.json' | sort |" )
{
while( defined( my $file = readline F ) )
{
chomp $file;
if( open S, "< $file" )
{
binmode S, ':utf8';
local $/ = undef;
my $raw = <S>;
close S;
my $text = $raw;
my $line = 1;
while ($text =~ s/ ^ (.*?) "title" ([\n\s]*) : //sgx)
{
my ($prefix, $suffix) = ($1, $2);
my $code;
my $res = "";
my $sub = "";
$line += () = $prefix =~ /\n/g;
my $position = "$file:$line";
$line += () = $suffix =~ /\n/g;
while (defined $sub)
{
undef $sub;
if ($text =~ /^ ([\n\s]*) " /sx)
{
my $ws = $1;
my $re = gen_delimited_pat('"', '\\');
if ($text =~ m/\G\s*($re)/gcs)
{
$sub = $1;
$text = substr $text, pos $text;
}
$line += () = $ws =~ /\n/g;
if (defined($sub) && length($sub)) {
$line += () = $sub =~ /\n/g;
$sub =~ s/^"//;
$sub =~ s/"$//;
$res .= $sub;
}
}
}
if (defined($res))
{
$res = dec_json_str($res);
if ($res) {
$stringtable{$res} ||= [ ];
push @{$stringtable{$res}}, $position;
}
}
}
}
}
close F;
}
if( open C, "| msgcat -" )
{
binmode C, ':utf8';
printf C "msgid \"\"\nmsgstr \"Content-Type: text/plain; charset=UTF-8\"\n\n";
foreach my $key ( sort keys %stringtable )
{
if( length $key )
{
my @positions = @{$stringtable{$key}};
$key =~ s/\\/\\\\/g;
$key =~ s/\n/\\n/g;
$key =~ s/\t/\\t/g;
$key =~ s/"/\\"/g;
printf C "#: %s\nmsgid \"%s\"\nmsgstr \"\"\n\n",
join(' ', @positions), $key;
}
}
close C;
}