summaryrefslogtreecommitdiffhomepage
diff options
context:
space:
mode:
authorJo-Philipp Wich <jow@openwrt.org>2009-11-01 00:48:15 +0000
committerJo-Philipp Wich <jow@openwrt.org>2009-11-01 00:48:15 +0000
commit58b3b2156fa807332a102e7145d18eec62c69f4b (patch)
treea6381afc6cffbb7da87a728a72e160b81f897203
parent202ac9d3632b3b6deecf3098374fe3e91c1e0aab (diff)
build: update i18n-scan.pl, now reliably finds template and Lua i18n tokens
-rwxr-xr-xbuild/i18n-scan.pl147
1 files changed, 72 insertions, 75 deletions
diff --git a/build/i18n-scan.pl b/build/i18n-scan.pl
index 03ab0292e..8523ced1a 100755
--- a/build/i18n-scan.pl
+++ b/build/i18n-scan.pl
@@ -2,54 +2,36 @@
use strict;
use warnings;
-use Text::Balanced qw(extract_codeblock);
+use Text::Balanced qw(extract_bracketed extract_delimited extract_tagged);
@ARGV == 1 || die "Usage: $0 <source direcory>\n";
-sub _parse
-{
- my ( $code ) = @_;
- my ( $k, $v );
-
- if( $code =~ s/^<%:-?\s*(.+)\s*%>/$1/s )
- {
- my ( $key, @text ) = split /[\n\s]+/, $code;
+my %stringtable;
- $k = $key;
- $v = join ' ', @text;
- }
- elsif( $code =~ s/^\(\s*(.+)\s*\)/$1/s )
- {
- if( $code =~ /^(?:"(\w+)"|'(\w+)')\s*,\s*(?:"(.+?)"|'(.+?)')/s )
- {
- $k = $1 || $2;
- $v = $3 || $4 || '';
- $v =~ s/\s+/ /sg;
- }
- elsif( $code =~ /^(?:"(\w+)"|'(\w+)')/ )
- {
- $k = $1 || $2;
- $v = '';
- }
- else
- {
- return ();
- }
- }
- else
- {
- return ();
- }
+sub dec_lua_str
+{
+ my $s = shift;
+ $s =~ s/\\n/\n/g;
+ $s =~ s/\\t/\n/g;
+ $s =~ s/\\(.)/$1/g;
+ $s =~ s/[\s\n]+/ /g;
+ $s =~ s/^ //;
+ $s =~ s/ $//;
+ return $s;
+}
- $v =~ s/\\"/"/g;
- $v =~ s/"/\\"/g;
-
- return ( $k, $v );
+sub dec_tpl_str
+{
+ my $s = shift;
+ $s =~ s/[\s\n]+/ /g;
+ $s =~ s/^ //;
+ $s =~ s/ $//;
+ return $s;
}
-if( open F, "find $ARGV[0] -type f -name '*.htm' -or -name '*.lua' |" )
+if( open F, "find $ARGV[0] -type f '(' -name '*.htm' -or -name '*.lua' ')' |" )
{
while( defined( my $file = readline F ) )
{
@@ -57,52 +39,67 @@ if( open F, "find $ARGV[0] -type f -name '*.htm' -or -name '*.lua' |" )
if( open S, "< $file" )
{
- my $text = '';
- $text .= $_ foreach( readline S );
-
- while(
- $text =~ s/
- ^ .*?
- (?:
- (?: translate f? | i18n )
- [\s\n]* ( \( )
- |
- ( \<%: -? )
- )
- /$1 || $2/segx
- ) {
- my $code;
-
- ( $code, $text ) = extract_codeblock( $text, '', '^', '()' );
- if( ! $code ) {
- ( $code, $text ) = extract_codeblock( $text, '', '^', '<>' );
- }
+ local $/ = undef;
+ my $raw = <S>;
+ close S;
- if( ! $code ) {
- # Corner case:
- $text =~ s/(#[^\n]*)%>/$1\n%>/;
- ( $code, $text ) = extract_codeblock( $text, '<>', '^' );
- if( ! $code ) {
- last;
- }
- }
- my ( $k, $v ) = _parse( $code );
- if( $k && defined($v) )
+ my $text = $raw;
+
+ while( $text =~ s/ ^ .*? (?:translate|translatef|i18n|_) [\n\s]* \( /(/sgx )
+ {
+ ( my $code, $text ) = extract_bracketed($text, q{('")});
+ $code =~ s/^\(//; $code =~ s/\)$//;
+
+ my $res = "";
+ my $sub = "";
+
+ while( defined $sub )
{
- if( $v )
+ ( $sub, $code ) = extract_delimited($code, q{'"}, q{\s*(?:\.\.\s*)?});
+
+ if( defined $sub )
{
- printf "#. %s\n", $v || $k;
+ $res .= substr $sub, 1, length($sub) - 2;
}
-
- printf "msgid \"%s\"\nmsgstr \"%s\"\n\n",
- $k, $v;
}
+
+ $res = dec_lua_str($res);
+ $stringtable{$res}++;
}
- close S;
+
+ $text = $raw;
+
+ while( $text =~ s/ ^ .*? <% [:_] -? /<%/sgx )
+ {
+ ( my $code, $text ) = extract_tagged($text, '<%', '%>');
+
+ if( defined $code )
+ {
+ $code = dec_tpl_str(substr $code, 2, length($code) - 4);
+ $stringtable{$code}++;
+ }
+ }
}
}
close F;
}
+
+
+if( open C, "| msgcat -" )
+{
+ printf C "msgid \"\"\nmsgstr \"Content-Type: text/plain; charset=UTF-8\"\n\n";
+
+ foreach my $key ( sort keys %stringtable )
+ {
+ if( length $key )
+ {
+ $key =~ s/"/\\"/g;
+ printf C "msgid \"%s\"\nmsgstr \"\"\n\n", $key;
+ }
+ }
+
+ close C;
+}