diff options
author | Jo-Philipp Wich <jow@openwrt.org> | 2009-05-17 19:39:32 +0000 |
---|---|---|
committer | Jo-Philipp Wich <jow@openwrt.org> | 2009-05-17 19:39:32 +0000 |
commit | 5193631c04142200494761440eda67514c11d649 (patch) | |
tree | d9ec89a649a4bd35313992243d0556cbac60095b /build/i18n-scan.pl | |
parent | 62fade570951964115136f2cd47487633cd529be (diff) |
build: add script to extract i18n tags from sources and generate *.po snippets
Diffstat (limited to 'build/i18n-scan.pl')
-rwxr-xr-x | build/i18n-scan.pl | 114 |
1 files changed, 114 insertions, 0 deletions
diff --git a/build/i18n-scan.pl b/build/i18n-scan.pl new file mode 100755 index 000000000..102ae5f7a --- /dev/null +++ b/build/i18n-scan.pl @@ -0,0 +1,114 @@ +#!/usr/bin/perl + +use strict; +use warnings; +use Text::Balanced qw(extract_codeblock); + +@ARGV == 1 || die "Usage: $0 <source direcory>\n"; + + +sub _parse +{ + my ( $code ) = @_; + my ( $k, $v ); + + if( $code =~ s/^<%:-?\s*(.+)\s*%>/$1/s ) + { + my ( $key, @text ) = split /[\n\s]+/, $code; + + $k = $key; + $v = join ' ', @text; + } + elsif( $code =~ s/^\(\s*(.+)\s*\)/$1/s ) + { + if( $code =~ /^(?:"(\w+)"|'(\w+)')\s*,\s*(?:"(.+?)"|'(.+?)')/s ) + { + $k = $1 || $2; + $v = $3 || $4 || ''; + $v =~ s/\s+/ /sg; + } + elsif( $code =~ /^(?:"(\w+)"|'(\w+)')/ ) + { + $k = $1 || $2; + $v = ''; + } + else + { + return (); + } + } + else + { + return (); + } + + $v =~ s/\\"/"/g; + $v =~ s/"/\\"/g; + + return ( $k, $v ); +} + + +if( open F, "find $ARGV[0] -type f -name '*.htm' -or -name '*.lua' |" ) +{ + while( defined( my $file = readline F ) ) + { + chomp $file; + + if( open S, "< $file" ) + { + my $text = ''; + $text .= $_ foreach( readline S ); + + while( + $text =~ s/ + ^ .*? + (?: + (?: translate f? | i18n ) + [\s\n]* ( \( ) + | + ( \<%: -? ) + ) + /$1 || $2/segx + ) { + #$text =~ s/^ .*? (?: (?: translate f? | i18n ) [\s\n]* ( \( ) | ( <%: -? ) ) / $1 || $2 /sex; + #warn "T[$text]"; + my $code; + + reparse: + ( $code, $text ) = extract_codeblock( $text, '', '^', '()' ); + if( ! $code ) { + ( $code, $text ) = extract_codeblock( $text, '', '^', '<>' ); + } + + if( ! $code ) { + # Corner case: + $text =~ s/(#[^\n]*)%>/$1\n%>/; + ( $code, $text ) = extract_codeblock( $text, '<>', '^' ); + if( ! $code ) { + last; + } + } + + my ( $k, $v ) = _parse( $code ); + #warn "M[$code]"; + #last; + + if( $k && defined($v) ) + { + if( $v ) + { + printf "#. %s\n", $v || $k; + } + + printf "msgid \"%s\"\nmsgstr \"%s\"\n\n", + $k, $v; + } + } + + close S; + } + } + + close F; +} |