1243545ac5134b2ef371257264e904b92ef6c411
[project/luci.git] / build / i18n-scan.pl
1 #!/usr/bin/perl
2
3 use strict;
4 use warnings;
5 use Text::Balanced qw(extract_bracketed extract_delimited extract_tagged);
6
7 @ARGV >= 1 || die "Usage: $0 <source direcory>\n";
8
9
10 my %stringtable;
11
12 sub dec_lua_str
13 {
14         my $s = shift;
15         $s =~ s/[\s\n]+/ /g;
16         $s =~ s/\\n/\n/g;
17         $s =~ s/\\t/\t/g;
18         $s =~ s/\\(.)/$1/g;
19         $s =~ s/^ //;
20         $s =~ s/ $//;
21         return $s;
22 }
23
24 sub dec_tpl_str
25 {
26         my $s = shift;
27         $s =~ s/-$//;
28         $s =~ s/[\s\n]+/ /g;
29         $s =~ s/^ //;
30         $s =~ s/ $//;
31         return $s;
32 }
33
34
35 if( open F, "find @ARGV -type f '(' -name '*.htm' -o -name '*.lua' ')' |" )
36 {
37         while( defined( my $file = readline F ) )
38         {
39                 chomp $file;
40
41                 if( open S, "< $file" )
42                 {
43                         local $/ = undef;
44                         my $raw = <S>;
45                         close S;
46
47
48                         my $text = $raw;
49
50                         while( $text =~ s/ ^ .*? (?:translate|translatef|i18n|_) [\n\s]* \( /(/sgx )
51                         {
52                                 ( my $code, $text ) = extract_bracketed($text, q{('")});
53
54                                 $code =~ s/\\\n/ /g;
55                                 $code =~ s/^\([\n\s]*//;
56                                 $code =~ s/[\n\s]*\)$//;
57
58                                 my $res = "";
59                                 my $sub = "";
60
61                                 if( $code =~ /^['"]/ )
62                                 {
63                                         while( defined $sub && length($sub) > 0 )
64                                         {
65                                                 ( $sub, $code ) = extract_delimited($code, q{'"}, q{\s*(?:\.\.\s*)?});
66
67                                                 if( defined $sub && length($sub) > 2 )
68                                                 {
69                                                         $res .= substr $sub, 1, length($sub) - 2;
70                                                 }
71                                         }
72                                 }
73                                 elsif( $code =~ /^(\[=*\[)/ )
74                                 {
75                                         my $stag = quotemeta $1;
76                                         my $etag = $stag;
77                                            $etag =~ s/\[/]/g;
78
79                                         ( $res ) = extract_tagged($code, $stag, $etag);
80
81                                         $res =~ s/^$stag//;
82                                         $res =~ s/$etag$//;
83                                 }
84
85                                 $res = dec_lua_str($res);
86                                 $stringtable{$res}++ if $res;
87                         }
88
89
90                         $text = $raw;
91
92                         while( $text =~ s/ ^ .*? <% -? [:_] /<%/sgx )
93                         {
94                                 ( my $code, $text ) = extract_tagged($text, '<%', '%>');
95
96                                 if( defined $code )
97                                 {
98                                         $code = dec_tpl_str(substr $code, 2, length($code) - 4);
99                                         $stringtable{$code}++;
100                                 }
101                         }
102                 }
103         }
104
105         close F;
106 }
107
108
109 if( open C, "| msgcat -" )
110 {
111         printf C "msgid \"\"\nmsgstr \"Content-Type: text/plain; charset=UTF-8\"\n\n";
112
113         foreach my $key ( sort keys %stringtable )
114         {
115                 if( length $key )
116                 {
117                         $key =~ s/"/\\"/g;
118                         printf C "msgid \"%s\"\nmsgstr \"\"\n\n", $key;
119                 }
120         }
121
122         close C;
123 }