3 # -n do not include custom_ scripts
4 # -v verbose mode, shows progress information
6 # this version of locales.pl processes not only all required .pl files
7 # but also all template files referenced via parse_html_template.
15 use File::Slurp qw(slurp);
19 use List::Util qw(first);
23 $OUTPUT_AUTOFLUSH = 1;
32 my $basedir = "../..";
33 my $locales_dir = ".";
34 my $bindir = "$basedir/bin/mozilla";
35 my @progdirs = ( "$basedir/SL" );
36 my $dbupdir = "$basedir/sql/Pg-upgrade";
37 my $dbupdir2 = "$basedir/sql/Pg-upgrade2";
38 my $menufile = "menu.ini";
39 my $submitsearch = qr/type\s*=\s*[\"\']?submit/i;
44 my (%referenced_html_files, %locale, %htmllocale, %alllocales, %cached, %submit);
45 my ($ALL_HEADER, $MISSING_HEADER, $LOST_HEADER);
50 my ($top_dir_name) = @_;
57 tie my %dir_h, 'IO::Dir', $dir_name;
59 push @files, grep { -f } map { "${dir_name}/${_}" } keys %dir_h;
60 my @sub_dirs = grep { -d } map { "${dir_name}/${_}" } grep { ! m/^\.\.?$/ } keys %dir_h;
62 $finder->($_) for @sub_dirs;
65 $finder->($top_dir_name);
71 # overwrite existing entries with the ones from 'missing'
72 $self->{texts}->{$_} = $missing->{$_} for grep { $missing->{$_} } keys %alllocales;
74 # try to set missing entries from lost ones
75 my %lost_by_text = map { ($_->{text} => $_->{translation}) } @lost;
76 $self->{texts}->{$_} = $lost_by_text{$_} for grep { !$self->{texts}{$_} } keys %alllocales;
79 my @bindir_files = find_files($bindir);
80 my @progfiles = map { m:^(.+)/([^/]+)$:; [ $2, $1 ] } grep { /\.pl$/ && !/_custom/ } @bindir_files;
81 my @customfiles = grep /_custom/, @bindir_files;
83 push @progfiles, map { m:^(.+)/([^/]+)$:; [ $2, $1 ] } grep { /\.pm$/ } map { find_files($_) } @progdirs;
85 # put customized files into @customfiles
86 my (@menufiles, %dir_h);
90 @menufiles = ($menufile);
92 tie %dir_h, 'IO::Dir', $basedir;
93 @menufiles = map { "$basedir/$_" } grep { /.*?_$menufile$/ } keys %dir_h;
94 unshift @menufiles, "$basedir/$menufile";
97 tie %dir_h, 'IO::Dir', $dbupdir;
98 my @dbplfiles = grep { /\.pl$/ } keys %dir_h;
100 tie %dir_h, 'IO::Dir', $dbupdir2;
101 my @dbplfiles2 = grep { /\.pl$/ } keys %dir_h;
103 # slurp the translations in
104 if (-f "$locales_dir/all") {
105 require "$locales_dir/all";
107 if (-f "$locales_dir/missing") {
108 require "$locales_dir/missing" ;
109 unlink "$locales_dir/missing";
111 if (-f "$locales_dir/lost") {
112 require "$locales_dir/lost";
113 unlink "$locales_dir/lost";
116 my $charset = slurp("$locales_dir/charset") || 'utf-8';
119 my %old_texts = %{ $self->{texts} || {} };
121 handle_file(@{ $_ }) for @progfiles;
122 handle_file($_, $dbupdir) for @dbplfiles;
123 handle_file($_, $dbupdir2) for @dbplfiles2;
124 scanmenu($_) for @menufiles;
126 # merge entries to translate with entries from files 'missing' and 'lost'
131 file => "$locales_dir/all",
132 header => $ALL_HEADER,
133 data_name => '$self->{texts}',
134 data_sub => sub { _print_line($_, $self->{texts}{$_}, @_) for sort keys %alllocales },
137 foreach my $text (keys %$missing) {
138 if ($locale{$text} || $htmllocale{$text}) {
139 unless ($self->{texts}{$text}) {
140 $self->{texts}{$text} = $missing->{$text};
146 # calc and generate missing
147 my @new_missing = grep { !$self->{texts}{$_} } sort keys %alllocales;
151 file => "$locales_dir/missing",
152 header => $MISSING_HEADER,
153 data_name => '$missing',
154 data_sub => sub { _print_line($_, '', @_) for @new_missing },
158 # calc and generate lost
159 while (my ($text, $translation) = each %old_texts) {
160 next if ($alllocales{$text});
161 push @lost, { 'text' => $text, 'translation' => $translation };
165 splice @lost, 0, (scalar @lost - 50) if (scalar @lost > 50);
167 file => "$locales_dir/lost",
168 header => $LOST_HEADER,
170 data_name => '@lost',
172 _print_line($_->{text}, $_->{translation}, @_, template => " { 'text' => %s, 'translation' => %s },\n") for @lost;
177 my $trlanguage = slurp("$locales_dir/LANGUAGE");
180 search_unused_htmlfiles() if $opt_c;
182 my $count = scalar keys %alllocales;
183 my $notext = scalar @new_missing;
184 my $per = sprintf("%.1f", ($count - $notext) / $count * 100);
185 print "\n$trlanguage - ${per}%";
186 print " - $notext/$count missing" if $notext;
195 # These are all the texts to build the translations files.
196 # The file has the form of 'english text' => 'foreign text',
197 # you can add the translation in this file or in the 'missing' file
198 # run locales.pl from this directory to rebuild the translation files
200 $MISSING_HEADER = <<EOL;
201 # add the missing texts and run locales.pl to rebuild
203 $LOST_HEADER = <<EOL;
204 # The last 50 text strings, that have been removed.
205 # This file has been auto-generated by locales.pl. Please don't edit!
213 'no-custom-files' => \$opt_n,
214 'check-files' => \$opt_c,
215 'verbose' => \$opt_v,
227 pod2usage(-exitstatus => 0, -verbose => 2);
232 my $arg = shift @ARGV;
234 foreach my $dir ("../locale/$arg", "locale/$arg", "../$arg", $arg) {
235 next unless -d $dir && -f "$dir/all" && -f "$dir/LANGUAGE";
241 print "The locale directory '$arg' could not be found.\n";
245 } elsif (!-f 'all' || !-f 'LANGUAGE') {
246 print "locales.pl was not called from a locale/* subdirectory,\n"
247 . "and no locale directory name was given.\n";
253 my ($file, $dir) = @_;
254 print "\n$file" if $opt_v;
258 &scanfile("$dir/$file");
260 # scan custom_{module}.pl or {login}_{module}.pl files
261 foreach my $customfile (@customfiles) {
262 if ($customfile =~ /_$file/) {
263 if (-f "$dir/$customfile") {
264 &scanfile("$dir/$customfile");
272 sub extract_text_between_parenthesis {
273 my ($fh, $line) = @_;
274 my ($inside_string, $pos, $text, $quote_next) = (undef, 0, "", 0);
277 if (length($line) <= $pos) {
279 return ($text, "") unless ($line);
283 my $cur_char = substr($line, $pos, 1);
285 if (!$inside_string) {
286 if ((length($line) >= ($pos + 3)) && (substr($line, $pos, 2)) eq "qq") {
287 $inside_string = substr($line, $pos + 2, 1);
290 } elsif ((length($line) >= ($pos + 2)) &&
291 (substr($line, $pos, 1) eq "q")) {
292 $inside_string = substr($line, $pos + 1, 1);
295 } elsif (($cur_char eq '"') || ($cur_char eq '\'')) {
296 $inside_string = $cur_char;
298 } elsif (($cur_char eq ")") || ($cur_char eq ',')) {
299 return ($text, substr($line, $pos + 1));
304 $text .= '\\' unless $cur_char eq "'";
308 } elsif ($cur_char eq '\\') {
311 } elsif ($cur_char eq $inside_string) {
312 undef($inside_string);
325 my $dont_include_subs = shift;
326 my $scanned_files = shift;
331 $scanned_files = {} unless ($scanned_files);
332 return if ($scanned_files->{$file});
333 $scanned_files->{$file} = 1;
335 if (!defined $cached{$file}) {
337 return unless (-f "$file");
339 my $fh = new FileHandle;
340 open $fh, "$file" or die "$! : $file";
342 my ($is_submit, $line_no, $sub_line_no) = (0, 0, 0);
345 last if /^\s*__END__/;
349 # is this another file
350 if (/require\s+\W.*\.pl/) {
352 $newfile =~ s/require\s+\W//;
353 $newfile =~ s|bin/mozilla||;
354 $cached{$file}{scan}{"$bindir/$newfile"} = 1;
355 } elsif (/use\s+SL::([\w:]*)/) {
358 $cached{$file}{scannosubs}{"../../SL/${module}.pm"} = 1;
361 # Some calls to render() are split over multiple lines. Deal
363 while (/(?:parse_html_template2?|render)\s*\( *$/) {
368 # is this a template call?
369 if (/(?:parse_html_template2?|render)\s*\(\s*[\"\']([\w\/]+)\s*[\"\']/) {
370 my $new_file_base = "$basedir/templates/webpages/$1.";
371 if (/parse_html_template2/) {
372 print "E: " . strip_base($file) . " is still using 'parse_html_template2' for " . strip_base("${new_file_base}html") . ".\n";
376 foreach my $ext (qw(html js json)) {
377 my $new_file = "${new_file_base}${ext}";
379 $cached{$file}{scanh}{$new_file} = 1;
385 if ($opt_c && !$found_one) {
386 print "W: missing HTML template: " . strip_base($new_file_base) . "{html,json,js} (referenced from " . strip_base($file) . ")\n";
395 my ($null, $country) = split /,/;
396 $country =~ s/^ +[\"\']//;
397 $country =~ s/[\"\'].*//;
403 # is it a submit button before $locale->
404 if (/$submitsearch/) {
406 if ($` !~ /locale->text/) {
408 $sub_line_no = $line_no;
412 my ($found) = / (?: locale->text | \b t8 ) \b .*? \(/x;
417 ($string, $_) = extract_text_between_parenthesis($fh, $postmatch);
420 # if there is no $ in the string record it
421 unless (($string =~ /\$\D.*/) || ("" eq $string)) {
423 # this guarantees one instance of string
424 $cached{$file}{locale}{$string} = 1;
426 # this one is for all the locales
427 $cached{$file}{all}{$string} = 1;
429 # is it a submit button before $locale->
431 $cached{$file}{submit}{$string} = 1;
434 } elsif ($postmatch =~ />/) {
438 # exit loop if there are no more locales on this line
439 ($rc) = ($postmatch =~ /locale->text | \b t8/x);
441 if ( ($postmatch =~ />/)
442 || (!$found && ($sub_line_no != $line_no) && />/)) {
452 $alllocales{$_} = 1 for keys %{$cached{$file}{all}};
453 $locale{$_} = 1 for keys %{$cached{$file}{locale}};
454 $submit{$_} = 1 for keys %{$cached{$file}{submit}};
456 scanfile($_, 0, $scanned_files) for keys %{$cached{$file}{scan}};
457 scanfile($_, 1, $scanned_files) for keys %{$cached{$file}{scannosubs}};
458 scanhtmlfile($_) for keys %{$cached{$file}{scanh}};
460 $referenced_html_files{$_} = 1 for keys %{$cached{$file}{scanh}};
466 my $fh = new FileHandle;
467 open $fh, "$file" or die "$! : $file";
469 my @a = grep m/^\[/, <$fh>;
473 grep { s/(\[|\])//g } @a;
475 foreach my $item (@a) {
476 my @b = split /--/, $item;
477 foreach my $string (@b) {
479 $locale{$string} = 1;
480 $alllocales{$string} = 1;
486 sub unescape_template_string {
497 if (!defined $cached{$file}) {
498 my %plugins = ( 'loaded' => { }, 'needed' => { } );
500 open(IN, $file) || die $file;
505 while (my $line = <IN>) {
508 while ($line =~ m/\[\%[^\w]*use[^\w]+(\w+)[^\w]*?\%\]/gi) {
509 $plugins{loaded}->{$1} = 1;
512 while ($line =~ m/\[\%[^\w]*(\w+)\.\w+\(/g) {
514 $plugins{needed}->{$plugin} = 1 if (first { $_ eq $plugin } qw(HTML LxERP JavaScript MultiColumnIterator JSON L P));
517 $plugins{needed}->{T8} = 1 if $line =~ m/\[\%.*\|.*\$T8/;
519 while ($line =~ m/(?: # Start von Variante 1: LxERP.t8('...'); ohne darumliegende [% ... %]-Tags
520 (LxERP\.t8)\( # LxERP.t8( ::Parameter $1::
521 ([\'\"]) # Anfang des zu übersetzenden Strings ::Parameter $2::
522 (.*?) # Der zu übersetzende String ::Parameter $3::
523 (?<!\\)\2 # Ende des zu übersetzenden Strings
524 | # Start von Variante 2: [% '...' | $T8 %]
525 \[\% # Template-Start-Tag
526 [\-~#]? # Whitespace-Unterdrückung
527 \s* # Optional beliebig viele Whitespace
528 ([\'\"]) # Anfang des zu übersetzenden Strings ::Parameter $4::
529 (.*?) # Der zu übersetzende String ::Parameter $5::
530 (?<!\\)\4 # Ende des zu übersetzenden Strings
531 \s*\|\s* # Pipe-Zeichen mit optionalen Whitespace davor und danach
532 (\$T8) # Filteraufruf ::Parameter $6::
533 .*? # Optionale Argumente für den Filter
535 [\-~#]? # Whitespace-Unterdrückung
536 \%\] # Template-Ende-Tag
539 my $module = $1 || $6;
540 my $string = $3 || $5;
541 print "Found filter >>>$string<<<\n" if $debug;
542 substr $line, $LAST_MATCH_START[1], $LAST_MATCH_END[0] - $LAST_MATCH_START[0], '';
544 $string = unescape_template_string($string);
545 $cached{$file}{all}{$string} = 1;
546 $cached{$file}{html}{$string} = 1;
547 $cached{$file}{submit}{$string} = 1 if $PREMATCH =~ /$submitsearch/;
548 $plugins{needed}->{T8} = 1 if $module eq '$T8';
549 $plugins{needed}->{LxERP} = 1 if $module eq 'LxERP.t8';
552 while ($line =~ m/\[\% # Template-Start-Tag
553 [\-~#]? # Whitespace-Unterdrückung
554 \s* # Optional beliebig viele Whitespace
555 (?: # Die erkannten Template-Direktiven
560 \s+ # Mindestens ein Whitespace
561 [\'\"]? # Anfang des Dateinamens
562 ([^\s]+) # Beliebig viele Nicht-Whitespaces -- Dateiname
563 \.html # Endung ".html", ansonsten kann es der Name eines Blocks sein
565 my $new_file_name = "$basedir/templates/webpages/$1.html";
566 $cached{$file}{scanh}{$new_file_name} = 1;
567 substr $line, $LAST_MATCH_START[1], $LAST_MATCH_END[0] - $LAST_MATCH_START[0], '';
573 foreach my $plugin (keys %{ $plugins{needed} }) {
574 next if ($plugins{loaded}->{$plugin});
575 print "E: " . strip_base($file) . " requires the Template plugin '$plugin', but is not loaded with '[\% USE $plugin \%]'.\n";
579 # copy back into global arrays
580 $alllocales{$_} = 1 for keys %{$cached{$file}{all}};
581 $locale{$_} = 1 for keys %{$cached{$file}{html}};
582 $submit{$_} = 1 for keys %{$cached{$file}{submit}};
584 scanhtmlfile($_) for keys %{$cached{$file}{scanh}};
586 $referenced_html_files{$_} = 1 for keys %{$cached{$file}{scanh}};
589 sub search_unused_htmlfiles {
590 my @unscanned_dirs = ('../../templates/webpages');
592 while (scalar @unscanned_dirs) {
593 my $dir = shift @unscanned_dirs;
595 foreach my $entry (<$dir/*>) {
597 push @unscanned_dirs, $entry;
599 } elsif (($entry =~ /_master.html$/) && -f $entry && !$referenced_html_files{$entry}) {
600 print "W: unused HTML template: " . strip_base($entry) . "\n";
608 my $s = "$_[0]"; # Create a copy of the string.
611 $s =~ s|templates/webpages/||;
618 $val =~ s/(\'|\\$)/\\$1/g;
619 return "'" . $val . "'";
623 my $key = _single_quote(shift);
624 my $text = _single_quote(shift);
626 my $template = $params{template} || qq| %-29s => %s,\n|;
627 my $fh = $params{fh} || croak 'need filehandle in _print_line';
629 print $fh sprintf $template, $key, $text;
635 my $file = $params{file} || croak 'need filename in generate_file';
636 my $header = $params{header};
637 my $lines = $params{data_sub};
638 my $data_name = $params{data_name};
639 my @delim = split //, ($params{delim} || '{}');
641 open my $fh, '>:encoding(utf8)', $file or die "$! : $file";
643 $charset =~ s/\r?\n//g;
644 my $emacs_charset = lc $charset;
646 print $fh "#!/usr/bin/perl\n# -*- coding: $emacs_charset; -*-\n# vim: fenc=$charset\n\nuse utf8;\n\n";
647 print $fh $header, "\n" if $header;
648 print $fh "$data_name = $delim[0]\n" if $data_name;
652 print $fh qq|$delim[1];\n\n1;\n|;
658 do { local ( @ARGV, $/ ) = $file; <> }
665 locales.pl - Collect strings for translation in kivitendo
669 locales.pl [options] lang_code
672 -n, --no-custom-files Do not process files whose name contains "_"
673 -c, --check-files Run extended checks on HTML files
674 -v, --verbose Be more verbose
675 -h, --help Show this help
681 =item B<-n>, B<--no-custom-files>
683 Do not process files whose name contains "_", e.g. "custom_io.pl".
685 =item B<-c>, B<--check-files>
687 Run extended checks on the usage of templates. This can be used to
688 discover HTML templates that are never used as well as the usage of
689 non-existing HTML templates.
691 =item B<-v>, B<--verbose>
699 This script collects strings from Perl files, the menu.ini file and
700 HTML templates and puts them into the file "all" for translation.