3 # this version of locales processes not only all required .pl files
4 # but also all parse_html_templated files.
12 unshift(@INC, $FindBin::Bin . '/../modules/override'); # Use our own versions of various modules (e.g. YAML).
13 push (@INC, $FindBin::Bin . '/..');
20 use File::Slurp qw(slurp);
24 use List::MoreUtils qw(apply);
25 use List::Util qw(first);
28 use SL::System::Process;
31 $OUTPUT_AUTOFLUSH = 1;
41 my $basedir = "../..";
42 my $locales_dir = ".";
43 my $bindir = "$basedir/bin/mozilla";
44 my @progdirs = ( "$basedir/SL" );
45 my @menufiles = glob("${basedir}/menus/*/*");
46 my @webpages = qw(webpages mobile_webpages design40_webpages);
47 my @javascript_dirs = ($basedir .'/js', map { $basedir .'/templates/' . $_ } @webpages);
48 my $javascript_output_dir = $basedir .'/js';
49 my $submitsearch = qr/type\s*=\s*[\"\']?submit/i;
54 my %ignore_unused_templates = (
55 map { $_ => 1 } qw(ct/testpage.html oe/periodic_invoices_email.txt part/testpage.html t/render.html t/render.js task_server/failure_notification_email.txt
56 failed_background_jobs_report/email.txt presenter/items_list/items_list.txt)
59 my (%referenced_html_files, %locale, %htmllocale, %alllocales, %cached, %submit, %jslocale);
60 my ($ALL_HEADER, $MISSING_HEADER, $LOST_HEADER);
65 my ($top_dir_name) = @_;
72 tie my %dir_h, 'IO::Dir', $dir_name;
74 push @files, grep { -f } map { "${dir_name}/${_}" } keys %dir_h;
75 my @sub_dirs = grep { -d } map { "${dir_name}/${_}" } grep { ! m/^\.\.?$/ } keys %dir_h;
77 $finder->($_) for @sub_dirs;
80 $finder->($top_dir_name);
86 # overwrite existing entries with the ones from 'missing'
87 $self->{texts}->{$_} = $missing->{$_} for grep { $missing->{$_} } keys %alllocales;
89 # try to set missing entries from lost ones
90 my %lost_by_text = map { ($_->{text} => $_->{translation}) } @lost;
91 $self->{texts}->{$_} = $lost_by_text{$_} for grep { !$self->{texts}{$_} } keys %alllocales;
94 my @bindir_files = find_files($bindir);
95 my @progfiles = map { m:^(.+)/([^/]+)$:; [ $2, $1 ] } grep { /\.pl$/ && !/_custom/ } @bindir_files;
96 my @customfiles = grep /_custom/, @bindir_files;
98 push @progfiles, map { m:^(.+)/([^/]+)$:; [ $2, $1 ] } grep { /\.pm$/ } map { find_files($_) } @progdirs;
103 foreach my $sub_dir ("Pg-upgrade2", "Pg-upgrade2-auth") {
104 my $dir = "$basedir/sql/$sub_dir";
105 tie %dir_h, 'IO::Dir', $dir;
106 push @dbplfiles, map { [ $_, $dir ] } grep { /\.pl$/ } keys %dir_h;
109 # slurp the translations in
110 if (-f "$locales_dir/all") {
111 require "$locales_dir/all";
113 # load custom translation (more_texts)
114 for my $file (glob("${locales_dir}/more/*")) {
115 if (open my $in, "<", "$file") {
120 $self->{more_texts_temp}{$_} = $self->{more_texts}{$_} for keys %{ $self->{more_texts} };
123 $self->{more_texts} = delete $self->{more_texts_temp};
125 if (-f "$locales_dir/missing") {
126 require "$locales_dir/missing" ;
127 unlink "$locales_dir/missing";
129 if (-f "$locales_dir/lost") {
130 require "$locales_dir/lost";
131 unlink "$locales_dir/lost";
134 my %old_texts = %{ $self->{texts} || {} };
136 handle_file(@{ $_ }) for @progfiles;
137 handle_file(@{ $_ }) for @dbplfiles;
138 scanmenu($_) for @menufiles;
141 for my $file_name (grep { /\.(?:js|html)$/i } map({find_files($_)} @javascript_dirs)) {
142 scan_javascript_file($file_name);
145 # merge entries to translate with entries from files 'missing' and 'lost'
148 # Generate "all" without translations in more_texts.
149 # But keep the ones which are in both old_texts (texts) and more_texts,
150 # because these are the ones which are overwritten in more_texts for custom usage.
152 $to_keep{$_} = 1 for grep { !!$self->{more_texts}{$_} } keys %old_texts;
153 my @new_all = grep { $to_keep{$_} || !$self->{more_texts}{$_} } sort keys %alllocales;
156 file => "$locales_dir/all",
157 header => $ALL_HEADER,
158 data_name => '$self->{texts}',
159 data_sub => sub { _print_line($_, $self->{texts}{$_}, @_) for @new_all },
162 open(my $js_file, '>:encoding(utf8)', $javascript_output_dir .'/locale/'. $locale .'.js') || die;
163 print $js_file 'namespace("kivi").setupLocale({';
165 for my $key (sort(keys(%jslocale))) {
166 my $trans = $self->{more_texts}{$key} // $self->{texts}{$key};
167 print $js_file ((!$first_entry ? ',' : '') ."\n". _double_quote($key) .':'. _double_quote($trans));
170 print $js_file ("\n");
171 print $js_file ('});'."\n");
174 foreach my $text (keys %$missing) {
175 if ($locale{$text} || $htmllocale{$text}) {
176 unless ($self->{texts}{$text}) {
177 $self->{texts}{$text} = $missing->{$text};
183 # calc and generate missing
184 # don't add missing ones if we have a translation in more_texts
185 my @new_missing = grep { !$self->{more_texts}{$_} && !$self->{texts}{$_} } sort keys %alllocales;
189 my %existing_lc = map { (lc $_ => $_) } grep { $self->{texts}->{$_} } keys %{ $self->{texts} };
190 foreach my $entry (@new_missing) {
191 my $other = $existing_lc{lc $entry};
192 print "W: No entry for '${entry}' exists, but there is one with different case: '${other}'\n" if $other;
197 for my $string (@new_missing) {
198 print "new string '$string' in files:\n";
201 apply { s{^(?:\.\./)+}{} }
202 grep { $cached{$_}{all}{$string} }
208 file => "$locales_dir/missing",
209 header => $MISSING_HEADER,
210 data_name => '$missing',
211 data_sub => sub { _print_line($_, '', @_) for @new_missing },
215 # calc and generate lost
216 while (my ($text, $translation) = each %old_texts) {
217 next if ($alllocales{$text});
218 push @lost, { 'text' => $text, 'translation' => $translation };
222 splice @lost, 0, (scalar @lost - 50) if (scalar @lost > 50);
224 file => "$locales_dir/lost",
225 header => $LOST_HEADER,
227 data_name => '@lost',
229 _print_line($_->{text}, $_->{translation}, @_, template => " { 'text' => %s, 'translation' => %s },\n") for @lost;
234 my $trlanguage = slurp("$locales_dir/LANGUAGE");
237 search_unused_htmlfiles() if $opt_c;
239 my $count = scalar keys %alllocales;
240 my $notext = scalar @new_missing;
241 my $per = sprintf("%.1f", ($count - $notext) / $count * 100);
242 print "\n$trlanguage - ${per}%";
243 print " - $notext/$count missing" if $notext;
252 # These are all the texts to build the translations files.
253 # The file has the form of 'english text' => 'foreign text',
254 # you can add the translation in this file or in the 'missing' file
255 # run locales.pl from this directory to rebuild the translation files
257 $MISSING_HEADER = <<EOL;
258 # add the missing texts and run locales.pl to rebuild
260 $LOST_HEADER = <<EOL;
261 # The last 50 text strings, that have been removed.
262 # This file has been auto-generated by locales.pl. Please don't edit!
269 my ($opt_no_c, $ignore_for_compatiblity);
272 'check-files' => \$ignore_for_compatiblity,
273 'no-check-files' => \$opt_no_c,
274 'verbose' => \$opt_v,
275 'filenames' => \$opt_f,
289 pod2usage(-exitstatus => 0, -verbose => 2);
294 my $arg = shift @ARGV;
296 foreach my $dir ("../locale/$arg", "locale/$arg", "../$arg", $arg) {
297 next unless -d $dir && -f "$dir/all" && -f "$dir/LANGUAGE";
306 print "The locale directory '$arg' could not be found.\n";
310 } elsif (!-f 'all' || !-f 'LANGUAGE') {
311 print "locales.pl was not called from a locale/* subdirectory,\n"
312 . "and no locale directory name was given.\n";
316 $locale ||= (grep { $_ } split m:/:, getcwd())[-1];
321 my ($file, $dir) = @_;
322 print "\n$file" if $opt_v;
326 &scanfile("$dir/$file");
328 # scan custom_{module}.pl or {login}_{module}.pl files
329 foreach my $customfile (@customfiles) {
330 if ($customfile =~ /_$file/) {
331 if (-f "$dir/$customfile") {
332 &scanfile("$dir/$customfile");
340 sub extract_text_between_parenthesis {
341 my ($fh, $line) = @_;
342 my ($inside_string, $pos, $text, $quote_next) = (undef, 0, "", 0);
345 if (length($line) <= $pos) {
347 return ($text, "") unless ($line);
351 my $cur_char = substr($line, $pos, 1);
353 if (!$inside_string) {
354 if ((length($line) >= ($pos + 3)) && (substr($line, $pos, 2)) eq "qq") {
355 $inside_string = substr($line, $pos + 2, 1);
358 } elsif ((length($line) >= ($pos + 2)) &&
359 (substr($line, $pos, 1) eq "q")) {
360 $inside_string = substr($line, $pos + 1, 1);
363 } elsif (($cur_char eq '"') || ($cur_char eq '\'')) {
364 $inside_string = $cur_char;
366 } elsif (($cur_char eq ")") || ($cur_char eq ',')) {
367 return ($text, substr($line, $pos + 1));
372 $text .= '\\' unless $cur_char eq "'";
376 } elsif ($cur_char eq '\\') {
379 } elsif ($cur_char eq $inside_string) {
380 undef($inside_string);
393 my $dont_include_subs = shift;
394 my $scanned_files = shift;
399 $scanned_files = {} unless ($scanned_files);
400 return if ($scanned_files->{$file});
401 $scanned_files->{$file} = 1;
403 if (!defined $cached{$file}) {
405 return unless (-f "$file");
407 my $fh = new FileHandle;
408 open $fh, '<:encoding(utf8)', $file or die "$! : $file";
410 my ($is_submit, $line_no, $sub_line_no) = (0, 0, 0);
413 last if /^\s*__END__/;
417 # is this another file
418 if (/require\s+\W.*\.pl/) {
420 $newfile =~ s/require\s+\W//;
421 $newfile =~ s|bin/mozilla||;
422 $cached{$file}{scan}{"$bindir/$newfile"} = 1;
423 } elsif (/use\s+SL::([\w:]*)/) {
426 $cached{$file}{scannosubs}{"../../SL/${module}.pm"} = 1;
429 # Some calls to render() are split over multiple lines. Deal
431 while (/(?:parse_html_template2?|render)\s*\( *$/) {
436 # is this a template call?
437 if (/(?:parse_html_template2?|render)\s*\(\s*[\"\']([\w\/]+)\s*[\"\']/) {
438 my $new_file_name = $1;
439 if (/parse_html_template2/) {
440 print "E: " . strip_base($file) . " is still using 'parse_html_template2' for $new_file_name.html.\n";
444 for my $space (@webpages) {
445 for my $ext (qw(html js json)) {
446 my $new_file = "$basedir/templates/$space/$new_file_name.$ext";
448 $cached{$file}{scanh}{$new_file} = 1;
455 if ($opt_c && !$found_one) {
456 print "W: missing HTML template: $new_file_name.{html,json,js} (referenced from " . strip_base($file) . ")\n";
465 my ($null, $country) = split(/,/);
466 $country =~ s/^ +[\"\']//;
467 $country =~ s/[\"\'].*//;
473 # is it a submit button before $locale->
474 if (/$submitsearch/) {
476 if ($` !~ /locale->text/) {
478 $sub_line_no = $line_no;
483 if (/ (?: locale->text | \b t8 ) \b .*? \(/x) {
490 ($string, $_) = extract_text_between_parenthesis($fh, $postmatch);
493 # if there is no $ in the string record it
494 unless (($string =~ /\$\D.*/) || ("" eq $string)) {
496 # this guarantees one instance of string
497 $cached{$file}{locale}{$string} = 1;
499 # this one is for all the locales
500 $cached{$file}{all}{$string} = 1;
502 # is it a submit button before $locale->
504 $cached{$file}{submit}{$string} = 1;
507 } elsif ($postmatch =~ />/) {
511 # exit loop if there are no more locales on this line
512 ($rc) = ($postmatch =~ /locale->text | \b t8/x);
514 if ( ($postmatch =~ />/)
515 || (!$found && ($sub_line_no != $line_no) && />/)) {
525 $alllocales{$_} = 1 for keys %{$cached{$file}{all}};
526 $locale{$_} = 1 for keys %{$cached{$file}{locale}};
527 $submit{$_} = 1 for keys %{$cached{$file}{submit}};
529 scanfile($_, 0, $scanned_files) for keys %{$cached{$file}{scan}};
530 scanfile($_, 1, $scanned_files) for keys %{$cached{$file}{scannosubs}};
531 scanhtmlfile($_) for keys %{$cached{$file}{scanh}};
533 $referenced_html_files{$_} = 1 for keys %{$cached{$file}{scanh}};
539 my $menu = SL::YAML::LoadFile($file);
541 for my $node (@$menu) {
542 # possible for override files
543 next unless exists $node->{name};
545 $locale{$node->{name}} = 1;
546 $alllocales{$node->{name}} = 1;
547 $cached{$file}{all}{$node->{name}} = 1;
552 # we only need to do this for auth at the moment, because only auth scripts can include new rights, which are translatable
555 my $dbu = SL::DBUpgrade2->new(auth => $auth, path => SL::System::Process->exe_dir . '/sql/Pg-upgrade2-auth');
557 for my $upgrade ($dbu->sort_dbupdate_controls) {
558 for my $string (@{ $upgrade->{locales} || [] }) {
559 $locale{$string} = 1;
560 $alllocales{$string} = 1;
561 $cached{$upgrade->{tag}}{all}{$string} = 1;
566 sub unescape_template_string {
575 return if defined $cached{$file};
577 my $template_space = $file =~ m{templates/(\w+)/} ? $1 : 'webpages';
579 my %plugins = ( 'loaded' => { }, 'needed' => { } );
582 if (!open($fh, '<:encoding(utf8)', $file)) {
583 print "E: template file '$file' not found\n";
590 while (my $line = <$fh>) {
593 while ($line =~ m/\[\%[^\w]*use[^\w]+(\w+)[^\w]*?\%\]/gi) {
594 $plugins{loaded}->{$1} = 1;
597 while ($line =~ m/\[\%[^\w]*(\w+)\.\w+\(/g) {
599 $plugins{needed}->{$plugin} = 1 if (first { $_ eq $plugin } qw(HTML LxERP JavaScript JSON L P));
602 $plugins{needed}->{T8} = 1 if $line =~ m/\[\%.*\|.*\$T8/;
604 while ($line =~ m/(?: # Start of variant 1: LxERP.t8('...'); without surrounding [% ... %] tags
605 (LxERP\.t8)\( # LxERP.t8( ::Parameter $1::
606 ([\'\"]) # Start of the string to be translated ::Parameter $2::
607 (.*?) # The string to be translated ::Parameter $3::
608 (?<!\\)\2 # End of the string to be translated
609 | # Start of variant 2: [% '...' | $T8 %]
610 \[\% # Template start tag
611 [\-~#]? # Whitespace suppression
612 \s* # Optional, any amount of whitespace
613 ([\'\"]) # Start of the string to be translated ::Parameter $4::
614 (.*?) # The string to be translated ::Parameter $5::
615 (?<!\\)\4 # End of the string to be translated
616 \s*\|\s* # Pipe character with optional whitespace before and after
617 (\$T8) # Filter call ::Parameter $6::
618 .*? # Optional arguments for the filter
620 [\-~#]? # Whitespace suppression
621 \%\] # Template end tag
624 my $module = $1 || $6;
625 my $string = $3 || $5;
626 print "Found filter >>>$string<<<\n" if $debug;
627 substr $line, $LAST_MATCH_START[1], $LAST_MATCH_END[0] - $LAST_MATCH_START[0], '';
629 $string = unescape_template_string($string);
630 $cached{$file}{all}{$string} = 1;
631 $cached{$file}{html}{$string} = 1;
632 $cached{$file}{submit}{$string} = 1 if $PREMATCH =~ /$submitsearch/;
633 $plugins{needed}->{T8} = 1 if $module eq '$T8';
634 $plugins{needed}->{LxERP} = 1 if $module eq 'LxERP.t8';
637 while ($line =~ m/\[\% # Template start tag
638 [\-~#]* # Whitespace suppression
639 \s* # Optional, any amount of whitespace
640 (?: # The recognized template directives
645 \s+ # At least one whitespace character
646 [\'\"]? # Start of the file name
647 ([^\s]+) # Any number of non-whitespace characters -- the file name
648 \.(html|js) # Extension ".html" or ".js"; otherwise it may be the name of a block
650 my $new_file_name = "$basedir/templates/$template_space/$1.$2";
651 $cached{$file}{scanh}{$new_file_name} = 1;
652 substr $line, $LAST_MATCH_START[1], $LAST_MATCH_END[0] - $LAST_MATCH_START[0], '';
658 foreach my $plugin (keys %{ $plugins{needed} }) {
659 next if ($plugins{loaded}->{$plugin});
660 print "E: " . strip_base($file) . " requires the Template plugin '$plugin', but is not loaded with '[\% USE $plugin \%]'.\n";
663 # copy back into global arrays
664 $alllocales{$_} = 1 for keys %{$cached{$file}{all}};
665 $locale{$_} = 1 for keys %{$cached{$file}{html}};
666 $submit{$_} = 1 for keys %{$cached{$file}{submit}};
668 scanhtmlfile($_) for keys %{$cached{$file}{scanh}};
670 $referenced_html_files{$_} = 1 for keys %{$cached{$file}{scanh}};
673 sub scan_javascript_file {
676 open(my $fh, '<:encoding(utf8)', $file) || die('can not open file: '. $file);
678 while( my $line = readline($fh) ) {
689 my $text = unescape_template_string($2);
691 $jslocale{$text} = 1;
692 $alllocales{$text} = 1;
698 sub search_unused_htmlfiles {
699 my @unscanned_dirs = map { '../../templates/' . $_ } @webpages;
701 while (scalar @unscanned_dirs) {
702 my $dir = shift @unscanned_dirs;
704 foreach my $entry (<$dir/*>) {
706 push @unscanned_dirs, $entry;
708 } elsif (!$ignore_unused_templates{strip_base($entry)} && -f $entry && !$referenced_html_files{$entry}) {
709 print "W: unused HTML template: " . strip_base($entry) . "\n";
717 my $s = "$_[0]"; # Create a copy of the string.
720 $s =~ s|templates/\w+/||;
727 $val =~ s/(\'|\\$)/\\$1/g;
728 return "'" . $val . "'";
733 $val =~ s/(\"|\\$)/\\$1/g;
734 return '"'. $val .'"';
738 my $key = _single_quote(shift);
739 my $text = _single_quote(shift);
741 my $template = $params{template} || qq| %-29s => %s,\n|;
742 my $fh = $params{fh} || croak 'need filehandle in _print_line';
744 print $fh sprintf $template, $key, $text;
750 my $file = $params{file} || croak 'need filename in generate_file';
751 my $header = $params{header};
752 my $lines = $params{data_sub};
753 my $data_name = $params{data_name};
754 my @delim = split //, ($params{delim} || '{}');
756 open my $fh, '>:encoding(utf8)', $file or die "$! : $file";
758 print $fh "#!/usr/bin/perl\n# -*- coding: utf-8; -*-\n# vim: fenc=utf-8\n\nuse utf8;\n\n";
759 print $fh $header, "\n" if $header;
760 print $fh "$data_name = $delim[0]\n" if $data_name;
764 print $fh qq|$delim[1];\n\n1;\n|;
772 locales.pl - Collect strings for translation in kivitendo
776 locales.pl [options] lang_code
779 -c, --check-files Run extended checks on HTML files (default)
780 -n, --no-check-files Do not run extended checks on HTML files
781 -f, --filenames Show the filenames where new strings were found
782 -v, --verbose Be more verbose
783 -h, --help Show this help
789 =item B<-c>, B<--check-files>
791 Run extended checks on the usage of templates. This can be used to
792 discover HTML templates that are never used as well as the usage of
793 non-existing HTML templates. This is enabled by default.
795 =item B<-n>, B<--no-check-files>
797 Do not run extended checks on the usage of templates. See
800 =item B<-v>, B<--verbose>
808 This script collects strings from Perl files, the menu files and
809 HTML templates and puts them into the file "all" for translation.