Add a dummy header (charset=UTF-8), fix escaping, pot generated first
[lhc/web/wiklou.git] / maintenance / lang2po.php
1 <?php
2 /**
3 * Convert Language files to .po files !
4 *
5 * Todo:
6 * - generate .po header
7 * - fix escaping of \
8 */
9
10 /** This is a command line script */
11 require_once('commandLine.inc');
12 require_once('languages.inc');
13
14 define('ALL_LANGUAGES', true);
15 define('XGETTEXT_BIN', 'xgettext');
16 define('MSGINIT_BIN', 'msginit');
17 define('XGETTEXT_OPTIONS', '-n --keyword=wfMsg ');
18
19 define('LOCALE_OUTPUT_DIR', $IP.'/locale');
20
21
22 if( isset($options['help']) ) { usage(); die(); }
23 // default output is WikiText
24 if( !isset($options['lang']) ) { $options['lang'] = ALL_LANGUAGES; }
25
26 function usage() {
27 print <<<END
28 Usage: php lang2po.php [--help] [--lang=<langcode>] [--stdout]
29 --help: this message.
30 --lang: a lang code you want to generate a .po for (default: all languages).
31
32 END;
33 }
34
35
36 /**
37 * Return a dummy header for later edition.
38 * @return string A dummy header
39 */
40 function poHeader() {
41 return
42 '# SOME DESCRIPTIVE TITLE.
43 # Copyright (C) 2005 MediaWiki
44 # This file is distributed under the same license as the MediaWiki package.
45 # FIRST AUTHOR <EMAIL@ADDRESS>, YEAR.
46 #
47 #, fuzzy
48 msgid ""
49 msgstr ""
50 "Project-Id-Version: PACKAGE VERSION\n"
51 "Report-Msgid-Bugs-To: bugzilllaaaaa\n"
52 "POT-Creation-Date: 2005-08-16 20:13+0200\n"
53 "PO-Revision-Date: YEAR-MO-DA HO:MI+ZONE\n"
54 "Last-Translator: VARIOUS <nobody>\n"
55 "Language-Team: LANGUAGE <nobody>\n"
56 "MIME-Version: 1.0\n"
57 "Content-Type: text/plain; charset=UTF-8\n"
58 "Content-Transfer-Encoding: 8bit\n"
59 ';
60 }
61
62 /**
63 * generate and write a file in .po format.
64 *
65 * @param string $langcode Code of a language it will process.
66 * @param array &$messages Array containing the various messages.
67 * @return string Filename where stuff got saved or false.
68 */
69 function generatePo($langcode, &$messages) {
70 $data = poHeader();
71
72 // Generate .po entries
73 foreach($messages as $identifier => $content) {
74 $data .= "msgid \"$identifier\"\n";
75
76 // Escape backslashes
77 $tmp = str_replace('\\', '\\\\', $content);
78 // Escape doublelquotes
79 $tmp = preg_replace( "/(?<!\\\\)\"/", '\"', $tmp);
80 // Rewrite multilines to gettext format
81 $tmp = str_replace("\n", "\"\n\"", $tmp);
82
83 $data .= 'msgstr "'. $tmp . "\"\n\n";
84 }
85
86 // Write the content to a file in locale/XX/messages.po
87 $dir = LOCALE_OUTPUT_DIR.'/'.$langcode;
88 if( !is_dir($dir) ) { mkdir( $dir, 0770 ); }
89 $filename = $dir.'/fromlanguagefile.po';
90
91 $file = fopen( $filename , 'wb' );
92 if( fwrite( $file, $data ) ) {
93 fclose( $file );
94 return $filename;
95 } else {
96 fclose( $file );
97 return false;
98 }
99 }
100
101
102 // Generate a template .pot based on source tree
103 echo "Getting 'gettext' default messages from sources\n";
104 exec( XGETTEXT_BIN
105 .' '.XGETTEXT_OPTIONS
106 .' -o '.$IP.'/locale/wfMsg.pot'
107 .' '.$IP.'/includes/*php'
108 );
109
110
111 $langTool = new languages();
112
113 // Do all languages
114 foreach ( $langTool->getList() as $langcode) {
115 echo "Loading messages for $langcode:\t";
116 require_once( 'languages/Language' . $langcode . '.php' );
117 $arr = 'wgAllMessages'.$langcode;
118 if(!@is_array($$arr)) {
119 echo "NONE FOUND\n";
120 } else {
121 echo "ok\n";
122 if( ! generatePo($langcode, $$arr) ) {
123 echo "ERROR: Failed to wrote file.\n";
124 }
125 }
126 }
127 ?>