diff options
author | Pascal Chevrel <pascal@chevrel.org> | 2012-04-25 08:05:02 +0200 |
---|---|---|
committer | Pascal Chevrel <pascal@chevrel.org> | 2012-04-25 08:05:02 +0200 |
commit | be4d9bf84103db5ed02d6ffd97e74f6c515f8515 (patch) | |
tree | 8e5a23b4e1282d1fe67958fcdf63fdeb0947834b /app/l10n/extract.php | |
parent | b518a33cf0274063261bccd0b21dca9b871a9755 (diff) | |
download | planet-be4d9bf84103db5ed02d6ffd97e74f6c515f8515.tar planet-be4d9bf84103db5ed02d6ffd97e74f6c515f8515.tar.gz planet-be4d9bf84103db5ed02d6ffd97e74f6c515f8515.tar.bz2 planet-be4d9bf84103db5ed02d6ffd97e74f6c515f8515.tar.xz planet-be4d9bf84103db5ed02d6ffd97e74f6c515f8515.zip |
extraction script for localization, extracts all localizable strings in the repo and updates the .lang files
Diffstat (limited to 'app/l10n/extract.php')
-rw-r--r-- | app/l10n/extract.php | 196 |
1 files changed, 196 insertions, 0 deletions
diff --git a/app/l10n/extract.php b/app/l10n/extract.php new file mode 100644 index 0000000..c63e564 --- /dev/null +++ b/app/l10n/extract.php @@ -0,0 +1,196 @@ +<?php + +/* + * This is a file parser to extract localizable strings from moonmoon + * + * It will scan the whole moonmoon repository for php files, extract + * localized strings and their localization notes and create .lang files. + * Existing translations will be automatically updated. + * A short report will be displayed afterwards. + * + * The easiest way to add a new locale is just to create an empty .lang file and then run the script + * + * The script scans for the files in the l10n/ folder to know which locales are supported + */ + +// released versions of moonmoon should immediately return for security +// return; + +$root = dirname(__FILE__) . '/../../'; +$GLOBALS['english'] = array(); + +include_once $root . '/app/classes/Simplel10n.class.php'; + +/* + * This is a file parser to extract localizable strings (in .php files) + * $GLOBALS['english'] is populated with localizable strings and their associated localization notes + * + */ + + +function extract_l10n_strings($file) { + $lines = file($file); + $patterns = array('/_g\((.*?)\)/', '/getString\((.*?)\)/', ); + + foreach ($lines as $line) { + + // Skip comments + if($line[0] == '#' || $line[0] == '/') continue; + + // parsing logic + foreach($patterns as $pattern) { + if(preg_match_all($pattern, $line, $matches, PREG_PATTERN_ORDER)) { + foreach($matches[1] as $val) { + + // Do not extract php variables calls or empty strings + if($val[0] == '$' || $val == '') continue; + + // Is there a localization comment ? + $l10n_note = explode("',", $val); + + // Also test strings in double quotes + if(count($l10n_note) == 1) { + $l10n_note = explode('",', $val); + } + + // Extract cleaned up strings + if(count($l10n_note) == 2) { + $l10n_str = substr(trim($l10n_note[0]), 1, -1); + $l10n_note = substr(trim($l10n_note[1]), 1, -1); + } else { + $l10n_str = substr(trim($val), 1, -1); # Remove quotes around the string + $l10n_note = ''; + } + + if(!array_key_exists($l10n_str, $GLOBALS['english'])) { + $GLOBALS['english'][$l10n_str] = array($l10n_str, $l10n_note); + } + } + } + } + } +} + +/* + * This is a function echoing $GLOBALS['english'] in .lang format + * Typical usage would be: + * <?php + * extract_l10n_strings('.'); + * show_l10n_strings() ; + */ + +function show_l10n_strings() { + + header('Content-Type:text/plain'); + + foreach($GLOBALS['english'] as $val) { + if($val[1]) { + echo '# ' . $val[1] . "\n"; + } + echo ";$val[0]\n"; + echo "$val[0]\n\n\n"; + } +} + +/* + * Recursively scan files in a folder + * returns an array of file paths + */ + +function find_all_files($dir) { + + $result = array(); + $root = scandir($dir); + + $ignore = array('.', '..', '.git', '.svn', '.hg', 'cache', '.gitignore', 'lib'); + + foreach($root as $value) { + + if(in_array($value, $ignore)) { + continue; + } + + if(is_file("$dir/$value")) { + $split = explode('.', $value); + if(isset($split[1]) && $split[1] == 'php'){ + $result[] = "$dir/$value"; + } + continue; + } + + foreach(find_all_files("$dir/$value") as $value) { + $result[]=$value; + } + } + + return $result; +} + +function update_lang_files($source, $dest) { + + $files = find_all_files($source); + + foreach($files as $file) { + extract_l10n_strings($file); + } + + + $files = scandir($dest); + $ignore = array('.', '..'); + + + // list locales + $locales = array(); + foreach($files as $file) { + + if(in_array($file, $ignore)) { + continue; + } + + $split = explode('.', $file); + + if($split[1] == 'lang') { + $locales[] = $split[0]; + } + } + + + foreach($locales as $locale) { + $status[$locale] = 0; + $lang_file_path = $dest . '/' . $locale; + + Simplel10n::load($lang_file_path); + + ob_start(); + foreach($GLOBALS['english'] as $key => $val) { + + if($val[1]) { + echo '# Translation note: ' . $val[1] . "\n"; + } + echo ";$val[0]\n"; + + $value = @Simplel10n::getString($key); + echo $value . "\n\n\n"; + if($value == $val[0]) { + $status[$locale]++; + } + } + + $content = ob_get_contents(); + ob_end_clean(); + file_put_contents($lang_file_path. '.lang', $content); + + unset($GLOBALS['locale']); + } + + + // Display a short status report + header('Content-Type:text/plain'); + echo "Number of English strings: " . count($GLOBALS['english']) . "\n"; + echo "Your installation has these languages installed: " . implode(', ', $locales) . "\n"; + foreach($locales as $val) { + echo $val . " has " . $status[$val] . " untranslated strings.\n"; + } +} + +update_lang_files($root, $root . 'app/l10n'); |