b925a1b6b9
"Special characters which have no HTML-entities are not properly escaped"
80 lines
2 KiB
PHP
80 lines
2 KiB
PHP
#!/usr/bin/php -q
|
|
<?php
|
|
/*
|
|
LibreSSL - CAcert web application
|
|
Copyright (C) 2004-2012 CAcert Inc.
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; version 2 of the License.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, write to the Free Software
|
|
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
/* Convert special characters in UTF-8 encoded PO files to HTML entities */
|
|
|
|
define('MSGSTR', 'msgstr');
|
|
define('MSGSTR_LEN', strlen(MSGSTR));
|
|
define('MSGID', 'msgid');
|
|
define('MSGID_LEN', strlen(MSGID));
|
|
|
|
function is_msgstr($line) {
|
|
if (strlen($line) < MSGSTR_LEN) {
|
|
return false;
|
|
}
|
|
|
|
return substr_compare($line, MSGSTR, 0, MSGSTR_LEN) === 0;
|
|
}
|
|
|
|
function is_msgid($line) {
|
|
if (strlen($line) < MSGID_LEN) {
|
|
return false;
|
|
}
|
|
|
|
return substr_compare($line, MSGID, 0, MSGID_LEN) === 0;
|
|
}
|
|
|
|
|
|
////////////// Main //////////////
|
|
|
|
// Skip the metadata (first msgid/msgstr pair)
|
|
while (!feof(STDIN)) {
|
|
$line = fgets(STDIN);
|
|
|
|
echo $line;
|
|
|
|
if (is_msgstr($line)) {
|
|
break;
|
|
}
|
|
}
|
|
|
|
// determines if the current line belongs to a msgid or a msgstr
|
|
$msgstr = false;
|
|
|
|
while (!feof(STDIN)) {
|
|
$line = fgets(STDIN);
|
|
|
|
if (is_msgstr($line)) {
|
|
$msgstr = true;
|
|
} elseif (is_msgid($line)) {
|
|
$msgstr = false;
|
|
}
|
|
|
|
if ($msgstr) {
|
|
// Escape everything that has a special HTML entity such as
|
|
// > or ä except quote characters
|
|
$line = htmlentities($line, ENT_NOQUOTES, "UTF-8");
|
|
|
|
// Escape everything else -> all characters that don't have a special
|
|
// HTML entity but are outside the ASCII range
|
|
$line = mb_convert_encoding($line, "HTML-ENTITIES", "UTF-8");
|
|
}
|
|
echo $line;
|
|
}
|