summaryrefslogtreecommitdiff
path: root/locale/escape_special_chars.php
blob: 0f494f19499b63bbac8e5f816560485810222574 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
#!/usr/bin/php -q
<?php
/*
LibreSSL - CAcert web application
Copyright (C) 2004-2012  CAcert Inc.

This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; version 2 of the License.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
*/

/* Convert special characters in UTF-8 encoded PO files to HTML entities */

// Keywords that open the two kinds of PO entry lines this script tells apart
define('MSGID', 'msgid');
define('MSGSTR', 'msgstr');

// Byte lengths of the keywords, computed once so the prefix checks below
// do not have to call strlen() for every input line
define('MSGID_LEN', strlen(MSGID));
define('MSGSTR_LEN', strlen(MSGSTR));

/**
 * Tell whether a line begins with the MSGSTR keyword.
 *
 * This is a case-sensitive, byte-wise prefix test: anything that starts with
 * the keyword matches (e.g. "msgstr[0]"), a line with leading whitespace
 * does not.
 *
 * @param string $line A single line read from the PO file
 * @return bool true if the first MSGSTR_LEN bytes of $line equal MSGSTR
 */
function is_msgstr($line) {
	// strncmp() yields 0 only when the first MSGSTR_LEN bytes are identical,
	// so a line shorter than the keyword can never match
	return strncmp($line, MSGSTR, MSGSTR_LEN) === 0;
}

/**
 * Tell whether a line begins with the MSGID keyword.
 *
 * This is a case-sensitive, byte-wise prefix test: anything that starts with
 * the keyword matches (e.g. "msgid_plural"), a line with leading whitespace
 * does not.
 *
 * @param string $line A single line read from the PO file
 * @return bool true if the first MSGID_LEN bytes of $line equal MSGID
 */
function is_msgid($line) {
	// strncmp() yields 0 only when the first MSGID_LEN bytes are identical,
	// so a line shorter than the keyword can never match
	return strncmp($line, MSGID, MSGID_LEN) === 0;
}


////////////// Main //////////////

// Skip the metadata (first msgid/msgstr pair): copy every line through
// unchanged, up to and including the first line that starts with "msgstr".
//
// The loop is driven by the return value of fgets() instead of feof().
// fgets() returns false both at end of input and on a read error, so the
// body only ever sees real lines and the loop terminates even if the stream
// fails without the EOF flag being set.
while (($line = fgets(STDIN)) !== false) {
	echo $line;

	if (is_msgstr($line)) {
		break;
	}
}

// true while the current line is part of a translation (a msgstr line or one
// of its quoted continuation lines), false for everything else
$msgstr = false;

// Drive the loop by the return value of fgets() instead of feof(): fgets()
// returns false at end of input and on read errors, so the body only ever
// sees real lines and the loop cannot spin on a failing stream.
while (($line = fgets(STDIN)) !== false) {
	if (is_msgstr($line)) {
		$msgstr = true;
	} elseif (strncmp(ltrim($line), '"', 1) !== 0) {
		// Anything that is neither a msgstr line nor a quoted continuation
		// line ends the translation: msgid, msgctxt, comments (including
		// obsolete "#~" entries) and blank lines must be passed through
		// untouched, otherwise source references, translator comments and
		// message contexts would get entity-escaped as well.
		$msgstr = false;
	}

	if ($msgstr) {
		// Escape everything that has a special HTML entity such as
		// &gt; or &auml; except quote characters
		$escaped = htmlentities($line, ENT_NOQUOTES, "UTF-8");

		if ($escaped === '') {
			// htmlentities() returns an empty string when the input is not
			// valid UTF-8. Emitting that would silently drop the whole line
			// and break the PO syntax, so keep the raw line and report it.
			fwrite(STDERR, "Warning: invalid UTF-8 in msgstr line, left unescaped: " . $line);
		} else {
			// Escape everything else -> all characters that don't have a
			// special HTML entity but are outside the ASCII range become
			// decimal numeric entities. mb_encode_numericentity() is used
			// because the "HTML-ENTITIES" pseudo-encoding of
			// mb_convert_encoding() is deprecated as of PHP 8.2.
			// Conversion map: array(first code point, last code point,
			// offset, mask).
			$line = mb_encode_numericentity(
				$escaped,
				array(0x80, 0x10FFFF, 0, 0x1FFFFF),
				"UTF-8"
			);
		}
	}

	echo $line;
}