aboutsummaryrefslogtreecommitdiffstats
path: root/maintenance/language/generateUpperCharTable.php
blob: c34fbbae2c89c8409320db8274b50b42d6ef573a (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
<?php
/**
 * Generate a JSON file containing a map of
 *   utf8_character => utf8_uppercase (or utf8_titlecase, with --titlecase)
 * for every Unicode code point except the surrogates. This provides the input
 * for generateUcfirstOverrides.php
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * http://www.gnu.org/copyleft/gpl.html
 *
 * @file
 * @ingroup MaintenanceLanguage
 */

// @codeCoverageIgnoreStart
require_once __DIR__ . '/../Maintenance.php';
// @codeCoverageIgnoreEnd

/**
 * Maintenance script that writes a JSON object mapping every Unicode code point
 * (as a UTF-8 string) to its upper-case form, or to its title-case form when
 * the --titlecase option is given.
 */
class GenerateUpperCharTable extends Maintenance {

	/**
	 * Register the script description and its command-line options
	 * (--outfile / -o and --titlecase).
	 */
	public function __construct() {
		parent::__construct();
		$this->addDescription( 'Generates the lowercase => uppercase json table' );
		$this->addOption( 'outfile', 'Output file', true, true, 'o' );
		$this->addOption( 'titlecase', 'Use title case instead of upper case' );
	}

	/**
	 * Build the character table and write it to the output file as JSON.
	 *
	 * Aborts through fatalError() if the table cannot be JSON-encoded or the
	 * output file cannot be written, so a failed run is not mistaken for a
	 * successful one.
	 */
	public function execute() {
		// NOTE(review): 'outfile' appears to be registered as a required option in the
		// constructor, so this fallback is presumably never used — confirm against
		// Maintenance::addOption().
		$outfile = $this->getOption( 'outfile', 'upperchar.json' );
		$titlecase = $this->getOption( 'titlecase' );

		$toUpperTable = [];
		for ( $i = 0; $i <= 0x10ffff; $i++ ) {
			// skip all surrogate codepoints or json_encode would fail.
			if ( $i >= 0xd800 && $i <= 0xdfff ) {
				continue;
			}
			$char = UtfNormal\Utils::codepointToUtf8( $i );
			// Name the encoding explicitly so the result does not depend on the
			// current mb_internal_encoding() setting.
			if ( $titlecase ) {
				$upper = mb_convert_case( $char, MB_CASE_TITLE, 'UTF-8' );
			} else {
				$upper = mb_strtoupper( $char, 'UTF-8' );
			}
			$toUpperTable[$char] = $upper;
		}

		$json = json_encode( $toUpperTable );
		if ( $json === false ) {
			// Without this check a failed encode would silently write an empty file.
			$this->fatalError( 'Could not encode the table as JSON: ' . json_last_error_msg() );
		}

		if ( file_put_contents( $outfile, $json ) === false ) {
			$this->fatalError( "Could not write to $outfile" );
		}
	}
}

// @codeCoverageIgnoreStart
// Store this script's class name in $maintClass, then include the file named by
// RUN_MAINTENANCE_IF_MAIN.
// NOTE(review): that constant is not defined in this file — presumably it comes from
// Maintenance.php and runs $maintClass when the script is invoked directly; confirm.
$maintClass = GenerateUpperCharTable::class;
require_once RUN_MAINTENANCE_IF_MAIN;
// @codeCoverageIgnoreEnd