<?php
/**
 * Generates the normalizer data file for Malayalam.
 *
 * Provenance: introduced by commit c1f9b1f7b1b77776192048005dcc66dcf3df2bfb
 * (Pierre Schmitz, Sat, 27 Dec 2014 15:41:37 +0100, "Update to MediaWiki 1.24.1")
 * as the new file maintenance/language/generateNormalizerDataMl.php
 * (1 file changed, 69 insertions).
 *
 * NOTE(review): the copy this was restored from had lost everything between
 * the opening PHP tag and the assignment to mDescription (original file header,
 * require_once lines, class declaration and constructor signature). Those parts
 * are reconstructed below from the surviving code and must be confirmed against
 * the upstream file, including its license header.
 */

// NOTE(review): hexSequenceToUtf8() is not defined in this file; presumably it
// comes from the UtfNormal utilities. Confirm this path against upstream.
require_once __DIR__ . '/../../includes/normal/UtfNormalUtil.php';

// Provides the Maintenance base class and RUN_MAINTENANCE_IF_MAIN used below.
require_once __DIR__ . '/../Maintenance.php';

/**
 * Maintenance script that writes serialized/normalize-ml.ser, a serialized
 * map from Malayalam "consonant + virama + zero-width joiner" sequences to
 * the corresponding atomic chillu characters.
 */
class GenerateNormalizerDataMl extends Maintenance {
	/**
	 * Sets the description of this script.
	 */
	public function __construct() {
		parent::__construct();
		$this->mDescription = 'Generate the normalizer data file for Malayalam';
	}

	/**
	 * Tells the maintenance framework which kind of database access the
	 * script needs.
	 *
	 * @return int Maintenance::DB_NONE (by its name: no database required)
	 */
	public function getDbType() {
		return Maintenance::DB_NONE;
	}

	/**
	 * Builds the replacement table and writes it, serialized, to
	 * "$IP/serialized/normalize-ml.ser".
	 *
	 * Exits with an error instead of reporting success when the data file
	 * cannot be written.
	 */
	public function execute() {
		global $IP;

		// Keys are the sequences to replace, values their replacements; both
		// are written as space-separated hexadecimal code points.
		$hexPairs = array(
			# From http://unicode.org/versions/Unicode5.1.0/#Malayalam_Chillu_Characters
			'0D23 0D4D 200D' => '0D7A',
			'0D28 0D4D 200D' => '0D7B',
			'0D30 0D4D 200D' => '0D7C',
			'0D32 0D4D 200D' => '0D7D',
			'0D33 0D4D 200D' => '0D7E',

			# From http://permalink.gmane.org/gmane.science.linguistics.wikipedia.technical/46413
			'0D15 0D4D 200D' => '0D7F',
		);

		// Convert both sides with hexSequenceToUtf8() (presumably hex code
		// points to a UTF-8 string; the helper is defined elsewhere).
		$pairs = array();
		foreach ( $hexPairs as $hexSource => $hexDest ) {
			$source = hexSequenceToUtf8( $hexSource );
			$dest = hexSequenceToUtf8( $hexDest );
			$pairs[$source] = $dest;
		}

		$path = "$IP/serialized/normalize-ml.ser";
		// file_put_contents() returns false on failure; without this check the
		// script would claim success even though no data file was produced.
		if ( file_put_contents( $path, serialize( $pairs ) ) === false ) {
			// A non-zero second argument makes Maintenance::error() terminate
			// the script with that exit code.
			$this->error( "ml: unable to write $path", 1 );
		}

		echo "ml: " . count( $pairs ) . " pairs written.\n";
	}
}

$maintClass = 'GenerateNormalizerDataMl';
require_once RUN_MAINTENANCE_IF_MAIN;