summaryrefslogtreecommitdiff
path: root/languages/classes/LanguageRu.php
blob: 11b42cf9a20f96d99bf9a3015a3b85acde524766 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
<?php
/**
 * Russian (русский язык) specific code.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * http://www.gnu.org/copyleft/gpl.html
 *
 * @file
 * @ingroup Language
 */

/**
 * Russian (русский язык)
 *
 * You can contact Alexander Sigachov (alexander.sigachov at Google Mail)
 *
 * @ingroup Language
 */
class LanguageRu extends Language {

	/**
	 * Suffix substitutions used by convertGrammar(), keyed by grammatical case.
	 *
	 * Each inner array maps a nominative ending to the ending that replaces it.
	 * Within one case the endings are mutually exclusive (no word can end in
	 * two of them at once), so at most one rule applies to any given word.
	 * Cases that are absent here (dative, accusative, instrumental) have no
	 * rules yet and leave the word unchanged.
	 *
	 * @var array
	 */
	private static $grammarSuffixRules = array(
		// genitive case
		'genitive' => array(
			'ь' => 'я',
			'ия' => 'ии',
			'ка' => 'ки',
			'ти' => 'тей',
			'ды' => 'дов',
			'ник' => 'ника',
			'ные' => 'ных',
		),
		// prepositional case
		'prepositional' => array(
			'ь' => 'е',
			'ия' => 'ии',
			'ка' => 'ке',
			'ти' => 'тях',
			'ды' => 'дах',
			'ник' => 'нике',
			'ные' => 'ных',
		),
	);

	/**
	 * Split a UTF-8 string into an array of single characters.
	 *
	 * A /u regex is used instead of substr()/mb_substr() so that multi-byte
	 * characters are never cut in half. If the regex engine cannot process
	 * the input, an empty array is returned.
	 *
	 * @param $text string
	 * @return array
	 */
	private static function splitChars( $text ) {
		$matches = array();
		preg_match_all( '/./us', $text, $matches );
		return isset( $matches[0] ) ? $matches[0] : array();
	}

	/**
	 * Convert from the nominative form of a noun to some other case
	 * Invoked with {{grammar:case|word}}
	 *
	 * An explicit override in $wgGrammarForms['ru'][$case][$word] always wins.
	 * Otherwise a small set of suffix rules is applied. These rules are not
	 * perfect, but they are currently only used for Wikimedia site names, so
	 * add a special case for your site name to $wgGrammarForms if necessary.
	 *
	 * @param $word string Word in the nominative case
	 * @param $case string Target case, e.g. 'genitive' or 'prepositional'
	 * @return string The converted word, or $word unchanged if no rule applies
	 */
	public function convertGrammar( $word, $case ) {
		global $wgGrammarForms;
		if ( isset( $wgGrammarForms['ru'][$case][$word] ) ) {
			return $wgGrammarForms['ru'][$case][$word];
		}

		// Cases without any rules are stubs: nothing to do.
		if ( !isset( self::$grammarSuffixRules[$case] ) ) {
			return $word;
		}

		// Words containing Latin letters or an underscore are never inflected.
		if ( preg_match( "/[a-zA-Z_]/us", $word ) ) {
			return $word;
		}

		$chars = self::splitChars( $word );

		foreach ( self::$grammarSuffixRules[$case] as $suffix => $replacement ) {
			// Suffix length in characters, not bytes
			$length = count( self::splitChars( $suffix ) );
			if ( join( '', array_slice( $chars, -$length ) ) === $suffix ) {
				return join( '', array_slice( $chars, 0, -$length ) ) . $replacement;
			}
		}

		return $word;
	}

	/**
	 * Plural form transformations
	 *
	 * $forms[0] - singular form (for 1, 21, 31, 41...)
	 * $forms[1] - paucal form (for 2, 3, 4, 22, 23, 24, 32, 33, 34...)
	 * $forms[2] - plural form (for 0, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 25, 26...)
	 *
	 * Examples:
	 *   message with number
	 *     "Сделано $1 {{PLURAL:$1|изменение|изменения|изменений}}"
	 *     ("$1 change[s] were made")
	 *   message without number
	 *     "Действие не может быть выполнено по {{PLURAL:$1|следующей причине|следующим причинам}}:"
	 *     ("The action cannot be performed for the following reason[s]")
	 *
	 * @param $count int|string Number to choose the form for; numeric strings are accepted
	 * @param $forms array Candidate forms, see above
	 *
	 * @return string The selected form, or '' when no forms are given
	 */
	public function convertPlural( $count, $forms ) {
		if ( !count( $forms ) ) {
			return '';
		}

		// If the actual number is not mentioned in the expression, then just two forms are enough:
		// singular for $count == 1
		// plural   for $count != 1
		// For example, "This user belongs to {{PLURAL:$1|one group|several groups}}."
		if ( count( $forms ) === 2 ) {
			// Loose comparison on purpose: the count may arrive as a numeric
			// string such as "1", which a strict === 1 check would treat as plural.
			return $count == 1 ? $forms[0] : $forms[1];
		}

		// @todo FIXME: CLDR defines 4 plural forms. Form with decimals missing.
		// See http://unicode.org/repos/cldr-tmp/trunk/diff/supplemental/language_plural_rules.html#ru
		$forms = $this->preConvertPlural( $forms, 3 );

		// The rules depend only on the magnitude of the number; without this,
		// PHP's % keeps the sign and every negative count falls into the last form.
		$number = abs( $count );

		// 11..19 (and 111..119, 211..219, ...) always take the third form
		if ( $number > 10 && (int)floor( ( $number % 100 ) / 10 ) === 1 ) {
			return $forms[2];
		}

		switch ( $number % 10 ) {
			case 1:
				return $forms[0];
			case 2:
			case 3:
			case 4:
				return $forms[1];
			default:
				return $forms[2];
		}
	}

	/**
	 * Four-digit number should be without group commas (spaces)
	 * See manual of style at http://ru.wikipedia.org/wiki/Википедия:Оформление_статей
	 * So "1 234 567", "12 345" but "1234"
	 *
	 * This method itself inserts ',' as the group marker.
	 * NOTE(review): the conversion of that marker to a space is presumably
	 * done elsewhere by the separator transform table - confirm.
	 *
	 * @param $_ string Number in plain notation, e.g. "1234567.89"
	 *
	 * @return string The number with group markers inserted where required
	 */
	public function commafy( $_ ) {
		// Optional minus sign, at most four integer digits, optional fraction:
		// such numbers are returned without any grouping.
		if ( preg_match( '/^-?\d{1,4}(\.\d*)?$/', $_ ) ) {
			return $_;
		}

		// Work on the reversed string so that groups of three are counted from
		// the right. The negative lookahead rejects digit runs that are followed
		// by a '.' in the reversed string, i.e. the fractional part, which must
		// not be grouped.
		$grouped = preg_replace( '/(\d{3})(?=\d)(?!\d*\.)/', '$1,', strrev( $_ ) );

		return strrev( (string)$grouped );
	}
}