aboutsummaryrefslogtreecommitdiffstats
path: root/tests/unit/includes/LanguageTest.php
blob: 789dbe80b566da2342d9ceadbabceb712ced90a3 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
<?php
/*
 * Copyright (c) 2017 Hubzilla
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */

namespace Zotlabs\Tests\Unit\includes;

use Zotlabs\Tests\Unit\UnitTestCase;
use Text_LanguageDetect;
//use phpmock\phpunit\PHPMock;

/**
 * @brief Unit Test cases for include/language.php file.
 *
 * @author Klaus Weidenbach
 */
class LanguageTest extends UnitTestCase {
	//use PHPMock;

	/**
	 * @brief Checks the language code and confidence reported by Text_LanguageDetect.
	 *
	 * detect_language() itself is not called here (see the comments in the
	 * body); only the library it relies on is exercised, so that regressions
	 * after a library update are noticed.
	 *
	 * @dataProvider languageExamplesProvider
	 * @coversNothing
	 *
	 * @param string $text sample text handed to the detector
	 * @param string $langCode expected 2-letter language code
	 * @param float|null $confidence expected confidence rounded to 6 decimals,
	 *   or null when no confidence value is expected
	 */
	public function testDetectLanguage($text, $langCode, $confidence) {

		// php-mock can not mock global functions which are called by a global function.
		// If the calling function is in a namespace it would work.
		//$gc = $this->getFunctionMock(__NAMESPACE__, 'get_config');
		//$gc->expects($this->once())->willReturn(10)
		//$cg = $this->getFunctionMock('Zotlabs\Lib\Config', 'Get');
		//$cg->expects($this->once())->willReturn(10);
		//$this->assertEquals($langCode, detect_language($text));


		// Can not unit test detect_language(), therefore test the used library
		// only for now to find regressions on library updates.
		require_once('library/langdet/Text/LanguageDetect.php');
		$l = new Text_LanguageDetect;
		// return 2-letter ISO 639-1 (en) language code
		$l->setNameMode(2);
		$lng = $l->detectConfidence($text);

		// NOTE(review): the 'empty text' data set expects no language and no
		// confidence, so the detector presumably returns a non-array (e.g. null)
		// for such input - confirm against the bundled library. Reading offsets
		// from a non-array raises a notice/warning on PHP >= 7.4 and round(null)
		// is deprecated on PHP >= 8.1, so absent values are mapped to null
		// explicitly instead of relying on implicit conversions.
		$result = is_array($lng) ? $lng : [];
		$language = isset($result['language']) ? $result['language'] : null;
		$score = isset($result['confidence']) ? round($result['confidence'], 6) : null;

		$this->assertEquals($langCode, $language);
		$this->assertEquals($confidence, $score);
	}

	/**
	 * @brief Data sets for testDetectLanguage().
	 *
	 * @return array named data sets, each a list of
	 *   [sample text, expected language code, expected rounded confidence]
	 */
	public function languageExamplesProvider() {
		return [
			'empty text' => [
				'',
				'',
				null
			],
			'English' => [
				'English is a West Germanic language that was first spoken in early medieval England and is now a global lingua franca.[4][5] Named after the Angles, one of the Germanic tribes that migrated to England, it ultimately derives its name from the Anglia (Angeln) peninsula in the Baltic Sea. It is closely related to the Frisian languages, but its vocabulary has been significantly influenced by other Germanic languages, particularly Norse (a North Germanic language), as well as by Latin and Romance languages, especially French.',
				'da', // nearly impossible to find a wikipedia article which is detected as english
				0.000367 // minimum confidence is checked in detect_language(), but that is not yet unit testable
			],
			'German' => [
				'Deutschland ist ein Bundesstaat in Mitteleuropa. Er besteht aus 16 Ländern und ist als freiheitlich-demokratischer und sozialer Rechtsstaat verfasst. Die Bundesrepublik Deutschland stellt die jüngste Ausprägung des deutschen Nationalstaates dar. Mit rund 82,8 Millionen Einwohnern (31. Dezember 2016) zählt Deutschland zu den dicht besiedelten Flächenstaaten.',
				'de',
				0.134339
			],
			'Norwegian' => [
				'Kongeriket Norge er et nordisk, europeisk land og en selvstendig stat vest på Den skandinaviske halvøy. Landet er langt og smalt, og kysten strekker seg langs Nord-Atlanteren, hvor også Norges kjente fjorder befinner seg. Totalt dekker det relativt tynt befolkede landet 385 000 kvadratkilometer med litt over fem millioner innbyggere (2016).',
				'no',
				0.007076
			]
		];
	}


	/**
	 * @brief Checks the names returned by get_language_name().
	 *
	 * The function is called once with only the language code and then once
	 * per entry of $trans with the entry's key as second argument.
	 *
	 * @covers ::get_language_name
	 * @dataProvider getLanguageNameProvider
	 *
	 * @param string $lang language code to look up
	 * @param string $name expected result of get_language_name($lang)
	 * @param array $trans map of second argument => expected result of
	 *   get_language_name($lang, <second argument>)
	 */
	public function testGetLanguageName($lang, $name, $trans) {
		$this->assertEquals($name, get_language_name($lang));
		foreach ($trans as $key => $expected) {
			$this->assertEquals($expected, get_language_name($lang, $key));
		}
	}

	/**
	 * @brief Data sets for testGetLanguageName().
	 *
	 * @return array named data sets, each a list of
	 *   [language code, expected name, map of second argument => expected name]
	 */
	public function getLanguageNameProvider() {
		return [
			'empty language code' => [
				'',
				'',
				['de' => '']
			],
			'invalid language code' => [
				'zz',
				'zz',
				['de' => 'zz']
			],
			'de' => [
				'de',
				'German',
				[
					'de' => 'Deutsch',
					'nb' => 'tysk'
				]
			],
			'de-de' => [
				'de-de',
				'German',
				[
					'de-de' => 'Deutsch',
					'nb' => 'Deutsch' // should be tysk, seems to be a bug upstream
				]
			],
			'en' => [
				'en',
				'English',
				[
					'de' => 'Englisch',
					'nb' => 'engelsk'
				]
			],
			'en-gb' => [
				'en-gb',
				'British English',
				[
					'de' => 'Britisches Englisch',
					'nb' => 'britisk engelsk'
				]
			],
			'en-au' => [
				'en-au',
				'Australian English',
				[
					'de' => 'Australisches Englisch',
					'nb' => 'australsk engelsk'
				]
			],
			'nb' => [
				'nb',
				'Norwegian Bokmål',
				[
					'de' => 'Norwegisch Bokmål',
					'nb' => 'norsk bokmål'
				]
			]
		];
	}
}