From 8e4c5db766ce23d05b8507991b04fece743147de Mon Sep 17 00:00:00 2001 From: Klaus Weidenbach Date: Wed, 25 Oct 2017 01:57:18 +0200 Subject: :arrow_up: Update Text_LanguageDetect. Update from v0.3.0 (2012) to v1.0.0 (2017) which should remove some warnings and improve PHP7 support. Using composer to handle this PEAR library now. Fix a problem in FeedutilsTest. --- library/langdet/docs/example_clui.php | 35 ----------------- library/langdet/docs/example_web.php | 72 ----------------------------------- library/langdet/docs/iso.php | 21 ---------- 3 files changed, 128 deletions(-) delete mode 100644 library/langdet/docs/example_clui.php delete mode 100644 library/langdet/docs/example_web.php delete mode 100644 library/langdet/docs/iso.php (limited to 'library/langdet/docs') diff --git a/library/langdet/docs/example_clui.php b/library/langdet/docs/example_clui.php deleted file mode 100644 index 8e7d8577d..000000000 --- a/library/langdet/docs/example_clui.php +++ /dev/null @@ -1,35 +0,0 @@ -getLanguages(); -sort($langs); -echo join(', ', $langs); - -echo "\ntotal ", count($langs), "\n\n"; - -while ($line = fgets($stdin)) { - $result = $l->detect($line, 4); - print_r($result); - $blocks = $l->detectUnicodeBlocks($line, true); - print_r($blocks); -} - -fclose($stdin); -unset($l); - -/* vim: set expandtab tabstop=4 shiftwidth=4 softtabstop=4: */ - -?> diff --git a/library/langdet/docs/example_web.php b/library/langdet/docs/example_web.php deleted file mode 100644 index 1e155fef2..000000000 --- a/library/langdet/docs/example_web.php +++ /dev/null @@ -1,72 +0,0 @@ - - - -Text_LanguageDetect demonstration - - -

Text_LanguageDetect

-Supported languages:\n"; -$langs = $l->getLanguages(); -sort($langs); -foreach ($langs as $lang) { - echo ucfirst($lang), ', '; - $i++; -} - -echo "
total $i

"; - -?> -
-Enter text to identify language (at least a couple of sentences):
- -
- -
-utf8strlen($q); - if ($len < 20) { // this value picked somewhat arbitrarily - echo "Warning: string not very long ($len chars)
\n"; - } - - $result = $l->detectConfidence($q); - - if ($result == null) { - echo "Text_LanguageDetect cannot identify this piece of text.

\n"; - } else { - echo "Text_LanguageDetect thinks this text is written in {$result['language']} ({$result['similarity']}, {$result['confidence']})

\n"; - } - - $result = $l->detectUnicodeBlocks($q, false); - if (!empty($result)) { - arsort($result); - echo "Unicode blocks present: ", join(', ', array_keys($result)), "\n

"; - } -} - -unset($l); - -/* vim: set expandtab tabstop=4 shiftwidth=4 softtabstop=4: */ - -?> - diff --git a/library/langdet/docs/iso.php b/library/langdet/docs/iso.php deleted file mode 100644 index 6d7ec1d2e..000000000 --- a/library/langdet/docs/iso.php +++ /dev/null @@ -1,21 +0,0 @@ -setNameMode(2); -echo $l->detectSimple('Das ist ein kleiner Text') . "\n"; - -//will output the ISO 639-2 three-letter language code -// "deu" -$l->setNameMode(3); -echo $l->detectSimple('Das ist ein kleiner Text') . "\n"; - -?> \ No newline at end of file -- cgit v1.2.3