diff options
Diffstat (limited to 'vendor/commerceguys/intl/scripts/language/generate.php')
-rw-r--r-- | vendor/commerceguys/intl/scripts/language/generate.php | 148 |
1 files changed, 0 insertions, 148 deletions
diff --git a/vendor/commerceguys/intl/scripts/language/generate.php b/vendor/commerceguys/intl/scripts/language/generate.php deleted file mode 100644 index 72e8d1b44..000000000 --- a/vendor/commerceguys/intl/scripts/language/generate.php +++ /dev/null @@ -1,148 +0,0 @@ -<?php - -/** - * Generates the json files stored in resources/language. - * - * CLDR lists about 515 languages, many of them dead (like Latin or Old English). - * In order to decrease the list to a reasonable size, only the languages - * for which CLDR itself has translations are listed. - */ -set_time_limit(0); - -// Downloaded from https://github.com/unicode-cldr/cldr-localenames-full.git -$localeDirectory = '../assets/cldr-localenames-full/main/'; -$enLanguages = $localeDirectory . 'en/languages.json'; - -if (!is_dir($localeDirectory)) { - die("The $localeDirectory directory was not found"); -} -if (!file_exists($enLanguages)) { - die("The $enLanguages file was not found"); -} -if (!function_exists('collator_create')) { - // Reimplementing intl's collator would be a huge undertaking, so we - // use it instead to presort the generated locale specific data. - die('The intl extension was not found.'); -} - -// Locales listed without a "-" match all variants. -// Locales listed with a "-" match only those exact ones. -$ignoredLocales = [ - // Interlingua is a made up language. - 'ia', - // Valencian differs from its parent only by a single character (è/é). - 'ca-ES-VALENCIA', - // Special "grouping" locales. - 'root', 'en-US-POSIX', 'en-001', 'en-150', 'es-419', -]; - -$languages = []; -// Load the "en" data first so that it can be used as a fallback for -// untranslated language names in other locales. -$languageData = json_decode(file_get_contents($enLanguages), true); -$languageData = $languageData['main']['en']['localeDisplayNames']['languages']; -foreach ($languageData as $languageCode => $languageName) { - if (strpos($languageCode, '-alt-') === false) { - $languages['en'][$languageCode] = [ - 'name' => $languageName, - ]; - } -} - -// Gather available locales. -$locales = []; -if ($handle = opendir($localeDirectory)) { - while (false !== ($entry = readdir($handle))) { - if (substr($entry, 0, 1) != '.') { - $entryParts = explode('-', $entry); - if (!in_array($entry, $ignoredLocales) && !in_array($entryParts[0], $ignoredLocales)) { - $locales[] = $entry; - } - } - } - closedir($handle); -} - -// Remove all languages that aren't an available locale at the same time. -// This reduces the language list from about 515 to about 185 languages. -foreach ($languages['en'] as $languageCode => $languageData) { - if (!in_array($languageCode, $locales)) { - unset($languages['en'][$languageCode]); - } -} - -// Load the localizations. -$untranslatedCounts = []; -foreach ($locales as $locale) { - $data = json_decode(file_get_contents($localeDirectory . $locale . '/languages.json'), true); - $data = $data['main'][$locale]['localeDisplayNames']['languages']; - foreach ($data as $languageCode => $languageName) { - if (isset($languages['en'][$languageCode])) { - // This language name is untranslated, use to the english version. - if ($languageCode == str_replace('_', '-', $languageName)) { - $languageName = $languages['en'][$languageCode]['name']; - // Maintain a count of untranslated languages per locale. - $untranslatedCounts += [$locale => 0]; - $untranslatedCounts[$locale]++; - } - - $languages[$locale][$languageCode] = [ - 'name' => $languageName, - ]; - } - } -} - -// Ignore locales that are more than 80% untranslated. -foreach ($untranslatedCounts as $locale => $count) { - $totalCount = count($languages[$locale]); - $untranslatedPercentage = $count * (100 / $totalCount); - if ($untranslatedPercentage >= 80) { - unset($languages[$locale]); - } -} - -// Identify localizations that are the same as the ones for the parent locale. -// For example, "fr-FR" if "fr" has the same data. -$duplicates = []; -foreach ($languages as $locale => $localizedLanguages) { - if (strpos($locale, '-') !== false) { - $localeParts = explode('-', $locale); - array_pop($localeParts); - $parentLocale = implode('-', $localeParts); - $diff = array_udiff($localizedLanguages, $languages[$parentLocale], function ($first, $second) { - return ($first['name'] == $second['name']) ? 0 : 1; - }); - - if (empty($diff)) { - // The duplicates are not removed right away because they might - // still be needed for other duplicate checks (for example, - // when there are locales like bs-Latn-BA, bs-Latn, bs). - $duplicates[] = $locale; - } - } -} -// Remove the duplicates. -foreach ($duplicates as $locale) { - unset($languages[$locale]); -} - -// Write out the localizations. -foreach ($languages as $locale => $localizedLanguages) { - $collator = collator_create($locale); - uasort($localizedLanguages, function ($a, $b) use ($collator) { - return collator_compare($collator, $a['name'], $b['name']); - }); - file_put_json($locale . '.json', $localizedLanguages); -} - -/** - * Converts the provided data into json and writes it to the disk. - */ -function file_put_json($filename, $data) -{ - $data = json_encode($data, JSON_PRETTY_PRINT | JSON_UNESCAPED_UNICODE); - // Indenting with tabs instead of 4 spaces gives us 20% smaller files. - $data = str_replace(' ', "\t", $data); - file_put_contents($filename, $data); -} |