Add base language codes as well

In some cases CLDR provides only a script variant we might not use.
This commit is contained in:
Niklas Laxström
2016-05-26 15:34:20 +02:00
parent 35ce36a611
commit 8e4a35bb66
3 changed files with 106 additions and 20 deletions

View File

@@ -64,8 +64,17 @@ foreach ( $supplementalData->territoryInfo->territory as $territoryRecord ) {
$languageCodeAttr = $languageAttributes['type'];
// Lower case is a convention for language codes in ULS.
// '_' is used in CLDR for compound codes and it's replaced with '-' here.
$parsedLangdb['territories'][$territoryCode][] =
strtr( strtolower( (string) $languageCodeAttr[0] ), '_', '-' );
$normalisedCode = strtr( strtolower( (string) $languageCodeAttr[0] ), '_', '-' );
$parsedLangdb['territories'][$territoryCode][] = $normalisedCode;
// In case of codes with variants, also add the base because ULS might consider
// them as separate languages, e.g. zh, zh-hant and zh-hans.
if ( strpos( $normalisedCode, '-' ) !== false ) {
$parts = explode( '-', $normalisedCode );
$parsedLangdb['territories'][$territoryCode][] = $parts[0];
}
}
}
@@ -91,6 +100,11 @@ foreach ( $parsedLangdb['territories'] as $territoryCode => $languages ) {
continue;
}
// Remove duplicates we might have created
$parsedLangdb['territories'][$territoryCode] =
array_unique( $parsedLangdb['territories'][$territoryCode] );
// We need to renumber or json conversion thinks these are objects
$parsedLangdb['territories'][$territoryCode] =
array_values( $parsedLangdb['territories'][$territoryCode] );