From cdd945b0dad2da59954c4774ef6a044f255aa820 Mon Sep 17 00:00:00 2001 From: Andreas Beeker Date: Sun, 8 Dec 2019 23:36:02 +0000 Subject: [PATCH] Bug 63927 - Inconsistent mapping of Norwegian locales for date formats git-svn-id: https://svn.apache.org/repos/asf/poi/trunk@1871066 13f79535-47bb-0310-9956-ffa450edef68 --- .../poi/ss/util/DateFormatConverter.java | 287 +----- src/java/org/apache/poi/util/LocaleID.java | 574 +++++++++++ src/java/org/apache/poi/util/LocaleUtil.java | 948 +----------------- .../poi/ss/util/TestDateFormatConverter.java | 53 +- 4 files changed, 692 insertions(+), 1170 deletions(-) create mode 100644 src/java/org/apache/poi/util/LocaleID.java diff --git a/src/java/org/apache/poi/ss/util/DateFormatConverter.java b/src/java/org/apache/poi/ss/util/DateFormatConverter.java index cfe403b5af..9a49da3b67 100644 --- a/src/java/org/apache/poi/ss/util/DateFormatConverter.java +++ b/src/java/org/apache/poi/ss/util/DateFormatConverter.java @@ -24,6 +24,7 @@ import java.util.List; import java.util.Locale; import java.util.Map; +import org.apache.poi.util.LocaleID; import org.apache.poi.util.POILogFactory; import org.apache.poi.util.POILogger; @@ -46,56 +47,59 @@ import org.apache.poi.util.POILogger; * * TODO Generalise this for all Excel format strings */ -public class DateFormatConverter { +@SuppressWarnings("unused") +public final class DateFormatConverter { private static POILogger logger = POILogFactory.getLogger(DateFormatConverter.class); - + + private DateFormatConverter() { + } + public static class DateFormatTokenizer { String format; int pos; - + public DateFormatTokenizer(String format) { this.format = format; } - + public String getNextToken() { if( pos >= format.length() ) { return null; } int subStart = pos; - char curChar = format.charAt(pos); + final char curChar = format.charAt(pos); ++pos; if( curChar == '\'' ) { - while( ( pos < format.length() ) && ( ( curChar = format.charAt(pos) ) != '\'' ) ) { + while( ( pos < format.length() ) && ( format.charAt(pos) != '\'' ) ) { ++pos; } if( pos < format.length() ) { ++pos; } } else { - char activeChar = curChar; - while( ( pos < format.length() ) && ( ( curChar = format.charAt(pos) ) == activeChar ) ) { + while( ( pos < format.length() ) && ( format.charAt(pos) == curChar ) ) { ++pos; } } return format.substring(subStart,pos); } - + public static String[] tokenize( String format ) { List result = new ArrayList<>(); - + DateFormatTokenizer tokenizer = new DateFormatTokenizer(format); String token; while( ( token = tokenizer.getNextToken() ) != null ) { result.add(token); } - + return result.toArray(new String[0]); } - + @Override public String toString() { StringBuilder result = new StringBuilder(); - + DateFormatTokenizer tokenizer = new DateFormatTokenizer(format); String token; while( ( token = tokenizer.getNextToken() ) != null ) { @@ -104,17 +108,16 @@ public class DateFormatConverter { } result.append("[").append(token).append("]"); } - + return result.toString(); - } - } - + } + } + private static Map tokenConversions = prepareTokenConversions(); - private static Map localePrefixes = prepareLocalePrefixes(); - + private static Map prepareTokenConversions() { Map result = new HashMap<>(); - + result.put( "EEEE", "dddd" ); result.put( "EEE", "ddd" ); result.put( "EE", "ddd" ); @@ -130,218 +133,31 @@ public class DateFormatConverter { result.put( "S", "0" ); result.put( "SS", "00" ); result.put( "SSS", "000" ); - - return result; - } - - private static Map prepareLocalePrefixes() { - Map result = new HashMap<>(); - - result.put( "af", "[$-0436]" ); - result.put( "am", "[$-45E]" ); - result.put( "ar_ae", "[$-3801]" ); - result.put( "ar_bh", "[$-3C01]" ); - result.put( "ar_dz", "[$-1401]" ); - result.put( "ar_eg", "[$-C01]" ); - result.put( "ar_iq", "[$-0801]" ); - result.put( "ar_jo", "[$-2C01]" ); - result.put( "ar_kw", "[$-3401]" ); - result.put( "ar_lb", "[$-3001]" ); - result.put( "ar_ly", "[$-1001]" ); - result.put( "ar_ma", "[$-1801]" ); - result.put( "ar_om", "[$-2001]" ); - result.put( "ar_qa", "[$-4001]" ); - result.put( "ar_sa", "[$-0401]" ); - result.put( "ar_sy", "[$-2801]" ); - result.put( "ar_tn", "[$-1C01]" ); - result.put( "ar_ye", "[$-2401]" ); - result.put( "as", "[$-44D]" ); - result.put( "az_az", "[$-82C]" ); - result.put( "az_az", "[$-42C]" ); - result.put( "be", "[$-0423]" ); - result.put( "bg", "[$-0402]" ); - result.put( "bn", "[$-0845]" ); - result.put( "bn", "[$-0445]" ); - result.put( "bo", "[$-0451]" ); - result.put( "bs", "[$-141A]" ); - result.put( "ca", "[$-0403]" ); - result.put( "cs", "[$-0405]" ); - result.put( "cy", "[$-0452]" ); - result.put( "da", "[$-0406]" ); - result.put( "de_at", "[$-C07]" ); - result.put( "de_ch", "[$-0807]" ); - result.put( "de_de", "[$-0407]" ); - result.put( "de_li", "[$-1407]" ); - result.put( "de_lu", "[$-1007]" ); - result.put( "dv", "[$-0465]" ); - result.put( "el", "[$-0408]" ); - result.put( "en_au", "[$-C09]" ); - result.put( "en_bz", "[$-2809]" ); - result.put( "en_ca", "[$-1009]" ); - result.put( "en_cb", "[$-2409]" ); - result.put( "en_gb", "[$-0809]" ); - result.put( "en_ie", "[$-1809]" ); - result.put( "en_in", "[$-4009]" ); - result.put( "en_jm", "[$-2009]" ); - result.put( "en_nz", "[$-1409]" ); - result.put( "en_ph", "[$-3409]" ); - result.put( "en_tt", "[$-2C09]" ); - result.put( "en_us", "[$-0409]" ); - result.put( "en_za", "[$-1C09]" ); - result.put( "es_ar", "[$-2C0A]" ); - result.put( "es_bo", "[$-400A]" ); - result.put( "es_cl", "[$-340A]" ); - result.put( "es_co", "[$-240A]" ); - result.put( "es_cr", "[$-140A]" ); - result.put( "es_do", "[$-1C0A]" ); - result.put( "es_ec", "[$-300A]" ); - result.put( "es_es", "[$-40A]" ); - result.put( "es_gt", "[$-100A]" ); - result.put( "es_hn", "[$-480A]" ); - result.put( "es_mx", "[$-80A]" ); - result.put( "es_ni", "[$-4C0A]" ); - result.put( "es_pa", "[$-180A]" ); - result.put( "es_pe", "[$-280A]" ); - result.put( "es_pr", "[$-500A]" ); - result.put( "es_py", "[$-3C0A]" ); - result.put( "es_sv", "[$-440A]" ); - result.put( "es_uy", "[$-380A]" ); - result.put( "es_ve", "[$-200A]" ); - result.put( "et", "[$-0425]" ); - result.put( "eu", "[$-42D]" ); - result.put( "fa", "[$-0429]" ); - result.put( "fi", "[$-40B]" ); - result.put( "fo", "[$-0438]" ); - result.put( "fr_be", "[$-80C]" ); - result.put( "fr_ca", "[$-C0C]" ); - result.put( "fr_ch", "[$-100C]" ); - result.put( "fr_fr", "[$-40C]" ); - result.put( "fr_lu", "[$-140C]" ); - result.put( "gd", "[$-43C]" ); - result.put( "gd_ie", "[$-83C]" ); - result.put( "gn", "[$-0474]" ); - result.put( "gu", "[$-0447]" ); - result.put( "he", "[$-40D]" ); - result.put( "hi", "[$-0439]" ); - result.put( "hr", "[$-41A]" ); - result.put( "hu", "[$-40E]" ); - result.put( "hy", "[$-42B]" ); - result.put( "id", "[$-0421]" ); - result.put( "is", "[$-40F]" ); - result.put( "it_ch", "[$-0810]" ); - result.put( "it_it", "[$-0410]" ); - result.put( "ja", "[$-0411]" ); - result.put( "kk", "[$-43F]" ); - result.put( "km", "[$-0453]" ); - result.put( "kn", "[$-44B]" ); - result.put( "ko", "[$-0412]" ); - result.put( "ks", "[$-0460]" ); - result.put( "la", "[$-0476]" ); - result.put( "lo", "[$-0454]" ); - result.put( "lt", "[$-0427]" ); - result.put( "lv", "[$-0426]" ); - result.put( "mi", "[$-0481]" ); - result.put( "mk", "[$-42F]" ); - result.put( "ml", "[$-44C]" ); - result.put( "mn", "[$-0850]" ); - result.put( "mn", "[$-0450]" ); - result.put( "mr", "[$-44E]" ); - result.put( "ms_bn", "[$-83E]" ); - result.put( "ms_my", "[$-43E]" ); - result.put( "mt", "[$-43A]" ); - result.put( "my", "[$-0455]" ); - result.put( "ne", "[$-0461]" ); - result.put( "nl_be", "[$-0813]" ); - result.put( "nl_nl", "[$-0413]" ); - result.put( "no_no", "[$-0814]" ); - result.put( "or", "[$-0448]" ); - result.put( "pa", "[$-0446]" ); - result.put( "pl", "[$-0415]" ); - result.put( "pt_br", "[$-0416]" ); - result.put( "pt_pt", "[$-0816]" ); - result.put( "rm", "[$-0417]" ); - result.put( "ro", "[$-0418]" ); - result.put( "ro_mo", "[$-0818]" ); - result.put( "ru", "[$-0419]" ); - result.put( "ru_mo", "[$-0819]" ); - result.put( "sa", "[$-44F]" ); - result.put( "sb", "[$-42E]" ); - result.put( "sd", "[$-0459]" ); - result.put( "si", "[$-45B]" ); - result.put( "sk", "[$-41B]" ); - result.put( "sl", "[$-0424]" ); - result.put( "so", "[$-0477]" ); - result.put( "sq", "[$-41C]" ); - result.put( "sr_sp", "[$-C1A]" ); - result.put( "sr_sp", "[$-81A]" ); - result.put( "sv_fi", "[$-81D]" ); - result.put( "sv_se", "[$-41D]" ); - result.put( "sw", "[$-0441]" ); - result.put( "ta", "[$-0449]" ); - result.put( "te", "[$-44A]" ); - result.put( "tg", "[$-0428]" ); - result.put( "th", "[$-41E]" ); - result.put( "tk", "[$-0442]" ); - result.put( "tn", "[$-0432]" ); - result.put( "tr", "[$-41F]" ); - result.put( "ts", "[$-0431]" ); - result.put( "tt", "[$-0444]" ); - result.put( "uk", "[$-0422]" ); - result.put( "ur", "[$-0420]" ); - result.put( "UTF_8", "[$-0000]" ); - result.put( "uz_uz", "[$-0843]" ); - result.put( "uz_uz", "[$-0443]" ); - result.put( "vi", "[$-42A]" ); - result.put( "xh", "[$-0434]" ); - result.put( "yi", "[$-43D]" ); - result.put( "zh_cn", "[$-0804]" ); - result.put( "zh_hk", "[$-C04]" ); - result.put( "zh_mo", "[$-1404]" ); - result.put( "zh_sg", "[$-1004]" ); - result.put( "zh_tw", "[$-0404]" ); - result.put( "zu", "[$-0435]" ); - result.put( "ar", "[$-0401]" ); - result.put( "bn", "[$-0845]" ); - result.put( "de", "[$-0407]" ); - result.put( "en", "[$-0409]" ); - result.put( "es", "[$-40A]" ); - result.put( "fr", "[$-40C]" ); - result.put( "it", "[$-0410]" ); - result.put( "ms", "[$-43E]" ); - result.put( "nl", "[$-0413]" ); - result.put( "nn", "[$-0814]" ); - result.put( "no", "[$-0414]" ); - result.put( "pt", "[$-0816]" ); - result.put( "sr", "[$-C1A]" ); - result.put( "sv", "[$-41D]" ); - result.put( "uz", "[$-0843]" ); - result.put( "zh", "[$-0804]" ); - - result.put( "ga", "[$-43C]" ); - result.put( "ga_ie", "[$-83C]" ); - result.put( "in", "[$-0421]" ); - result.put( "iw", "[$-40D]" ); - - // JDK 8 adds an empty locale-string, see also https://issues.apache.org/jira/browse/LANG-941 - result.put( "", "[$-0409]" ); - return result; } - + public static String getPrefixForLocale( Locale locale ) { - String localeString = locale.toString().toLowerCase(locale); - String result = localePrefixes.get( localeString ); - if( result == null ) { - result = localePrefixes.get( localeString.substring( 0, 2 ) ); - if( result == null ) { - Locale parentLocale = new Locale(localeString.substring( 0, 2 )); - logger.log( POILogger.ERROR, "Unable to find prefix for " + locale + "(" + locale.getDisplayName(Locale.ROOT) + ") or " - + localeString.substring( 0, 2 ) + "(" + parentLocale.getDisplayName(Locale.ROOT) + ")" ); + final String languageTag = locale.toLanguageTag(); + if ("".equals(languageTag)) { + // JDK 8 adds an empty locale-string, see also https://issues.apache.org/jira/browse/LANG-941 + return "[$-0409]"; + } + + LocaleID loc = LocaleID.lookupByLanguageTag(languageTag); + if (loc == null) { + String cmpTag = (languageTag.indexOf('_') > -1) ? languageTag.replace('_','-') : languageTag; + int idx = languageTag.length(); + while (loc == null && (idx = cmpTag.lastIndexOf('-', idx-1)) > 0) { + loc = LocaleID.lookupByLanguageTag(languageTag.substring(0, idx)); + } + if (loc == null) { + logger.log( POILogger.ERROR, "Unable to find prefix for Locale '" + languageTag + "' or its parent locales." ); return ""; } } - return result; + + return String.format(Locale.ROOT, "[$-%04X]", loc.getLcid()); } public static String convert( Locale locale, DateFormat df ) { @@ -351,7 +167,7 @@ public class DateFormatConverter { public static String convert( Locale locale, String format ) { StringBuilder result = new StringBuilder(); - + result.append(getPrefixForLocale(locale)); DateFormatTokenizer tokenizer = new DateFormatTokenizer(format); String token; @@ -369,7 +185,7 @@ public class DateFormatConverter { result.append(";@"); return result.toString().trim(); } - + public static String getJavaDatePattern(int style, Locale locale) { DateFormat df = DateFormat.getDateInstance(style, locale); if( df instanceof SimpleDateFormat ) { @@ -378,18 +194,17 @@ public class DateFormatConverter { switch( style ) { case DateFormat.SHORT: return "d/MM/yy"; - case DateFormat.MEDIUM: - return "MMM d, yyyy"; case DateFormat.LONG: return "MMMM d, yyyy"; case DateFormat.FULL: return "dddd, MMMM d, yyyy"; default: + case DateFormat.MEDIUM: return "MMM d, yyyy"; } } } - + public static String getJavaTimePattern(int style, Locale locale) { DateFormat df = DateFormat.getTimeInstance(style, locale); if( df instanceof SimpleDateFormat ) { @@ -398,18 +213,15 @@ public class DateFormatConverter { switch( style ) { case DateFormat.SHORT: return "h:mm a"; + default: case DateFormat.MEDIUM: - return "h:mm:ss a"; case DateFormat.LONG: - return "h:mm:ss a"; case DateFormat.FULL: return "h:mm:ss a"; - default: - return "h:mm:ss a"; } } } - + public static String getJavaDateTimePattern(int style, Locale locale) { DateFormat df = DateFormat.getDateTimeInstance(style, style, locale); if( df instanceof SimpleDateFormat ) { @@ -418,16 +230,15 @@ public class DateFormatConverter { switch( style ) { case DateFormat.SHORT: return "M/d/yy h:mm a"; - case DateFormat.MEDIUM: - return "MMM d, yyyy h:mm:ss a"; case DateFormat.LONG: return "MMMM d, yyyy h:mm:ss a"; case DateFormat.FULL: return "dddd, MMMM d, yyyy h:mm:ss a"; default: + case DateFormat.MEDIUM: return "MMM d, yyyy h:mm:ss a"; } } } - + } diff --git a/src/java/org/apache/poi/util/LocaleID.java b/src/java/org/apache/poi/util/LocaleID.java new file mode 100644 index 0000000000..975442b5bc --- /dev/null +++ b/src/java/org/apache/poi/util/LocaleID.java @@ -0,0 +1,574 @@ +/* ==================================================================== + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +==================================================================== */ + +package org.apache.poi.util; + +import static java.util.Calendar.SATURDAY; +import static java.util.Calendar.SUNDAY; + +import java.util.Calendar; +import java.util.Map; +import java.util.function.Function; +import java.util.stream.Collectors; +import java.util.stream.Stream; + +/** + * Locale Collection

+ *

+ * This enum can be used to map between Windows LCID and Java {@link java.util.Locale Locales} + * + * @see [MS-LCID]: Windows Language Code Identifier (LCID) Reference + */ +@SuppressWarnings("unused") +public enum LocaleID { + AR(0x0001, "ar", "ar", "Arabic", 1256, SUNDAY), + BG(0x0002, "bg", "bg", "Bulgarian", 1251, -1), + CA(0x0003, "ca", "ca", "Catalan", 1252, -1), + ZH_HANS(0x0004, "zh_hans", "zh-Hans", "Chinese (Simplified)", 936, -1), + CS(0x0005, "cs", "cs", "Czech", 1250, -1), + DA(0x0006, "da", "da", "Danish", 1252, -1), + DE(0x0007, "de", "de", "German", 1252, -1), + EL(0x0008, "el", "el", "Greek", 1253, -1), + EN(0x0009, "en", "en", "English", 1252, -1), + ES(0x000A, "es", "es", "Spanish", 1252, -1), + FI(0x000B, "fi", "fi", "Finnish", 1252, -1), + FR(0x000C, "fr", "fr", "French", 1252, -1), + HE(0x000D, "he", "he", "Hebrew", 1255, SUNDAY), + HU(0x000E, "hu", "hu", "Hungarian", 1250, -1), + IS(0x000F, "is", "is", "Icelandic", 1252, -1), + IT(0x0010, "it", "it", "Italian", 1252, -1), + JA(0x0011, "ja", "ja", "Japanese", 932, SUNDAY), + KO(0x0012, "ko", "ko", "Korean", 949, SUNDAY), + NL(0x0013, "nl", "nl", "Dutch", 1252, -1), + NO(0x0014, "no", "no", "Norwegian", 1252, -1), + PL(0x0015, "pl", "pl", "Polish", 1250, -1), + PT(0x0016, "pt", "pt", "Portuguese", 1252, SUNDAY), + RM(0x0017, "rm", "rm", "Romansh", 1252, -1), + RO(0x0018, "ro", "ro", "Romanian", 1250, -1), + RU(0x0019, "ru", "ru", "Russian", 1251, -1), + HR(0x001A, "hr", "hr", "Croatian", 1250, -1), + SK(0x001B, "sk", "sk", "Slovak", 1250, -1), + SQ(0x001C, "sq", "sq", "Albanian", 1250, -1), + SV(0x001D, "sv", "sv", "Swedish", 1252, -1), + TH(0x001E, "th", "th", "Thai", 874, -1), + TR(0x001F, "tr", "tr", "Turkish", 1254, -1), + UR(0x0020, "ur", "ur", "Urdu", 1256, -1), + ID(0x0021, "id", "id", "Indonesian", 1252, SUNDAY), + UK(0x0022, "uk", "uk", "Ukrainian", 1251, -1), + BE(0x0023, "be", "be", "Belarusian", 1251, -1), + SL(0x0024, "sl", "sl", "Slovenian", 1250, -1), + ET(0x0025, "et", "et", "Estonian", 1257, -1), + LV(0x0026, "lv", "lv", "Latvian", 1257, -1), + LT(0x0027, "lt", "lt", "Lithuanian", 1257, -1), + TG(0x0028, "tg", "tg", "Tajik", 1251, -1), + FA(0x0029, "fa", "fa", "Persian", 1256, SATURDAY), + VI(0x002A, "vi", "vi", "Vietnamese", 1258, -1), + HY(0x002B, "hy", "hy", "Armenian", 0, -1), + AZ(0x002C, "az", "az", "Azerbaijani", 1254, -1), + EU(0x002D, "eu", "eu", "Basque", 1252, -1), + HSB(0x002E, "hsb", "hsb", "Upper Sorbian", 1252, -1), + MK(0x002F, "mk", "mk", "Macedonian (FYROM)", 1251, -1), + ST(0x0030, "st", "st", "Southern Sotho", 0, -1), + TS(0x0031, "ts", "ts", "Tsonga", 0, SUNDAY), + TN(0x0032, "tn", "tn", "Setswana", 1252, SUNDAY), + VE(0x0033, "ve", "ve", "Venda", 32759, SUNDAY), + XH(0x0034, "xh", "xh", "isiXhosa", 1252, SUNDAY), + ZU(0x0035, "zu", "zu", "isiZulu", 1252, SUNDAY), + AF(0x0036, "af", "af", "Afrikaans", 1252, SUNDAY), + KA(0x0037, "ka", "ka", "Georgian", 0, -1), + FO(0x0038, "fo", "fo", "Faroese", 1252, -1), + HI(0x0039, "hi", "hi", "Hindi", 0, -1), + MT(0x003A, "mt", "mt", "Maltese", 0, SUNDAY), + SE(0x003B, "se", "se", "Sami (Northern)", 1252, -1), + GA(0x003C, "ga", "ga", "Irish", 1252, SUNDAY), + YI(0x003D, "yi", "yi", "Yiddish", 32759, -1), + MS(0x003E, "ms", "ms", "Malay", 1252, -1), + KK(0x003F, "kk", "kk", "Kazakh", 0, -1), + KY(0x0040, "ky", "ky", "Kyrgyz", 1251, -1), + SW(0x0041, "sw", "sw", "Kiswahili", 1252, SUNDAY), + TK(0x0042, "tk", "tk", "Turkmen", 1250, -1), + UZ(0x0043, "uz", "uz", "Uzbek", 1254, -1), + TT(0x0044, "tt", "tt", "Tatar", 1251, -1), + BN(0x0045, "bn", "bn", "Bangla", 0, SUNDAY), + PA(0x0046, "pa", "pa", "Punjabi", 0, -1), + GU(0x0047, "gu", "gu", "Gujarati", 0, -1), + OR(0x0048, "or", "or", "Odia", 0, -1), + TA(0x0049, "ta", "ta", "Tamil", 0, -1), + TE(0x004A, "te", "te", "Telugu", 0, -1), + KN(0x004B, "kn", "kn", "Kannada", 0, -1), + ML(0x004C, "ml", "ml", "Malayalam", 0, SUNDAY), + AS(0x004D, "as", "as", "Assamese", 0, -1), + MR(0x004E, "mr", "mr", "Marathi", 0, -1), + SA(0x004F, "sa", "sa", "Sanskrit", 0, SUNDAY), + MN(0x0050, "mn", "mn", "Mongolian", 1251, -1), + BO(0x0051, "bo", "bo", "Tibetan", 0, -1), + CY(0x0052, "cy", "cy", "Welsh", 1252, -1), + KM(0x0053, "km", "km", "Khmer", 0, SUNDAY), + LO(0x0054, "lo", "lo", "Lao", 0, SUNDAY), + MY(0x0055, "my", "my", "Burmese", 0, SUNDAY), + GL(0x0056, "gl", "gl", "Galician", 1252, -1), + KOK(0x0057, "kok", "kok", "Konkani", 0, -1), + MNI(0x0058, "mni", "mni", "Manipuri", 32759, -1), + SD(0x0059, "sd", "sd", "Sindhi", 1256, -1), + SYR(0x005A, "syr", "syr", "Syriac", 0, SUNDAY), + SI(0x005B, "si", "si", "Sinhala", 0, -1), + CHR(0x005C, "chr", "chr", "Cherokee", 0, SUNDAY), + IU(0x005D, "iu", "iu", "Inuktitut", 1252, SUNDAY), + AM(0x005E, "am", "am", "Amharic", 0, SUNDAY), + TZM(0x005F, "tzm", "tzm", "Tamazight", 1252, -1), + KS(0x0060, "ks", "ks", "Kashmiri", 32759, -1), + NE(0x0061, "ne", "ne", "Nepali", 0, SUNDAY), + FY(0x0062, "fy", "fy", "Frisian", 1252, -1), + PS(0x0063, "ps", "ps", "Pashto", 0, SATURDAY), + FIL(0x0064, "fil", "fil", "Filipino", 1252, SUNDAY), + DV(0x0065, "dv", "dv", "Divehi", 0, SUNDAY), + BIN(0x0066, "bin", "bin", "Edo", 32759, SUNDAY), + FF(0x0067, "ff", "ff", "Fulah", 1252, -1), + HA(0x0068, "ha", "ha", "Hausa", 1252, -1), + IBB(0x0069, "ibb", "ibb", "Ibibio", 32759, SUNDAY), + YO(0x006A, "yo", "yo", "Yoruba", 1252, -1), + QUZ(0x006B, "quz", "quz", "Quechua", 1252, SUNDAY), + NSO(0x006C, "nso", "nso", "Sesotho sa Leboa", 1252, SUNDAY), + BA(0x006D, "ba", "ba", "Bashkir", 1251, -1), + LB(0x006E, "lb", "lb", "Luxembourgish", 1252, -1), + KL(0x006F, "kl", "kl", "Greenlandic", 1252, -1), + IG(0x0070, "ig", "ig", "Igbo", 1252, -1), + KR(0x0071, "kr", "kr", "Kanuri", 32759, SUNDAY), + OM(0x0072, "om", "om", "Oromo", 0, SUNDAY), + TI(0x0073, "ti", "ti", "Tigrinya", 0, -1), + GN(0x0074, "gn", "gn", "Guarani", 1252, SUNDAY), + HAW(0x0075, "haw", "haw", "Hawaiian", 1252, SUNDAY), + LA(0x0076, "la", "la", "Latin", 32759, SUNDAY), + SO(0x0077, "so", "so", "Somali", 0, -1), + II(0x0078, "ii", "ii", "Yi", 0, -1), + PAP(0x0079, "pap", "pap", "Papiamento", 32759, -1), + ARN(0x007A, "arn", "arn", "Mapudungun", 1252, SUNDAY), + INVALID_A(0x007B, "invalid_a", "", "", 32759, -1), + MOH(0x007C, "moh", "moh", "Mohawk", 1252, SUNDAY), + INVALID_B(0x007D, "invalid_b", "", "", 32759, -1), + BR(0x007E, "br", "br", "Breton", 1252, -1), + INVALID_C(0x007F, "invalid_c", "", "", 1252, -1), + UG(0x0080, "ug", "ug", "Uyghur", 1256, -1), + MI(0x0081, "mi", "mi", "Maori", 0, -1), + OC(0x0082, "oc", "oc", "Occitan", 1252, -1), + CO(0x0083, "co", "co", "Corsican", 1252, -1), + GSW(0x0084, "gsw", "gsw", "Alsatian", 1252, -1), + SAH(0x0085, "sah", "sah", "Sakha", 1251, -1), + QUT(0x0086, "qut", "qut", "Guatemala", 1252, -1), + RW(0x0087, "rw", "rw", "Kinyarwanda", 1252, -1), + WO(0x0088, "wo", "wo", "Wolof", 1252, -1), + INVALID_D(0x0089, "invalid_d", "", "", 32759, -1), + INVALID_E(0x008A, "invalid_e", "", "", 32759, -1), + INVALID_F(0x008B, "invalid_f", "", "", 32759, -1), + PRS(0x008C, "prs", "prs", "Dari", 1256, SATURDAY), + INVALID_G(0x008D, "invalid_g", "", "", 32759, -1), + INVALID_H(0x008E, "invalid_h", "", "", 32759, -1), + INVALID_I(0x008F, "invalid_i", "", "", 32759, -1), + INVALID_J(0x0090, "invalid_j", "", "", 32759, -1), + GD(0x0091, "gd", "gd", "Scottish Gaelic", 1252, -1), + KU(0x0092, "ku", "ku", "Central Kurdish", 1256, SUNDAY), + QUC(0x0093, "quc", "quc", "K'iche'", 32759, -1), + AR_SA(0x0401, "ar_sa", "ar-SA", "Arabic (Saudi Arabia)", 1256, SUNDAY), + BG_BG(0x0402, "bg_bg", "bg-BG", "Bulgarian (Bulgaria)", 1251, -1), + CA_ES(0x0403, "ca_es", "ca-ES", "Catalan (Catalan)", 1252, -1), + ZH_TW(0x0404, "zh_tw", "zh-TW", "Chinese (Traditional, Taiwan)", 950, SUNDAY), + CS_CZ(0x0405, "cs_cz", "cs-CZ", "Czech (Czech Republic)", 1250, -1), + DA_DK(0x0406, "da_dk", "da-DK", "Danish (Denmark)", 1252, -1), + DE_DE(0x0407, "de_de", "de-DE", "German (Germany)", 1252, -1), + EL_GR(0x0408, "el_gr", "el-GR", "Greek (Greece)", 1253, -1), + EN_US(0x0409, "en_us", "en-US", "English (United States)", 1252, SUNDAY), + ES_ES_TRADNL(0x040A, "es_es_tradnl", "es-ES-tradnl", "Spanish (Spain,tradnl)", 1252, -1), + FI_FI(0x040B, "fi_fi", "fi-FI", "Finnish (Finland)", 1252, -1), + FR_FR(0x040C, "fr_fr", "fr-FR", "French (France)", 1252, -1), + HE_IL(0x040D, "he_il", "he-IL", "Hebrew (Israel)", 1255, SUNDAY), + HU_HU(0x040E, "hu_hu", "hu-HU", "Hungarian (Hungary)", 1250, -1), + IS_IS(0x040F, "is_is", "is-IS", "Icelandic (Iceland)", 1252, -1), + IT_IT(0x0410, "it_it", "it-IT", "Italian (Italy)", 1252, -1), + JA_JP(0x0411, "ja_jp", "ja-JP", "Japanese (Japan)", 932, SUNDAY), + KO_KR(0x0412, "ko_kr", "ko-KR", "Korean (Korea)", 949, SUNDAY), + NL_NL(0x0413, "nl_nl", "nl-NL", "Dutch (Netherlands)", 1252, -1), + NB_NO(0x0414, "nb_no", "nb-NO", "Norwegian, Bokm\u00E5l (Norway)", 1252, -1), + PL_PL(0x0415, "pl_pl", "pl-PL", "Polish (Poland)", 1250, -1), + PT_BR(0x0416, "pt_br", "pt-BR", "Portuguese (Brazil)", 1252, SUNDAY), + RM_CH(0x0417, "rm_ch", "rm-CH", "Romansh (Switzerland)", 1252, -1), + RO_RO(0x0418, "ro_ro", "ro-RO", "Romanian (Romania)", 1250, -1), + RU_RU(0x0419, "ru_ru", "ru-RU", "Russian (Russia)", 1251, -1), + HR_HR(0x041A, "hr_hr", "hr-HR", "Croatian (Croatia)", 1250, -1), + SK_SK(0x041B, "sk_sk", "sk-SK", "Slovak (Slovakia)", 1250, -1), + SQ_AL(0x041C, "sq_al", "sq-AL", "Albanian (Albania)", 1250, -1), + SV_SE(0x041D, "sv_se", "sv-SE", "Swedish (Sweden)", 1252, -1), + TH_TH(0x041E, "th_th", "th-TH", "Thai (Thailand)", 874, -1), + TR_TR(0x041F, "tr_tr", "tr-TR", "Turkish (Turkey)", 1254, -1), + UR_PK(0x0420, "ur_pk", "ur-PK", "Urdu (Islamic Republic of Pakistan)", 1256, -1), + ID_ID(0x0421, "id_id", "id-ID", "Indonesian (Indonesia)", 1252, SUNDAY), + UK_UA(0x0422, "uk_ua", "uk-UA", "Ukrainian (Ukraine)", 1251, -1), + BE_BY(0x0423, "be_by", "be-BY", "Belarusian (Belarus)", 1251, -1), + SL_SI(0x0424, "sl_si", "sl-SI", "Slovenian (Slovenia)", 1250, -1), + ET_EE(0x0425, "et_ee", "et-EE", "Estonian (Estonia)", 1257, -1), + LV_LV(0x0426, "lv_lv", "lv-LV", "Latvian (Latvia)", 1257, -1), + LT_LT(0x0427, "lt_lt", "lt-LT", "Lithuanian (Lithuania)", 1257, -1), + TG_CYRL_TJ(0x0428, "tg_cyrl_tj", "tg-Cyrl-TJ", "Tajik (Cyrillic, Tajikistan)", 1251, -1), + FA_IR(0x0429, "fa_ir", "fa-IR", "Persian (Iran)", 1256, SATURDAY), + VI_VN(0x042A, "vi_vn", "vi-VN", "Vietnamese (Vietnam)", 1258, -1), + HY_AM(0x042B, "hy_am", "hy-AM", "Armenian (Armenia)", 0, -1), + AZ_LATN_AZ(0x042C, "az_latn_az", "az-Latn-AZ", "Azerbaijani (Latin, Azerbaijan)", 1254, -1), + EU_ES(0x042D, "eu_es", "eu-ES", "Basque (Basque)", 1252, -1), + HSB_DE(0x042E, "hsb_de", "hsb-DE", "Upper Sorbian (Germany)", 1252, -1), + MK_MK(0x042F, "mk_mk", "mk-MK", "Macedonian (Former Yugoslav Republic of Macedonia)", 1251, -1), + ST_ZA(0x0430, "st_za", "st-ZA", "Southern Sotho (South Africa)", 0, -1), + TS_ZA(0x0431, "ts_za", "ts-ZA", "Tsonga (South Africa)", 0, -1), + TN_ZA(0x0432, "tn_za", "tn-ZA", "Setswana (South Africa)", 1252, SUNDAY), + VE_ZA(0x0433, "ve_za", "ve-ZA", "Venda (South Africa)", 32759, SUNDAY), + XH_ZA(0x0434, "xh_za", "xh-ZA", "isiXhosa (South Africa)", 1252, SUNDAY), + ZU_ZA(0x0435, "zu_za", "zu-ZA", "isiZulu (South Africa)", 1252, SUNDAY), + AF_ZA(0x0436, "af_za", "af-ZA", "Afrikaans (South Africa)", 1252, SUNDAY), + KA_GE(0x0437, "ka_ge", "ka-GE", "Georgian (Georgia)", 0, -1), + FO_FO(0x0438, "fo_fo", "fo-FO", "Faroese (Faroe Islands)", 1252, -1), + HI_IN(0x0439, "hi_in", "hi-IN", "Hindi (India)", 0, -1), + MT_MT(0x043A, "mt_mt", "mt-MT", "Maltese (Malta)", 0, SUNDAY), + SE_NO(0x043B, "se_no", "se-NO", "Sami, Northern (Norway)", 1252, -1), + YI_HEBR(0x043D, "yi_hebr", "yi-Hebr", "Yiddish (Hebrew)", 32759, -1), + MS_MY(0x043E, "ms_my", "ms-MY", "Malay (Malaysia)", 1252, -1), + KK_KZ(0x043F, "kk_kz", "kk-KZ", "Kazakh (Kazakhstan)", 0, -1), + KY_KG(0x0440, "ky_kg", "ky-KG", "Kyrgyz (Kyrgyzstan)", 1251, -1), + SW_KE(0x0441, "sw_ke", "sw-KE", "Kiswahili (Kenya)", 1252, SUNDAY), + TK_TM(0x0442, "tk_tm", "tk-TM", "Turkmen (Turkmenistan)", 1250, -1), + UZ_LATN_UZ(0x0443, "uz_latn_uz", "uz-Latn-UZ", "Uzbek (Latin, Uzbekistan)", 1254, -1), + TT_RU(0x0444, "tt_ru", "tt-RU", "Tatar (Russia)", 1251, -1), + BN_IN(0x0445, "bn_in", "bn-IN", "Bangla (India)", 0, -1), + PA_IN(0x0446, "pa_in", "pa-IN", "Punjabi (India)", 0, -1), + GU_IN(0x0447, "gu_in", "gu-IN", "Gujarati (India)", 0, -1), + OR_IN(0x0448, "or_in", "or-IN", "Odia (India)", 0, -1), + TA_IN(0x0449, "ta_in", "ta-IN", "Tamil (India)", 0, -1), + TE_IN(0x044A, "te_in", "te-IN", "Telugu (India)", 0, -1), + KN_IN(0x044B, "kn_in", "kn-IN", "Kannada (India)", 0, -1), + ML_IN(0x044C, "ml_in", "ml-IN", "Malayalam (India)", 0, SUNDAY), + AS_IN(0x044D, "as_in", "as-IN", "Assamese (India)", 0, -1), + MR_IN(0x044E, "mr_in", "mr-IN", "Marathi (India)", 0, -1), + SA_IN(0x044F, "sa_in", "sa-IN", "Sanskrit (India)", 0, SUNDAY), + MN_MN(0x0450, "mn_mn", "mn-MN", "Mongolian (Cyrillic, Mongolia)", 1251, -1), + BO_CN(0x0451, "bo_cn", "bo-CN", "Tibetan (PRC)", 0, -1), + CY_GB(0x0452, "cy_gb", "cy-GB", "Welsh (United Kingdom)", 1252, -1), + KM_KH(0x0453, "km_kh", "km-KH", "Khmer (Cambodia)", 0, SUNDAY), + LO_LA(0x0454, "lo_la", "lo-LA", "Lao (Lao P.D.R.)", 0, SUNDAY), + MY_MM(0x0455, "my_mm", "my-MM", "Burmese (Myanmar)", 0, SUNDAY), + GL_ES(0x0456, "gl_es", "gl-ES", "Galician (Galician)", 1252, -1), + KOK_IN(0x0457, "kok_in", "kok-IN", "Konkani (India)", 0, -1), + MNI_IN(0x0458, "mni_in", "mni-IN", "Manipuri (India)", 32759, -1), + SD_DEVA_IN(0x0459, "sd_deva_in", "sd-Deva-IN", "Sindhi (Devanagari, India)", 32759, SUNDAY), + SYR_SY(0x045A, "syr_sy", "syr-SY", "Syriac (Syria)", 0, SUNDAY), + SI_LK(0x045B, "si_lk", "si-LK", "Sinhala (Sri Lanka)", 0, -1), + CHR_CHER_US(0x045C, "chr_cher_us", "chr-Cher-US", "Cherokee (Cherokee)", 0, SUNDAY), + IU_CANS_CA(0x045D, "iu_cans_ca", "iu-Cans-CA", "Inuktitut (Syllabics, Canada)", 0, SUNDAY), + AM_ET(0x045E, "am_et", "am-ET", "Amharic (Ethiopia)", 0, SUNDAY), + TZM_ARAB_MA(0x045F, "tzm_arab_ma", "tzm-Arab-MA", "Central Atlas Tamazight (Arabic, Morocco)", 32759, SATURDAY), + KS_ARAB(0x0460, "ks_arab", "ks-Arab", "Kashmiri (Perso-Arabic)", 32759, SUNDAY), + NE_NP(0x0461, "ne_np", "ne-NP", "Nepali (Nepal)", 0, SUNDAY), + FY_NL(0x0462, "fy_nl", "fy-NL", "Frisian (Netherlands)", 1252, -1), + PS_AF(0x0463, "ps_af", "ps-AF", "Pashto (Afghanistan)", 0, SATURDAY), + FIL_PH(0x0464, "fil_ph", "fil-PH", "Filipino (Philippines)", 1252, SUNDAY), + DV_MV(0x0465, "dv_mv", "dv-MV", "Divehi (Maldives)", 0, SUNDAY), + BIN_NG(0x0466, "bin_ng", "bin-NG", "Edo (Nigeria)", 32759, SUNDAY), + FUV_NG(0x0467, "fuv_ng", "fuv-NG", "fuv (Nigeria)", 32759, -1), + HA_LATN_NG(0x0468, "ha_latn_ng", "ha-Latn-NG", "Hausa (Latin, Nigeria)", 1252, -1), + IBB_NG(0x0469, "ibb_ng", "ibb-NG", "Ibibio (Nigeria)", 32759, SUNDAY), + YO_NG(0x046A, "yo_ng", "yo-NG", "Yoruba (Nigeria)", 1252, -1), + QUZ_BO(0x046B, "quz_bo", "quz-BO", "Quechua (Bolivia)", 1252, SUNDAY), + NSO_ZA(0x046C, "nso_za", "nso-ZA", "Sesotho sa Leboa (South Africa)", 1252, SUNDAY), + BA_RU(0x046D, "ba_ru", "ba-RU", "Bashkir (Russia)", 1251, -1), + LB_LU(0x046E, "lb_lu", "lb-LU", "Luxembourgish (Luxembourg)", 1252, -1), + KL_GL(0x046F, "kl_gl", "kl-GL", "Greenlandic (Greenland)", 1252, -1), + IG_NG(0x0470, "ig_ng", "ig-NG", "Igbo (Nigeria)", 1252, -1), + KR_NG(0x0471, "kr_ng", "kr-NG", "Kanuri (Nigeria)", 32759, SUNDAY), + OM_ET(0x0472, "om_et", "om-ET", "Oromo (Ethiopia)", 0, SUNDAY), + TI_ET(0x0473, "ti_et", "ti-ET", "Tigrinya (Ethiopia)", 0, SUNDAY), + GN_PY(0x0474, "gn_py", "gn-PY", "Guarani (Paraguay)", 1252, SUNDAY), + HAW_US(0x0475, "haw_us", "haw-US", "Hawaiian (United States)", 1252, SUNDAY), + LA_LATN(0x0476, "la_latn", "la-Latn", "Latin (Latin)", 32759, -1), + SO_SO(0x0477, "so_so", "so-SO", "Somali (Somalia)", 0, -1), + II_CN(0x0478, "ii_cn", "ii-CN", "Yi (PRC)", 0, -1), + PAP_029(0x0479, "pap_029", "pap-029", "Papiamento (Caribbean)", 32759, -1), + ARN_CL(0x047A, "arn_cl", "arn-CL", "Mapudungun (Chile)", 1252, SUNDAY), + MOH_CA(0x047C, "moh_ca", "moh-CA", "Mohawk (Mohawk)", 1252, SUNDAY), + BR_FR(0x047E, "br_fr", "br-FR", "Breton (France)", 1252, -1), + UG_CN(0x0480, "ug_cn", "ug-CN", "Uyghur (PRC)", 1256, -1), + MI_NZ(0x0481, "mi_nz", "mi-NZ", "Maori (New Zealand)", 0, -1), + OC_FR(0x0482, "oc_fr", "oc-FR", "Occitan (France)", 1252, -1), + CO_FR(0x0483, "co_fr", "co-FR", "Corsican (France)", 1252, -1), + GSW_FR(0x0484, "gsw_fr", "gsw-FR", "Alsatian (France)", 1252, -1), + SAH_RU(0x0485, "sah_ru", "sah-RU", "Sakha (Russia)", 1251, -1), + QUT_GT(0x0486, "qut_gt", "qut-GT", "qut (Guatemala)", 1252, -1), + RW_RW(0x0487, "rw_rw", "rw-RW", "Kinyarwanda (Rwanda)", 1252, -1), + WO_SN(0x0488, "wo_sn", "wo-SN", "Wolof (Senegal)", 1252, -1), + PRS_AF(0x048C, "prs_af", "prs-AF", "Dari (Afghanistan)", 1256, SATURDAY), + PLT_MG(0x048D, "plt_mg", "plt-MG", "plt (Madagascar)", 32759, -1), + ZH_YUE_HK(0x048E, "zh_yue_hk", "yue-HK", "yue (Hong Kong)", 32759, -1), + TDD_TALE_CN(0x048F, "tdd_tale_cn", "tdd-Tale-CN", "tdd (Tai Le,China)", 32759, -1), + KHB_TALU_CN(0x0490, "khb_talu_cn", "khb-Talu-CN", "khb (New Tai Lue,China)", 32759, -1), + GD_GB(0x0491, "gd_gb", "gd-GB", "Scottish Gaelic (United Kingdom)", 1252, -1), + KU_ARAB_IQ(0x0492, "ku_arab_iq", "ku-Arab-IQ", "Central Kurdish (Iraq)", 1256, SUNDAY), + QUC_CO(0x0493, "quc_co", "quc-CO", "quc (Colombia)", 32759, -1), + QPS_PLOC(0x0501, "qps_ploc", "qps-Ploc", "qps (Ploc)", 1250, -1), + QPS_PLOCA(0x05FE, "qps_ploca", "qps-ploca", "qps (ploca)", 932, -1), + AR_IQ(0x0801, "ar_iq", "ar-IQ", "Arabic (Iraq)", 1256, SATURDAY), + CA_ES_VALENCIA(0x0803, "ca_es_valencia", "ca-ES-valencia", "Valencian (Spain)", 1252, -1), + ZH_CN(0x0804, "zh_cn", "zh-CN", "Chinese (Simplified, PRC)", 936, -1), + DE_CH(0x0807, "de_ch", "de-CH", "German (Switzerland)", 1252, -1), + EN_GB(0x0809, "en_gb", "en-GB", "English (United Kingdom)", 1252, -1), + ES_MX(0x080A, "es_mx", "es-MX", "Spanish (Mexico)", 1252, SUNDAY), + FR_BE(0x080C, "fr_be", "fr-BE", "French (Belgium)", 1252, -1), + IT_CH(0x0810, "it_ch", "it-CH", "Italian (Switzerland)", 1252, -1), + JA_PLOC_JP(0x0811, "ja_ploc_jp", "ja-Ploc-JP", "Japanese (Ploc,Japan)", 32759, -1), + NL_BE(0x0813, "nl_be", "nl-BE", "Dutch (Belgium)", 1252, -1), + NN_NO(0x0814, "nn_no", "nn-NO", "Norwegian, Nynorsk (Norway)", 1252, -1), + PT_PT(0x0816, "pt_pt", "pt-PT", "Portuguese (Portugal)", 1252, SUNDAY), + RO_MD(0x0818, "ro_md", "ro-MD", "Romanian (Moldova)", 0, -1), + RU_MD(0x0819, "ru_md", "ru-MD", "Russian (Moldova)", 32759, -1), + SR_LATN_CS(0x081A, "sr_latn_cs", "sr-Latn-CS", "Serbian (Latin,Serbia and Montenegro)", 1250, -1), + SV_FI(0x081D, "sv_fi", "sv-FI", "Swedish (Finland)", 1252, -1), + UR_IN(0x0820, "ur_in", "ur-IN", "Urdu (India)", 0, -1), + INVALID_K(0x0827, "invalid_k", "", "", 32759, -1), + AZ_CYRL_AZ(0x082C, "az_cyrl_az", "az-Cyrl-AZ", "Azerbaijani (Cyrillic, Azerbaijan)", 1251, -1), + DSB_DE(0x082E, "dsb_de", "dsb-DE", "Lower Sorbian (Germany)", 1252, -1), + TN_BW(0x0832, "tn_bw", "tn-BW", "Setswana (Botswana)", 1252, SUNDAY), + SE_SE(0x083B, "se_se", "se-SE", "Sami, Northern (Sweden)", 1252, -1), + GA_IE(0x083C, "ga_ie", "ga-IE", "Irish (Ireland)", 1252, SUNDAY), + MS_BN(0x083E, "ms_bn", "ms-BN", "Malay (Brunei Darussalam)", 1252, -1), + UZ_CYRL_UZ(0x0843, "uz_cyrl_uz", "uz-Cyrl-UZ", "Uzbek (Cyrillic, Uzbekistan)", 1251, -1), + BN_BD(0x0845, "bn_bd", "bn-BD", "Bangla (Bangladesh)", 0, SUNDAY), + PA_ARAB_PK(0x0846, "pa_arab_pk", "pa-Arab-PK", "Punjabi (Islamic Republic of Pakistan)", 1256, -1), + TA_LK(0x0849, "ta_lk", "ta-LK", "Tamil (Sri Lanka)", 0, -1), + MN_MONG_CN(0x0850, "mn_mong_cn", "mn-Mong-CN", "Mongolian (Traditional Mongolian, PRC)", 0, -1), + BO_BT(0x0851, "bo_bt", "bo-BT", "Tibetan (Bhutan)", 32759, -1), + SD_ARAB_PK(0x0859, "sd_arab_pk", "sd-Arab-PK", "Sindhi (Islamic Republic of Pakistan)", 1256, -1), + IU_LATN_CA(0x085D, "iu_latn_ca", "iu-Latn-CA", "Inuktitut (Latin, Canada)", 1252, SUNDAY), + TZM_LATN_DZ(0x085F, "tzm_latn_dz", "tzm-Latn-DZ", "Tamazight (Latin, Algeria)", 1252, -1), + KS_DEVA(0x0860, "ks_deva", "ks-Deva", "Kashmiri (Devanagari)", 32759, -1), + NE_IN(0x0861, "ne_in", "ne-IN", "Nepali (India)", 0, SUNDAY), + FF_LATN_SN(0x0867, "ff_latn_sn", "ff-Latn-SN", "Fulah (Latin, Senegal)", 1252, -1), + QUZ_EC(0x086B, "quz_ec", "quz-EC", "Quechua (Ecuador)", 1252, SUNDAY), + TI_ER(0x0873, "ti_er", "ti-ER", "Tigrinya (Eritrea)", 0, -1), + QPS_PLOCM(0x09FF, "qps_plocm", "qps-plocm", "qps (plocm)", 1256, -1), + AR_EG(0x0C01, "ar_eg", "ar-EG", "Arabic (Egypt)", 1256, SATURDAY), + ZH_HK(0x0C04, "zh_hk", "zh-HK", "Chinese (Traditional, Hong Kong S.A.R.)", 950, SUNDAY), + DE_AT(0x0C07, "de_at", "de-AT", "German (Austria)", 1252, -1), + EN_AU(0x0C09, "en_au", "en-AU", "English (Australia)", 1252, -1), + ES_ES(0x0C0A, "es_es", "es-ES", "Spanish (Spain)", 1252, -1), + FR_CA(0x0C0C, "fr_ca", "fr-CA", "French (Canada)", 1252, SUNDAY), + SR_CYRL_CS(0x0C1A, "sr_cyrl_cs", "sr-Cyrl-CS", "Serbian (Cyrillic,Serbia and Montenegro)", 1251, -1), + SE_FI(0x0C3B, "se_fi", "se-FI", "Sami, Northern (Finland)", 1252, -1), + MN_MONG_MN(0x0C50, "mn_mong_mn", "mn-Mong-MN", "Mongolian (Traditional Mongolian, Mongolia)", 0, -1), + DZ_BT(0x0C51, "dz_bt", "dz-BT", "Dzongkha (Bhutan)", 0, SUNDAY), + TMZ_MA(0x0C5F, "tmz_ma", "tmz-MA", "tmz (Morocco)", 32759, -1), + QUZ_PE(0x0C6b, "quz_pe", "quz-PE", "Quechua (Peru)", 1252, -1), + AR_LY(0x1001, "ar_ly", "ar-LY", "Arabic (Libya)", 1256, SATURDAY), + ZH_SG(0x1004, "zh_sg", "zh-SG", "Chinese (Simplified, Singapore)", 936, SUNDAY), + DE_LU(0x1007, "de_lu", "de-LU", "German (Luxembourg)", 1252, -1), + EN_CA(0x1009, "en_ca", "en-CA", "English (Canada)", 1252, SUNDAY), + ES_GT(0x100A, "es_gt", "es-GT", "Spanish (Guatemala)", 1252, SUNDAY), + FR_CH(0x100C, "fr_ch", "fr-CH", "French (Switzerland)", 1252, -1), + HR_BA(0x101A, "hr_ba", "hr-BA", "Croatian (Latin, Bosnia and Herzegovina)", 1250, -1), + SMJ_NO(0x103B, "smj_no", "smj-NO", "Sami, Lule (Norway)", 1252, -1), + TZM_TFNG_MA(0x105F, "tzm_tfng_ma", "tzm-Tfng-MA", "Central Atlas Tamazight (Tifinagh, Morocco)", 0, SATURDAY), + AR_DZ(0x1401, "ar_dz", "ar-DZ", "Arabic (Algeria)", 1256, SATURDAY), + ZH_MO(0x1404, "zh_mo", "zh-MO", "Chinese (Traditional, Macao S.A.R.)", 950, SUNDAY), + DE_LI(0x1407, "de_li", "de-LI", "German (Liechtenstein)", 1252, -1), + EN_NZ(0x1409, "en_nz", "en-NZ", "English (New Zealand)", 1252, SUNDAY), + ES_CR(0x140A, "es_cr", "es-CR", "Spanish (Costa Rica)", 1252, -1), + FR_LU(0x140C, "fr_lu", "fr-LU", "French (Luxembourg)", 1252, -1), + BS_LATN_BA(0x141A, "bs_latn_ba", "bs-Latn-BA", "Bosnian (Latin, Bosnia and Herzegovina)", 1250, -1), + SMJ_SE(0x143B, "smj_se", "smj-SE", "Sami, Lule (Sweden)", 1252, -1), + AR_MA(0x1801, "ar_ma", "ar-MA", "Arabic (Morocco)", 1256, -1), + EN_IE(0x1809, "en_ie", "en-IE", "English (Ireland)", 1252, SUNDAY), + ES_PA(0x180A, "es_pa", "es-PA", "Spanish (Panama)", 1252, SUNDAY), + FR_MC(0x180C, "fr_mc", "fr-MC", "French (Monaco)", 1252, -1), + SR_LATN_BA(0x181A, "sr_latn_ba", "sr-Latn-BA", "Serbian (Latin, Bosnia and Herzegovina)", 1250, -1), + SMA_NO(0x183B, "sma_no", "sma-NO", "Sami, Southern (Norway)", 1252, -1), + AR_TN(0x1C01, "ar_tn", "ar-TN", "Arabic (Tunisia)", 1256, -1), + EN_ZA(0x1C09, "en_za", "en-ZA", "English (South Africa)", 1252, SUNDAY), + ES_DO(0x1C0A, "es_do", "es-DO", "Spanish (Dominican Republic)", 1252, SUNDAY), + INVALID_L(0x1C0C, "invalid_l", "", "", 32759, -1), + SR_CYRL_BA(0x1C1A, "sr_cyrl_ba", "sr-Cyrl-BA", "Serbian (Cyrillic, Bosnia and Herzegovina)", 1251, -1), + SMA_SE(0x1C3B, "sma_se", "sma-SE", "Sami, Southern (Sweden)", 1252, -1), + AR_OM(0x2001, "ar_om", "ar-OM", "Arabic (Oman)", 1256, SUNDAY), + INVALID_M(0x2008, "invalid_m", "", "", 32759, -1), + EN_JM(0x2009, "en_jm", "en-JM", "English (Jamaica)", 1252, SUNDAY), + ES_VE(0x200A, "es_ve", "es-VE", "Spanish (Venezuela)", 1252, -1), + FR_RE(0x200C, "fr_re", "fr-RE", "French (Reunion)", 0, -1), + BS_CYRL_BA(0x201A, "bs_cyrl_ba", "bs-Cyrl-BA", "Bosnian (Cyrillic, Bosnia and Herzegovina)", 1251, -1), + SMS_FI(0x203B, "sms_fi", "sms-FI", "Sami, Skolt (Finland)", 1252, -1), + AR_YE(0x2401, "ar_ye", "ar-YE", "Arabic (Yemen)", 1256, SATURDAY), + EN_029(0x2409, "en_029", "en-029", "English (Caribbean)", 1252, -1), + ES_CO(0x240A, "es_co", "es-CO", "Spanish (Colombia)", 1252, SUNDAY), + FR_CD(0x240C, "fr_cd", "fr-CD", "French (Congo DRC)", 0, -1), + SR_LATN_RS(0x241A, "sr_latn_rs", "sr-Latn-RS", "Serbian (Latin, Serbia)", 1250, -1), + SMN_FI(0x243B, "smn_fi", "smn-FI", "Sami, Inari (Finland)", 1252, -1), + AR_SY(0x2801, "ar_sy", "ar-SY", "Arabic (Syria)", 1256, SATURDAY), + EN_BZ(0x2809, "en_bz", "en-BZ", "English (Belize)", 1252, SUNDAY), + ES_PE(0x280A, "es_pe", "es-PE", "Spanish (Peru)", 1252, SUNDAY), + FR_SN(0x280C, "fr_sn", "fr-SN", "French (Senegal)", 0, -1), + SR_CYRL_RS(0x281A, "sr_cyrl_rs", "sr-Cyrl-RS", "Serbian (Cyrillic, Serbia)", 1251, -1), + AR_JO(0x2C01, "ar_jo", "ar-JO", "Arabic (Jordan)", 1256, SATURDAY), + EN_TT(0x2C09, "en_tt", "en-TT", "English (Trinidad and Tobago)", 1252, SUNDAY), + ES_AR(0x2C0A, "es_ar", "es-AR", "Spanish (Argentina)", 1252, SUNDAY), + FR_CM(0x2C0C, "fr_cm", "fr-CM", "French (Cameroon)", 0, -1), + SR_LATN_ME(0x2C1A, "sr_latn_me", "sr-Latn-ME", "Serbian (Latin, Montenegro)", 1250, -1), + AR_LB(0x3001, "ar_lb", "ar-LB", "Arabic (Lebanon)", 1256, -1), + EN_ZW(0x3009, "en_zw", "en-ZW", "English (Zimbabwe)", 1252, SUNDAY), + ES_EC(0x300A, "es_ec", "es-EC", "Spanish (Ecuador)", 1252, -1), + FR_CI(0x300C, "fr_ci", "fr-CI", "French (C\u00F4te d\u2019Ivoire)", 0, -1), + SR_CYRL_ME(0x301A, "sr_cyrl_me", "sr-Cyrl-ME", "Serbian (Cyrillic, Montenegro)", 1251, -1), + AR_KW(0x3401, "ar_kw", "ar-KW", "Arabic (Kuwait)", 1256, SATURDAY), + EN_PH(0x3409, "en_ph", "en-PH", "English (Philippines)", 1252, SUNDAY), + ES_CL(0x340A, "es_cl", "es-CL", "Spanish (Chile)", 1252, -1), + FR_ML(0x340C, "fr_ml", "fr-ML", "French (Mali)", 0, -1), + AR_AE(0x3801, "ar_ae", "ar-AE", "Arabic (U.A.E.)", 1256, SATURDAY), + EN_ID(0x3809, "en_id", "en-ID", "English (Indonesia)", 32759, SUNDAY), + ES_UY(0x380A, "es_uy", "es-UY", "Spanish (Uruguay)", 1252, -1), + FR_MA(0x380C, "fr_ma", "fr-MA", "French (Morocco)", 0, SATURDAY), + AR_BH(0x3c01, "ar_bh", "ar-BH", "Arabic (Bahrain)", 1256, SATURDAY), + EN_HK(0x3c09, "en_hk", "en-HK", "English (Hong Kong SAR)", 0, SUNDAY), + ES_PY(0x3c0A, "es_py", "es-PY", "Spanish (Paraguay)", 1252, SUNDAY), + FR_HT(0x3c0C, "fr_ht", "fr-HT", "French (Haiti)", 0, -1), + AR_QA(0x4001, "ar_qa", "ar-QA", "Arabic (Qatar)", 1256, SATURDAY), + EN_IN(0x4009, "en_in", "en-IN", "English (India)", 1252, -1), + ES_BO(0x400A, "es_bo", "es-BO", "Spanish (Bolivia)", 1252, -1), + AR_PLOC_SA(0x4401, "ar_ploc_sa", "ar-Ploc-SA", "Arabic (Ploc,Saudi Arabia)", 32759, -1), + EN_MY(0x4409, "en_my", "en-MY", "English (Malaysia)", 1252, SUNDAY), + ES_SV(0x440A, "es_sv", "es-SV", "Spanish (El Salvador)", 1252, SUNDAY), + AR_145(0x4801, "ar_145", "ar-145", "Arabic (Western Asia)", 32759, -1), + EN_SG(0x4809, "en_sg", "en-SG", "English (Singapore)", 1252, SUNDAY), + ES_HN(0x480A, "es_hn", "es-HN", "Spanish (Honduras)", 1252, SUNDAY), + EN_AE(0x4C09, "en_ae", "en-AE", "English (United Arab Emirates)", 32759, -1), + ES_NI(0x4C0A, "es_ni", "es-NI", "Spanish (Nicaragua)", 1252, SUNDAY), + EN_BH(0x5009, "en_bh", "en-BH", "English (Bahrain)", 32759, -1), + ES_PR(0x500A, "es_pr", "es-PR", "Spanish (Puerto Rico)", 1252, SUNDAY), + EN_EG(0x5409, "en_eg", "en-EG", "English (Egypt)", 32759, -1), + ES_US(0x540A, "es_us", "es-US", "Spanish (United States)", 1252, SUNDAY), + EN_JO(0x5809, "en_jo", "en-JO", "English (Jordan)", 32759, -1), + ES_419(0x580A, "es_419", "es-419", "Spanish (Latin America)", 0, -1), + EN_KW(0x5C09, "en_kw", "en-KW", "English (Kuwait)", 32759, -1), + ES_CU(0x5C0A, "es_cu", "es-CU", "Spanish (Cuba)", 0, -1), + EN_TR(0x6009, "en_tr", "en-TR", "English (Turkey)", 32759, -1), + EN_YE(0x6409, "en_ye", "en-YE", "English (Yemen)", 32759, -1), + BS_CYRL(0x641A, "bs_cyrl", "bs-Cyrl", "Bosnian (Cyrillic)", 1251, -1), + BS_LATN(0x681A, "bs_latn", "bs-Latn", "Bosnian (Latin)", 1250, -1), + SR_CYRL(0x6C1A, "sr_cyrl", "sr-Cyrl", "Serbian (Cyrillic)", 1251, -1), + SR_LATN(0x701A, "sr_latn", "sr-Latn", "Serbian (Latin)", 1250, -1), + SMN(0x703B, "smn", "smn", "Sami (Inari)", 1252, -1), + AZ_CYRL(0x742C, "az_cyrl", "az-Cyrl", "Azerbaijani (Cyrillic)", 1251, -1), + SMS(0x743B, "sms", "sms", "Sami (Skolt)", 1252, -1), + ZH(0x7804, "zh", "zh", "Chinese", 936, -1), + NN(0x7814, "nn", "nn", "Norwegian (Nynorsk)", 1252, -1), + BS(0x781A, "bs", "bs", "Bosnian", 1250, -1), + AZ_LATN(0x782C, "az_latn", "az-Latn", "Azerbaijani (Latin)", 1254, -1), + SMA(0x783B, "sma", "sma", "Sami (Southern)", 1252, -1), + UZ_CYRL(0x7843, "uz_cyrl", "uz-Cyrl", "Uzbek (Cyrillic)", 1251, -1), + MN_CYRL(0x7850, "mn_cyrl", "mn-Cyrl", "Mongolian (Cyrillic)", 1251, -1), + IU_CANS(0x785D, "iu_cans", "iu-Cans", "Inuktitut (Syllabics)", 0, SUNDAY), + TZM_TFNG(0x785F, "tzm_tfng", "tzm-Tfng", "Tamazight (Tifinagh)", 0, -1), + ZH_HANT(0x7C04, "zh_hant", "zh-Hant", "Chinese (Traditional)", 950, SUNDAY), + NB(0x7C14, "nb", "nb", "Norwegian (Bokm\u00E5l)", 1252, -1), + SR(0x7C1A, "sr", "sr", "Serbian", 1250, -1), + TG_CYRL(0x7C28, "tg_cyrl", "tg-Cyrl", "Tajik (Cyrillic)", 1251, -1), + DSB(0x7C2E, "dsb", "dsb", "Lower Sorbian", 1252, -1), + SMJ(0x7C3B, "smj", "smj", "Sami (Lule)", 1252, -1), + UZ_LATN(0x7C43, "uz_latn", "uz-Latn", "Uzbek (Latin)", 1254, -1), + PA_ARAB(0x7C46, "pa_arab", "pa-Arab", "Punjabi (Arabic)", 1256, -1), + MN_MONG(0x7C50, "mn_mong", "mn-Mong", "Mongolian (Traditional Mongolian)", 0, -1), + SD_ARAB(0x7C59, "sd_arab", "sd-Arab", "Sindhi (Arabic)", 1256, -1), + CHR_CHER(0x7C5C, "chr_cher", "chr-Cher", "Cherokee (Cherokee)", 0, SUNDAY), + IU_LATN(0x7C5D, "iu_latn", "iu-Latn", "Inuktitut (Latin)", 1252, SUNDAY), + TZM_LATN(0x7C5F, "tzm_latn", "tzm-Latn", "Tamazight (Latin)", 1252, -1), + FF_LATN(0x7C67, "ff_latn", "ff-Latn", "Fulah (Latin)", 1252, -1), + HA_LATN(0x7C68, "ha_latn", "ha-Latn", "Hausa (Latin)", 1252, -1), + KU_ARAB(0x7C92, "ku_arab", "ku-Arab", "Central Kurdish (Arabic)", 1256, -1), + INVALID_N(0xF2EE, "invalid_n", "", "", 0, -1), + INVALID_O(0xEEEE, "invalid_o", "", "", 0, -1), + ; + + private final int lcid; + private final String windowsId; + private final String languageTag; + private final String description; + private final int defaultCodepage; + private final int firstWeekday; + + private static final Map languageTagLookup = + Stream.of(values()).filter(LocaleID::isValid).collect(Collectors.toMap(LocaleID::getLanguageTag, Function.identity())); + + private static final Map lcidLookup = + Stream.of(values()).collect(Collectors.toMap(LocaleID::getLcid, Function.identity())); + + LocaleID(int lcid, String windowsId, String languageTag, String description, int defaultCodepage, int firstWeekday) { + this.lcid = lcid; + this.windowsId = windowsId; + this.languageTag = languageTag; + this.description = description; + this.defaultCodepage = defaultCodepage; + this.firstWeekday = (firstWeekday == -1) ? Calendar.MONDAY : firstWeekday; + } + + public int getLcid() { + return lcid; + } + + public String getWindowsId() { + return windowsId; + } + + public String getLanguageTag() { + return languageTag; + } + + public String getDescription() { + return description; + } + + public int getDefaultCodepage() { + return defaultCodepage; + } + + public int getFirstWeekday() { + return firstWeekday; + } + + private boolean isValid() { + return !languageTag.isEmpty(); + } + + /** + * Lookup via the Java language tag / locale display name + * + * @param languageTag the locale display name + * @return if found the LocaleId, otherwise {@code null} + */ + public static LocaleID lookupByLanguageTag(String languageTag) { + return languageTagLookup.get(languageTag); + } + + /** + * Lookup via the Windows LCID + * + * @param lcid the language code id (LCID) + * @return if found the LocaleId, otherwise {@code null} + */ + public static LocaleID lookupByLcid(int lcid) { + return lcidLookup.get(lcid); + } + +} diff --git a/src/java/org/apache/poi/util/LocaleUtil.java b/src/java/org/apache/poi/util/LocaleUtil.java index c440fc96a4..5e6619645c 100644 --- a/src/java/org/apache/poi/util/LocaleUtil.java +++ b/src/java/org/apache/poi/util/LocaleUtil.java @@ -14,7 +14,7 @@ See the License for the specific language governing permissions and limitations under the License. ==================================================================== */ - + package org.apache.poi.util; @@ -30,7 +30,7 @@ import java.util.TimeZone; * the locale/time zone specific handling of certain office documents - * maybe for different time zones / locales ... - shouldn't affect * other java components. - * + * * The settings are saved in a {@link java.lang.ThreadLocal}, * so they only apply to the current thread and can't be set globally. */ @@ -38,13 +38,15 @@ public final class LocaleUtil { private LocaleUtil() { // no instances of this class } - + + + /** * Excel doesn't store TimeZone information in the file, so if in doubt, * use UTC to perform calculations */ public static final TimeZone TIMEZONE_UTC = TimeZone.getTimeZone("UTC"); - + /** * Default encoding for unknown byte encodings of native files * (at least it's better than to rely on a platform dependent encoding @@ -54,7 +56,7 @@ public final class LocaleUtil { private static final ThreadLocal userTimeZone = new ThreadLocal<>(); private static final ThreadLocal userLocale = new ThreadLocal<>(); - + /** * As time zone information is not stored in any format, it can be * set before any date calculations take place. @@ -65,7 +67,7 @@ public final class LocaleUtil { public static void setUserTimeZone(TimeZone timezone) { userTimeZone.set(timezone); } - + /** * @return the time zone which is used for date calculations. If not set, returns {@link TimeZone#getDefault()}. */ @@ -77,7 +79,7 @@ public final class LocaleUtil { /** * Clear the thread-local user time zone. - */ + */ public static void resetUserTimeZone() { userTimeZone.remove(); } @@ -89,7 +91,7 @@ public final class LocaleUtil { public static void setUserLocale(Locale locale) { userLocale.set(locale); } - + /** * @return the default user locale. If not set, returns {@link Locale#getDefault()}. */ @@ -139,14 +141,14 @@ public final class LocaleUtil { cal.clear(Calendar.MILLISECOND); return cal; } - + /** * @return a calendar for the user locale and time zone */ public static Calendar getLocaleCalendar(TimeZone timeZone) { return Calendar.getInstance(timeZone, getUserLocale()); } - + /** * Decode the language ID from LCID value * @@ -154,468 +156,10 @@ public final class LocaleUtil { * @return the locale/language ID */ public static String getLocaleFromLCID(int lcid) { - int languageId = lcid & 0xFFFF; - switch (languageId) { - case 0x0001: return "ar"; - case 0x0002: return "bg"; - case 0x0003: return "ca"; - case 0x0004: return "zh-Hans"; - case 0x0005: return "cs"; - case 0x0006: return "da"; - case 0x0007: return "de"; - case 0x0008: return "el"; - case 0x0009: return "en"; - case 0x000a: return "es"; - case 0x000b: return "fi"; - case 0x000c: return "fr"; - case 0x000d: return "he"; - case 0x000e: return "hu"; - case 0x000f: return "is"; - case 0x0010: return "it"; - case 0x0011: return "ja"; - case 0x0012: return "ko"; - case 0x0013: return "nl"; - case 0x0014: return "no"; - case 0x0015: return "pl"; - case 0x0016: return "pt"; - case 0x0017: return "rm"; - case 0x0018: return "ro"; - case 0x0019: return "ru"; - case 0x001a: return "bs, hr, or sr"; - case 0x001b: return "sk"; - case 0x001c: return "sq"; - case 0x001d: return "sv"; - case 0x001e: return "th"; - case 0x001f: return "tr"; - case 0x0020: return "ur"; - case 0x0021: return "id"; - case 0x0022: return "uk"; - case 0x0023: return "be"; - case 0x0024: return "sl"; - case 0x0025: return "et"; - case 0x0026: return "lv"; - case 0x0027: return "lt"; - case 0x0028: return "tg"; - case 0x0029: return "fa"; - case 0x002a: return "vi"; - case 0x002b: return "hy"; - case 0x002c: return "az"; - case 0x002d: return "eu"; - case 0x002e: return "dsb or hsb"; - case 0x002f: return "mk"; - case 0x0030: return "st"; // reserved - case 0x0031: return "ts"; // reserved - case 0x0032: return "tn"; - case 0x0033: return "ve"; // reserved - case 0x0034: return "xh"; - case 0x0035: return "zu"; - case 0x0036: return "af"; - case 0x0037: return "ka"; - case 0x0038: return "fo"; - case 0x0039: return "hi"; - case 0x003a: return "mt"; - case 0x003b: return "se"; - case 0x003c: return "ga"; - case 0x003d: return "yi"; // reserved - case 0x003e: return "ms"; - case 0x003f: return "kk"; - case 0x0040: return "ky"; - case 0x0041: return "sw"; - case 0x0042: return "tk"; - case 0x0043: return "uz"; - case 0x0044: return "tt"; - case 0x0045: return "bn"; - case 0x0046: return "pa"; - case 0x0047: return "gu"; - case 0x0048: return "or"; - case 0x0049: return "ta"; - case 0x004a: return "te"; - case 0x004b: return "kn"; - case 0x004c: return "ml"; - case 0x004d: return "as"; - case 0x004e: return "mr"; - case 0x004f: return "sa"; - case 0x0050: return "mn"; - case 0x0051: return "bo"; - case 0x0052: return "cy"; - case 0x0053: return "km"; - case 0x0054: return "lo"; - case 0x0055: return "my"; // reserved - case 0x0056: return "gl"; - case 0x0057: return "kok"; - case 0x0058: return "mni"; // reserved - case 0x0059: return "sd"; - case 0x005a: return "syr"; - case 0x005b: return "si"; - case 0x005c: return "chr"; - case 0x005d: return "iu"; - case 0x005e: return "am"; - case 0x005f: return "tzm"; - case 0x0060: return "ks"; // reserved - case 0x0061: return "ne"; - case 0x0062: return "fy"; - case 0x0063: return "ps"; - case 0x0064: return "fil"; - case 0x0065: return "dv"; - case 0x0066: return "bin"; // reserved - case 0x0067: return "ff"; - case 0x0068: return "ha"; - case 0x0069: return "ibb"; // reserved - case 0x006a: return "yo"; - case 0x006b: return "quz"; - case 0x006c: return "nso"; - case 0x006d: return "ba"; - case 0x006e: return "lb"; - case 0x006f: return "kl"; - case 0x0070: return "ig"; - case 0x0071: return "kr"; // reserved - case 0x0072: return "om"; // reserved - case 0x0073: return "ti"; - case 0x0074: return "gn"; // reserved - case 0x0075: return "haw"; - case 0x0076: return "la"; // reserved - case 0x0077: return "so"; // reserved - case 0x0078: return "ii"; - case 0x0079: return "pap"; // reserved - case 0x007a: return "arn"; - case 0x007b: return "invalid"; // Neither defined nor reserved - case 0x007c: return "moh"; - case 0x007d: return "invalid"; // Neither defined nor reserved - case 0x007e: return "br"; - case 0x007f: return "invalid"; // Reserved or invariant locale behavior - case 0x0080: return "ug"; - case 0x0081: return "mi"; - case 0x0082: return "oc"; - case 0x0083: return "co"; - case 0x0084: return "gsw"; - case 0x0085: return "sah"; - case 0x0086: return "qut"; - case 0x0087: return "rw"; - case 0x0088: return "wo"; - case 0x0089: return "invalid"; // Neither defined nor reserved - case 0x008a: return "invalid"; // Neither defined nor reserved - case 0x008b: return "invalid"; // Neither defined nor reserved - case 0x008c: return "prs"; - case 0x008d: return "invalid"; // Neither defined nor reserved - case 0x008e: return "invalid"; // Neither defined nor reserved - case 0x008f: return "invalid"; // Neither defined nor reserved - case 0x0090: return "invalid"; // Neither defined nor reserved - case 0x0091: return "gd"; - case 0x0092: return "ku"; - case 0x0093: return "quc"; // reserved - case 0x0401: return "ar-SA"; - case 0x0402: return "bg-BG"; - case 0x0403: return "ca-ES"; - case 0x0404: return "zh-TW"; - case 0x0405: return "cs-CZ"; - case 0x0406: return "da-DK"; - case 0x0407: return "de-DE"; - case 0x0408: return "el-GR"; - case 0x0409: return "en-US"; - case 0x040a: return "es-ES_tradnl"; - case 0x040b: return "fi-FI"; - case 0x040c: return "fr-FR"; - case 0x040d: return "he-IL"; - case 0x040e: return "hu-HU"; - case 0x040f: return "is-IS"; - case 0x0410: return "it-IT"; - case 0x0411: return "ja-JP"; - case 0x0412: return "ko-KR"; - case 0x0413: return "nl-NL"; - case 0x0414: return "nb-NO"; - case 0x0415: return "pl-PL"; - case 0x0416: return "pt-BR"; - case 0x0417: return "rm-CH"; - case 0x0418: return "ro-RO"; - case 0x0419: return "ru-RU"; - case 0x041a: return "hr-HR"; - case 0x041b: return "sk-SK"; - case 0x041c: return "sq-AL"; - case 0x041d: return "sv-SE"; - case 0x041e: return "th-TH"; - case 0x041f: return "tr-TR"; - case 0x0420: return "ur-PK"; - case 0x0421: return "id-ID"; - case 0x0422: return "uk-UA"; - case 0x0423: return "be-BY"; - case 0x0424: return "sl-SI"; - case 0x0425: return "et-EE"; - case 0x0426: return "lv-LV"; - case 0x0427: return "lt-LT"; - case 0x0428: return "tg-Cyrl-TJ"; - case 0x0429: return "fa-IR"; - case 0x042a: return "vi-VN"; - case 0x042b: return "hy-AM"; - case 0x042c: return "az-Latn-AZ"; - case 0x042d: return "eu-ES"; - case 0x042e: return "hsb-DE"; - case 0x042f: return "mk-MK"; - case 0x0430: return "st-ZA"; // reserved - case 0x0431: return "ts-ZA"; // reserved - case 0x0432: return "tn-ZA"; - case 0x0433: return "ve-ZA"; // reserved - case 0x0434: return "xh-ZA"; - case 0x0435: return "zu-ZA"; - case 0x0436: return "af-ZA"; - case 0x0437: return "ka-GE"; - case 0x0438: return "fo-FO"; - case 0x0439: return "hi-IN"; - case 0x043a: return "mt-MT"; - case 0x043b: return "se-NO"; - case 0x043d: return "yi-Hebr"; // reserved - case 0x043e: return "ms-MY"; - case 0x043f: return "kk-KZ"; - case 0x0440: return "ky-KG"; - case 0x0441: return "sw-KE"; - case 0x0442: return "tk-TM"; - case 0x0443: return "uz-Latn-UZ"; - case 0x0444: return "tt-RU"; - case 0x0445: return "bn-IN"; - case 0x0446: return "pa-IN"; - case 0x0447: return "gu-IN"; - case 0x0448: return "or-IN"; - case 0x0449: return "ta-IN"; - case 0x044a: return "te-IN"; - case 0x044b: return "kn-IN"; - case 0x044c: return "ml-IN"; - case 0x044d: return "as-IN"; - case 0x044e: return "mr-IN"; - case 0x044f: return "sa-IN"; - case 0x0450: return "mn-MN"; - case 0x0451: return "bo-CN"; - case 0x0452: return "cy-GB"; - case 0x0453: return "km-KH"; - case 0x0454: return "lo-LA"; - case 0x0455: return "my-MM"; // reserved - case 0x0456: return "gl-ES"; - case 0x0457: return "kok-IN"; - case 0x0458: return "mni-IN"; // reserved - case 0x0459: return "sd-Deva-IN"; // reserved - case 0x045a: return "syr-SY"; - case 0x045b: return "si-LK"; - case 0x045c: return "chr-Cher-US"; - case 0x045d: return "iu-Cans-CA"; - case 0x045e: return "am-ET"; - case 0x045f: return "tzm-Arab-MA"; // reserved - case 0x0460: return "ks-Arab"; // reserved - case 0x0461: return "ne-NP"; - case 0x0462: return "fy-NL"; - case 0x0463: return "ps-AF"; - case 0x0464: return "fil-PH"; - case 0x0465: return "dv-MV"; - case 0x0466: return "bin-NG"; // reserved - case 0x0467: return "fuv-NG"; // reserved - case 0x0468: return "ha-Latn-NG"; - case 0x0469: return "ibb-NG"; // reserved - case 0x046a: return "yo-NG"; - case 0x046b: return "quz-BO"; - case 0x046c: return "nso-ZA"; - case 0x046d: return "ba-RU"; - case 0x046e: return "lb-LU"; - case 0x046f: return "kl-GL"; - case 0x0470: return "ig-NG"; - case 0x0471: return "kr-NG"; // reserved - case 0x0472: return "om-Ethi-ET"; // reserved - case 0x0473: return "ti-ET"; - case 0x0474: return "gn-PY"; // reserved - case 0x0475: return "haw-US"; - case 0x0476: return "la-Latn"; // reserved - case 0x0477: return "so-SO"; // reserved - case 0x0478: return "ii-CN"; - case 0x0479: return "pap-x029"; // reserved - case 0x047a: return "arn-CL"; - case 0x047c: return "moh-CA"; - case 0x047e: return "br-FR"; - case 0x0480: return "ug-CN"; - case 0x0481: return "mi-NZ"; - case 0x0482: return "oc-FR"; - case 0x0483: return "co-FR"; - case 0x0484: return "gsw-FR"; - case 0x0485: return "sah-RU"; - case 0x0486: return "qut-GT"; - case 0x0487: return "rw-RW"; - case 0x0488: return "wo-SN"; - case 0x048c: return "prs-AF"; - case 0x048d: return "plt-MG"; // reserved - case 0x048e: return "zh-yue-HK"; // reserved - case 0x048f: return "tdd-Tale-CN"; // reserved - case 0x0490: return "khb-Talu-CN"; // reserved - case 0x0491: return "gd-GB"; - case 0x0492: return "ku-Arab-IQ"; - case 0x0493: return "quc-CO"; // reserved - case 0x0501: return "qps-ploc"; - case 0x05fe: return "qps-ploca"; - case 0x0801: return "ar-IQ"; - case 0x0803: return "ca-ES-valencia"; - case 0x0804: return "zh-CN"; - case 0x0807: return "de-CH"; - case 0x0809: return "en-GB"; - case 0x080a: return "es-MX"; - case 0x080c: return "fr-BE"; - case 0x0810: return "it-CH"; - case 0x0811: return "ja-Ploc-JP"; // reserved - case 0x0813: return "nl-BE"; - case 0x0814: return "nn-NO"; - case 0x0816: return "pt-PT"; - case 0x0818: return "ro-MO"; // reserved - case 0x0819: return "ru-MO"; // reserved - case 0x081a: return "sr-Latn-CS"; - case 0x081d: return "sv-FI"; - case 0x0820: return "ur-IN"; // reserved - case 0x0827: return "invalid"; // Neither defined nor reserved - case 0x082c: return "az-Cyrl-AZ"; - case 0x082e: return "dsb-DE"; - case 0x0832: return "tn-BW"; - case 0x083b: return "se-SE"; - case 0x083c: return "ga-IE"; - case 0x083e: return "ms-BN"; - case 0x0843: return "uz-Cyrl-UZ"; - case 0x0845: return "bn-BD"; - case 0x0846: return "pa-Arab-PK"; - case 0x0849: return "ta-LK"; - case 0x0850: return "mn-Mong-CN"; - case 0x0851: return "bo-BT"; // reserved - case 0x0859: return "sd-Arab-PK"; - case 0x085d: return "iu-Latn-CA"; - case 0x085f: return "tzm-Latn-DZ"; - case 0x0860: return "ks-Deva"; // reserved - case 0x0861: return "ne-IN"; // reserved - case 0x0867: return "ff-Latn-SN"; - case 0x086b: return "quz-EC"; - case 0x0873: return "ti-ER"; - case 0x09ff: return "qps-plocm"; - case 0x0c01: return "ar-EG"; - case 0x0c04: return "zh-HK"; - case 0x0c07: return "de-AT"; - case 0x0c09: return "en-AU"; - case 0x0c0a: return "es-ES"; - case 0x0c0c: return "fr-CA"; - case 0x0c1a: return "sr-Cyrl-CS"; - case 0x0c3b: return "se-FI"; - case 0x0c5f: return "tmz-MA"; // reserved - case 0x0c6b: return "quz-PE"; - case 0x1001: return "ar-LY"; - case 0x1004: return "zh-SG"; - case 0x1007: return "de-LU"; - case 0x1009: return "en-CA"; - case 0x100a: return "es-GT"; - case 0x100c: return "fr-CH"; - case 0x101a: return "hr-BA"; - case 0x103b: return "smj-NO"; - case 0x1401: return "ar-DZ"; - case 0x1404: return "zh-MO"; - case 0x1407: return "de-LI"; - case 0x1409: return "en-NZ"; - case 0x140a: return "es-CR"; - case 0x140c: return "fr-LU"; - case 0x141a: return "bs-Latn-BA"; - case 0x143b: return "smj-SE"; - case 0x1801: return "ar-MA"; - case 0x1809: return "en-IE"; - case 0x180a: return "es-PA"; - case 0x180c: return "fr-MC"; - case 0x181a: return "sr-Latn-BA"; - case 0x183b: return "sma-NO"; - case 0x1c01: return "ar-TN"; - case 0x1c09: return "en-ZA"; - case 0x1c0a: return "es-DO"; - case 0x1c0c: return "invalid"; // Neither defined nor reserved - case 0x1c1a: return "sr-Cyrl-BA"; - case 0x1c3b: return "sma-SE"; - case 0x2001: return "ar-OM"; - case 0x2008: return "invalid"; // Neither defined nor reserved - case 0x2009: return "en-JM"; - case 0x200a: return "es-VE"; - case 0x200c: return "fr-RE"; // reserved - case 0x201a: return "bs-Cyrl-BA"; - case 0x203b: return "sms-FI"; - case 0x2401: return "ar-YE"; - case 0x2409: return "en-029"; - case 0x240a: return "es-CO"; - case 0x240c: return "fr-CG"; // reserved - case 0x241a: return "sr-Latn-RS"; - case 0x243b: return "smn-FI"; - case 0x2801: return "ar-SY"; - case 0x2809: return "en-BZ"; - case 0x280a: return "es-PE"; - case 0x280c: return "fr-SN"; // reserved - case 0x281a: return "sr-Cyrl-RS"; - case 0x2c01: return "ar-JO"; - case 0x2c09: return "en-TT"; - case 0x2c0a: return "es-AR"; - case 0x2c0c: return "fr-CM"; // reserved - case 0x2c1a: return "sr-Latn-ME"; - case 0x3001: return "ar-LB"; - case 0x3009: return "en-ZW"; - case 0x300a: return "es-EC"; - case 0x300c: return "fr-CI"; // reserved - case 0x301a: return "sr-Cyrl-ME"; - case 0x3401: return "ar-KW"; - case 0x3409: return "en-PH"; - case 0x340a: return "es-CL"; - case 0x340c: return "fr-ML"; // reserved - case 0x3801: return "ar-AE"; - case 0x3809: return "en-ID"; // reserved - case 0x380a: return "es-UY"; - case 0x380c: return "fr-MA"; // reserved - case 0x3c01: return "ar-BH"; - case 0x3c09: return "en-HK"; // reserved - case 0x3c0a: return "es-PY"; - case 0x3c0c: return "fr-HT"; // reserved - case 0x4001: return "ar-QA"; - case 0x4009: return "en-IN"; - case 0x400a: return "es-BO"; - case 0x4401: return "ar-Ploc-SA"; // reserved - case 0x4409: return "en-MY"; - case 0x440a: return "es-SV"; - case 0x4801: return "ar-145"; // reserved - case 0x4809: return "en-SG"; - case 0x480a: return "es-HN"; - case 0x4c09: return "en-AE"; // reserved - case 0x4c0a: return "es-NI"; - case 0x5009: return "en-BH"; // reserved - case 0x500a: return "es-PR"; - case 0x5409: return "en-EG"; // reserved - case 0x540a: return "es-US"; - case 0x5809: return "en-JO"; // reserved - case 0x5c09: return "en-KW"; // reserved - case 0x6009: return "en-TR"; // reserved - case 0x6409: return "en-YE"; // reserved - case 0x641a: return "bs-Cyrl"; - case 0x681a: return "bs-Latn"; - case 0x6c1a: return "sr-Cyrl"; - case 0x701a: return "sr-Latn"; - case 0x703b: return "smn"; - case 0x742c: return "az-Cyrl"; - case 0x743b: return "sms"; - case 0x7804: return "zh"; - case 0x7814: return "nn"; - case 0x781a: return "bs"; - case 0x782c: return "az-Latn"; - case 0x783b: return "sma"; - case 0x7843: return "uz-Cyrl"; - case 0x7850: return "mn-Cyrl"; - case 0x785d: return "iu-Cans"; - case 0x7c04: return "zh-Hant"; - case 0x7c14: return "nb"; - case 0x7c1a: return "sr"; - case 0x7c28: return "tg-Cyrl"; - case 0x7c2e: return "dsb"; - case 0x7c3b: return "smj"; - case 0x7c43: return "uz-Latn"; - case 0x7c46: return "pa-Arab"; - case 0x7c50: return "mn-Mong"; - case 0x7c59: return "sd-Arab"; - case 0x7c5c: return "chr-Cher"; - case 0x7c5d: return "iu-Latn"; - case 0x7c5f: return "tzm-Latn"; - case 0x7c67: return "ff-Latn"; - case 0x7c68: return "ha-Latn"; - case 0x7c92: return "ku-Arab"; - default: return "invalid"; - } + LocaleID lid = LocaleID.lookupByLcid(lcid & 0xFFFF); + return (lid == null) ? "invalid" : lid.getLanguageTag(); } - + /** * Get default code page from LCID value * @@ -623,466 +167,8 @@ public final class LocaleUtil { * @return the default code page */ public static int getDefaultCodePageFromLCID(int lcid) { - int languageId = lcid & 0xFFFF; - switch (languageId) { - case 0x0001: return 1256; - case 0x0002: return 1251; - case 0x0003: return 1252; - case 0x0004: return 936; - case 0x0005: return 1250; - case 0x0006: return 1252; - case 0x0007: return 1252; - case 0x0008: return 1253; - case 0x0009: return 1252; - case 0x000a: return 1252; - case 0x000b: return 1252; - case 0x000c: return 1252; - case 0x000d: return 1255; - case 0x000e: return 1250; - case 0x000f: return 1252; - case 0x0010: return 1252; - case 0x0011: return 932; - case 0x0012: return 949; - case 0x0013: return 1252; - case 0x0014: return 1252; - case 0x0015: return 1250; - case 0x0016: return 1252; - case 0x0017: return 1252; - case 0x0018: return 1250; - case 0x0019: return 1251; - case 0x001a: return 1250; - case 0x001b: return 1250; - case 0x001c: return 1250; - case 0x001d: return 1252; - case 0x001e: return 874; - case 0x001f: return 1254; - case 0x0020: return 1256; - case 0x0021: return 1252; - case 0x0022: return 1251; - case 0x0023: return 1251; - case 0x0024: return 1250; - case 0x0025: return 1257; - case 0x0026: return 1257; - case 0x0027: return 1257; - case 0x0028: return 1251; - case 0x0029: return 1256; - case 0x002a: return 1258; - case 0x002b: return 0; - case 0x002c: return 1254; - case 0x002d: return 1252; - case 0x002e: return 1252; - case 0x002f: return 1251; - case 0x0030: return 0; - case 0x0031: return 0; - case 0x0032: return 1252; - case 0x0033: return 32759; - case 0x0034: return 1252; - case 0x0035: return 1252; - case 0x0036: return 1252; - case 0x0037: return 0; - case 0x0038: return 1252; - case 0x0039: return 0; - case 0x003a: return 0; - case 0x003b: return 1252; - case 0x003c: return 1252; - case 0x003d: return 32759; - case 0x003e: return 1252; - case 0x003f: return 0; - case 0x0040: return 1251; - case 0x0041: return 1252; - case 0x0042: return 1250; - case 0x0043: return 1254; - case 0x0044: return 1251; - case 0x0045: return 0; - case 0x0046: return 0; - case 0x0047: return 0; - case 0x0048: return 0; - case 0x0049: return 0; - case 0x004a: return 0; - case 0x004b: return 0; - case 0x004c: return 0; - case 0x004d: return 0; - case 0x004e: return 0; - case 0x004f: return 0; - case 0x0050: return 1251; - case 0x0051: return 0; - case 0x0052: return 1252; - case 0x0053: return 0; - case 0x0054: return 0; - case 0x0055: return 0; - case 0x0056: return 1252; - case 0x0057: return 0; - case 0x0058: return 32759; - case 0x0059: return 1256; - case 0x005a: return 0; - case 0x005b: return 0; - case 0x005c: return 0; - case 0x005d: return 1252; - case 0x005e: return 0; - case 0x005f: return 1252; - case 0x0060: return 32759; - case 0x0061: return 0; - case 0x0062: return 1252; - case 0x0063: return 0; - case 0x0064: return 1252; - case 0x0065: return 0; - case 0x0066: return 32759; - case 0x0067: return 1252; - case 0x0068: return 1252; - case 0x0069: return 32759; - case 0x006a: return 1252; - case 0x006b: return 1252; - case 0x006c: return 1252; - case 0x006d: return 1251; - case 0x006e: return 1252; - case 0x006f: return 1252; - case 0x0070: return 1252; - case 0x0071: return 32759; - case 0x0072: return 0; - case 0x0073: return 0; - case 0x0074: return 1252; - case 0x0075: return 1252; - case 0x0076: return 32759; - case 0x0077: return 0; - case 0x0078: return 0; - case 0x0079: return 32759; - case 0x007a: return 1252; - case 0x007b: return 32759; - case 0x007c: return 1252; - case 0x007d: return 32759; - case 0x007e: return 1252; - case 0x007f: return 1252; - case 0x0080: return 1256; - case 0x0081: return 0; - case 0x0082: return 1252; - case 0x0083: return 1252; - case 0x0084: return 1252; - case 0x0085: return 1251; - case 0x0086: return 1252; - case 0x0087: return 1252; - case 0x0088: return 1252; - case 0x0089: return 32759; - case 0x008a: return 32759; - case 0x008b: return 32759; - case 0x008c: return 1256; - case 0x008d: return 32759; - case 0x008e: return 32759; - case 0x008f: return 32759; - case 0x0090: return 32759; - case 0x0091: return 1252; - case 0x0092: return 1256; - case 0x0093: return 32759; - case 0x0401: return 1256; - case 0x0402: return 1251; - case 0x0403: return 1252; - case 0x0404: return 950; - case 0x0405: return 1250; - case 0x0406: return 1252; - case 0x0407: return 1252; - case 0x0408: return 1253; - case 0x0409: return 1252; - case 0x040a: return 1252; - case 0x040b: return 1252; - case 0x040c: return 1252; - case 0x040d: return 1255; - case 0x040e: return 1250; - case 0x040f: return 1252; - case 0x0410: return 1252; - case 0x0411: return 932; - case 0x0412: return 949; - case 0x0413: return 1252; - case 0x0414: return 1252; - case 0x0415: return 1250; - case 0x0416: return 1252; - case 0x0417: return 1252; - case 0x0418: return 1250; - case 0x0419: return 1251; - case 0x041a: return 1250; - case 0x041b: return 1250; - case 0x041c: return 1250; - case 0x041d: return 1252; - case 0x041e: return 874; - case 0x041f: return 1254; - case 0x0420: return 1256; - case 0x0421: return 1252; - case 0x0422: return 1251; - case 0x0423: return 1251; - case 0x0424: return 1250; - case 0x0425: return 1257; - case 0x0426: return 1257; - case 0x0427: return 1257; - case 0x0428: return 1251; - case 0x0429: return 1256; - case 0x042a: return 1258; - case 0x042b: return 0; - case 0x042c: return 1254; - case 0x042d: return 1252; - case 0x042e: return 1252; - case 0x042f: return 1251; - case 0x0430: return 0; - case 0x0431: return 0; - case 0x0432: return 1252; - case 0x0433: return 32759; - case 0x0434: return 1252; - case 0x0435: return 1252; - case 0x0436: return 1252; - case 0x0437: return 0; - case 0x0438: return 1252; - case 0x0439: return 0; - case 0x043a: return 0; - case 0x043b: return 1252; - case 0x043d: return 32759; - case 0x043e: return 1252; - case 0x043f: return 0; - case 0x0440: return 1251; - case 0x0441: return 1252; - case 0x0442: return 1250; - case 0x0443: return 1254; - case 0x0444: return 1251; - case 0x0445: return 0; - case 0x0446: return 0; - case 0x0447: return 0; - case 0x0448: return 0; - case 0x0449: return 0; - case 0x044a: return 0; - case 0x044b: return 0; - case 0x044c: return 0; - case 0x044d: return 0; - case 0x044e: return 0; - case 0x044f: return 0; - case 0x0450: return 1251; - case 0x0451: return 0; - case 0x0452: return 1252; - case 0x0453: return 0; - case 0x0454: return 0; - case 0x0455: return 0; - case 0x0456: return 1252; - case 0x0457: return 0; - case 0x0458: return 32759; - case 0x0459: return 32759; - case 0x045a: return 0; - case 0x045b: return 0; - case 0x045c: return 0; - case 0x045d: return 0; - case 0x045e: return 0; - case 0x045f: return 32759; - case 0x0460: return 32759; - case 0x0461: return 0; - case 0x0462: return 1252; - case 0x0463: return 0; - case 0x0464: return 1252; - case 0x0465: return 0; - case 0x0466: return 32759; - case 0x0467: return 32759; - case 0x0468: return 1252; - case 0x0469: return 32759; - case 0x046a: return 1252; - case 0x046b: return 1252; - case 0x046c: return 1252; - case 0x046d: return 1251; - case 0x046e: return 1252; - case 0x046f: return 1252; - case 0x0470: return 1252; - case 0x0471: return 32759; - case 0x0472: return 0; - case 0x0473: return 0; - case 0x0474: return 1252; - case 0x0475: return 1252; - case 0x0476: return 32759; - case 0x0477: return 0; - case 0x0478: return 0; - case 0x0479: return 32759; - case 0x047a: return 1252; - case 0x047c: return 1252; - case 0x047e: return 1252; - case 0x0480: return 1256; - case 0x0481: return 0; - case 0x0482: return 1252; - case 0x0483: return 1252; - case 0x0484: return 1252; - case 0x0485: return 1251; - case 0x0486: return 1252; - case 0x0487: return 1252; - case 0x0488: return 1252; - case 0x048c: return 1256; - case 0x048d: return 32759; - case 0x048e: return 32759; - case 0x048f: return 32759; - case 0x0490: return 32759; - case 0x0491: return 1252; - case 0x0492: return 1256; - case 0x0493: return 32759; - case 0x0501: return 1250; - case 0x05fe: return 932; - case 0x0801: return 1256; - case 0x0803: return 1252; - case 0x0804: return 936; - case 0x0807: return 1252; - case 0x0809: return 1252; - case 0x080a: return 1252; - case 0x080c: return 1252; - case 0x0810: return 1252; - case 0x0811: return 32759; - case 0x0813: return 1252; - case 0x0814: return 1252; - case 0x0816: return 1252; - case 0x0818: return 0; - case 0x0819: return 32759; - case 0x081a: return 1250; - case 0x081d: return 1252; - case 0x0820: return 0; - case 0x0827: return 32759; - case 0x082c: return 1251; - case 0x082e: return 1252; - case 0x0832: return 1252; - case 0x083b: return 1252; - case 0x083c: return 1252; - case 0x083e: return 1252; - case 0x0843: return 1251; - case 0x0845: return 0; - case 0x0846: return 1256; - case 0x0849: return 0; - case 0x0850: return 0; - case 0x0851: return 32759; - case 0x0859: return 1256; - case 0x085d: return 1252; - case 0x085f: return 1252; - case 0x0860: return 32759; - case 0x0861: return 0; - case 0x0867: return 1252; - case 0x086b: return 1252; - case 0x0873: return 0; - case 0x09ff: return 1256; - case 0x0c01: return 1256; - case 0x0c04: return 950; - case 0x0c07: return 1252; - case 0x0c09: return 1252; - case 0x0c0a: return 1252; - case 0x0c0c: return 1252; - case 0x0c1a: return 1251; - case 0x0c3b: return 1252; - case 0x0c5f: return 32759; - case 0x0c6b: return 1252; - case 0x1001: return 1256; - case 0x1004: return 936; - case 0x1007: return 1252; - case 0x1009: return 1252; - case 0x100a: return 1252; - case 0x100c: return 1252; - case 0x101a: return 1250; - case 0x103b: return 1252; - case 0x1401: return 1256; - case 0x1404: return 950; - case 0x1407: return 1252; - case 0x1409: return 1252; - case 0x140a: return 1252; - case 0x140c: return 1252; - case 0x141a: return 1250; - case 0x143b: return 1252; - case 0x1801: return 1256; - case 0x1809: return 1252; - case 0x180a: return 1252; - case 0x180c: return 1252; - case 0x181a: return 1250; - case 0x183b: return 1252; - case 0x1c01: return 1256; - case 0x1c09: return 1252; - case 0x1c0a: return 1252; - case 0x1c0c: return 32759; - case 0x1c1a: return 1251; - case 0x1c3b: return 1252; - case 0x2001: return 1256; - case 0x2008: return 32759; - case 0x2009: return 1252; - case 0x200a: return 1252; - case 0x200c: return 0; - case 0x201a: return 1251; - case 0x203b: return 1252; - case 0x2401: return 1256; - case 0x2409: return 1252; - case 0x240a: return 1252; - case 0x240c: return 0; - case 0x241a: return 1250; - case 0x243b: return 1252; - case 0x2801: return 1256; - case 0x2809: return 1252; - case 0x280a: return 1252; - case 0x280c: return 0; - case 0x281a: return 1251; - case 0x2c01: return 1256; - case 0x2c09: return 1252; - case 0x2c0a: return 1252; - case 0x2c0c: return 0; - case 0x2c1a: return 1250; - case 0x3001: return 1256; - case 0x3009: return 1252; - case 0x300a: return 1252; - case 0x300c: return 0; - case 0x301a: return 1251; - case 0x3401: return 1256; - case 0x3409: return 1252; - case 0x340a: return 1252; - case 0x340c: return 0; - case 0x3801: return 1256; - case 0x3809: return 32759; - case 0x380a: return 1252; - case 0x380c: return 0; - case 0x3c01: return 1256; - case 0x3c09: return 0; - case 0x3c0a: return 1252; - case 0x3c0c: return 0; - case 0x4001: return 1256; - case 0x4009: return 1252; - case 0x400a: return 1252; - case 0x4401: return 32759; - case 0x4409: return 1252; - case 0x440a: return 1252; - case 0x4801: return 32759; - case 0x4809: return 1252; - case 0x480a: return 1252; - case 0x4c09: return 32759; - case 0x4c0a: return 1252; - case 0x5009: return 32759; - case 0x500a: return 1252; - case 0x5409: return 32759; - case 0x540a: return 1252; - case 0x5809: return 32759; - case 0x5c09: return 32759; - case 0x6009: return 32759; - case 0x6409: return 32759; - case 0x641a: return 1251; - case 0x681a: return 1250; - case 0x6c1a: return 1251; - case 0x701a: return 1250; - case 0x703b: return 1252; - case 0x742c: return 1251; - case 0x743b: return 1252; - case 0x7804: return 936; - case 0x7814: return 1252; - case 0x781a: return 1250; - case 0x782c: return 1254; - case 0x783b: return 1252; - case 0x7843: return 1251; - case 0x7850: return 1251; - case 0x785d: return 0; - case 0x7c04: return 950; - case 0x7c14: return 1252; - case 0x7c1a: return 1250; - case 0x7c28: return 1251; - case 0x7c2e: return 1252; - case 0x7c3b: return 1252; - case 0x7c43: return 1254; - case 0x7c46: return 1256; - case 0x7c50: return 0; - case 0x7c59: return 1256; - case 0x7c5c: return 0; - case 0x7c5d: return 1252; - case 0x7c5f: return 1252; - case 0x7c67: return 1252; - case 0x7c68: return 1252; - case 0x7c92: return 1256; - default: return 0; - } + LocaleID lid = LocaleID.lookupByLcid(lcid & 0xFFFF); + return (lid == null) ? 0 : lid.getDefaultCodepage(); } } diff --git a/src/testcases/org/apache/poi/ss/util/TestDateFormatConverter.java b/src/testcases/org/apache/poi/ss/util/TestDateFormatConverter.java index 811a59701b..23a3164138 100644 --- a/src/testcases/org/apache/poi/ss/util/TestDateFormatConverter.java +++ b/src/testcases/org/apache/poi/ss/util/TestDateFormatConverter.java @@ -19,6 +19,11 @@ package org.apache.poi.ss.util; +import static org.junit.Assert.assertEquals; +import static org.junit.Assert.assertNotEquals; +import static org.junit.Assert.assertNotNull; +import static org.junit.Assert.assertTrue; + import java.io.File; import java.io.FileOutputStream; import java.text.DateFormat; @@ -26,6 +31,11 @@ import java.text.SimpleDateFormat; import java.util.Arrays; import java.util.Date; import java.util.Locale; +import java.util.Set; +import java.util.regex.Matcher; +import java.util.regex.Pattern; +import java.util.stream.Collectors; +import java.util.stream.Stream; import org.apache.poi.hssf.usermodel.HSSFWorkbook; import org.apache.poi.ss.usermodel.Cell; @@ -34,8 +44,8 @@ import org.apache.poi.ss.usermodel.DataFormat; import org.apache.poi.ss.usermodel.Row; import org.apache.poi.ss.usermodel.Sheet; import org.apache.poi.ss.usermodel.Workbook; +import org.apache.poi.util.LocaleID; import org.apache.poi.util.TempFile; -import org.junit.Ignore; import org.junit.Test; public final class TestDateFormatConverter { @@ -148,4 +158,45 @@ public final class TestDateFormatConverter { public void testJDK11MyLocale() { DateFormat.getDateTimeInstance(DateFormat.DEFAULT, DateFormat.DEFAULT, Locale.forLanguageTag("my")); } + + @Test + public void testAllKnownLocales() { + Pattern p = Pattern.compile("\\[\\$-(\\p{XDigit}+)]"); + + Set blacklist = Stream.of( + "sd-Deva", "tzm-Arab", "fuv", "plt", "yue", "tdd-Tale", "tdd", + "khb-Talu", "khb", "qps", "ja-Ploc", "dz", "tmz", "ar-Ploc" + ).collect(Collectors.toSet()); + + for (LocaleID lid : LocaleID.values()) { + final String langTag = lid.getLanguageTag(); + + if (langTag.isEmpty() || lid.getWindowsId().startsWith("invalid")) { + continue; + } + + // test all from variant to parent locales + String cmpTag = (langTag.indexOf('_') > 0) ? langTag.replace('_','-') : langTag; + for (int idx = langTag.length(); idx > 0; idx = cmpTag.lastIndexOf('-', idx-1)) { + final String partTag = langTag.substring(0, idx); + + Locale loc = Locale.forLanguageTag(partTag); + assertNotNull("Invalid language tag: "+partTag, loc); + + if (blacklist.contains(partTag)) { + continue; + } + + String prefix = DateFormatConverter.getPrefixForLocale(loc); + assertNotNull("Prefix not found - language tag: "+partTag, prefix); + assertNotEquals("Prefix not found - language tag: "+partTag,"", prefix); + Matcher m = p.matcher(prefix); + assertTrue("Invalid prefix: "+prefix, m.matches()); + + LocaleID partLid = LocaleID.lookupByLanguageTag(partTag); + assertNotNull("LocaleID not found for part: "+partTag, partLid); + assertEquals(partLid.getLcid(), Integer.parseInt(m.group(1), 16)); + } + } + } } -- 2.39.5