LocaleUtils.java

  1. /*
  2.  * Licensed to the Apache Software Foundation (ASF) under one or more
  3.  * contributor license agreements.  See the NOTICE file distributed with
  4.  * this work for additional information regarding copyright ownership.
  5.  * The ASF licenses this file to You under the Apache License, Version 2.0
  6.  * (the "License"); you may not use this file except in compliance with
  7.  * the License.  You may obtain a copy of the License at
  8.  *
  9.  *      http://www.apache.org/licenses/LICENSE-2.0
  10.  *
  11.  * Unless required by applicable law or agreed to in writing, software
  12.  * distributed under the License is distributed on an "AS IS" BASIS,
  13.  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14.  * See the License for the specific language governing permissions and
  15.  * limitations under the License.
  16.  */
  17. package org.apache.commons.lang3;

  18. import java.util.ArrayList;
  19. import java.util.Arrays;
  20. import java.util.Collections;
  21. import java.util.HashSet;
  22. import java.util.List;
  23. import java.util.Locale;
  24. import java.util.Set;
  25. import java.util.concurrent.ConcurrentHashMap;
  26. import java.util.concurrent.ConcurrentMap;
  27. import java.util.function.Predicate;
  28. import java.util.stream.Collectors;

  29. /**
  30.  * Operations to assist when working with a {@link Locale}.
  31.  *
  32.  * <p>This class tries to handle {@code null} input gracefully.
  33.  * An exception will not be thrown for a {@code null} input.
  34.  * Each method documents its behavior in more detail.</p>
  35.  *
  36.  * @since 2.2
  37.  */
  38. public class LocaleUtils {

  39.     // class to avoid synchronization (Init on demand)
  40.     static class SyncAvoid {
  41.         /** Unmodifiable list of available locales. */
  42.         private static final List<Locale> AVAILABLE_LOCALE_LIST;
  43.         /** Unmodifiable set of available locales. */
  44.         private static final Set<Locale> AVAILABLE_LOCALE_SET;

  45.         static {
  46.             final List<Locale> list = new ArrayList<>(Arrays.asList(Locale.getAvailableLocales()));  // extra safe
  47.             AVAILABLE_LOCALE_LIST = Collections.unmodifiableList(list);
  48.             AVAILABLE_LOCALE_SET = Collections.unmodifiableSet(new HashSet<>(list));
  49.         }
  50.     }

  51.     /**
  52.      * The underscore character {@code '}{@value}{@code '}.
  53.      */
  54.     private static final char UNDERSCORE = '_';

  55.     /**
  56.      * The undetermined language {@value}.
  57.      */
  58.     private static final String UNDETERMINED = "und";

  59.     /**
  60.      * The dash character {@code '}{@value}{@code '}.
  61.      */
  62.     private static final char DASH = '-';

  63.     /**
  64.      * Concurrent map of language locales by country.
  65.      */
  66.     private static final ConcurrentMap<String, List<Locale>> cLanguagesByCountry = new ConcurrentHashMap<>();

  67.     /**
  68.      * Concurrent map of country locales by language.
  69.      */
  70.     private static final ConcurrentMap<String, List<Locale>> cCountriesByLanguage = new ConcurrentHashMap<>();

  71.     /**
  72.      * Obtains an unmodifiable list of installed locales.
  73.      *
  74.      * <p>This method is a wrapper around {@link Locale#getAvailableLocales()}.
  75.      * It is more efficient, as the JDK method must create a new array each
  76.      * time it is called.</p>
  77.      *
  78.      * @return the unmodifiable list of available locales
  79.      */
  80.     public static List<Locale> availableLocaleList() {
  81.         return SyncAvoid.AVAILABLE_LOCALE_LIST;
  82.     }

  83.     private static List<Locale> availableLocaleList(final Predicate<Locale> predicate) {
  84.         return availableLocaleList().stream().filter(predicate).collect(Collectors.toList());
  85.     }

  86.     /**
  87.      * Obtains an unmodifiable set of installed locales.
  88.      *
  89.      * <p>This method is a wrapper around {@link Locale#getAvailableLocales()}.
  90.      * It is more efficient, as the JDK method must create a new array each
  91.      * time it is called.</p>
  92.      *
  93.      * @return the unmodifiable set of available locales
  94.      */
  95.     public static Set<Locale> availableLocaleSet() {
  96.         return SyncAvoid.AVAILABLE_LOCALE_SET;
  97.     }

  98.     /**
  99.      * Obtains the list of countries supported for a given language.
  100.      *
  101.      * <p>This method takes a language code and searches to find the
  102.      * countries available for that language. Variant locales are removed.</p>
  103.      *
  104.      * @param languageCode  the 2 letter language code, null returns empty
  105.      * @return an unmodifiable List of Locale objects, not null
  106.      */
  107.     public static List<Locale> countriesByLanguage(final String languageCode) {
  108.         if (languageCode == null) {
  109.             return Collections.emptyList();
  110.         }
  111.         return cCountriesByLanguage.computeIfAbsent(languageCode, lc -> Collections.unmodifiableList(
  112.             availableLocaleList(locale -> languageCode.equals(locale.getLanguage()) && !locale.getCountry().isEmpty() && locale.getVariant().isEmpty())));
  113.     }

  114.     /**
  115.      * Checks if the locale specified is in the set of available locales.
  116.      *
  117.      * @param locale the Locale object to check if it is available
  118.      * @return true if the locale is a known locale
  119.      */
  120.     public static boolean isAvailableLocale(final Locale locale) {
  121.         return availableLocaleSet().contains(locale);
  122.     }

  123.     /**
  124.      * Checks whether the given String is a ISO 3166 alpha-2 country code.
  125.      *
  126.      * @param str the String to check
  127.      * @return true, is the given String is a ISO 3166 compliant country code.
  128.      */
  129.     private static boolean isISO3166CountryCode(final String str) {
  130.         return StringUtils.isAllUpperCase(str) && str.length() == 2;
  131.     }

  132.     /**
  133.      * Checks whether the given String is a ISO 639 compliant language code.
  134.      *
  135.      * @param str the String to check.
  136.      * @return true, if the given String is a ISO 639 compliant language code.
  137.      */
  138.     private static boolean isISO639LanguageCode(final String str) {
  139.         return StringUtils.isAllLowerCase(str) && (str.length() == 2 || str.length() == 3);
  140.     }

  141.     /**
  142.      * Tests whether a Locale's language is undetermined.
  143.      * <p>
  144.      * A Locale's language tag is undetermined if it's value is {@code "und"}. If a language is empty, or not well-formed (for example, "a" or"e2"), it will be
  145.      * equal to {@code "und"}.
  146.      * </p>
  147.      *
  148.      * @param locale the locale to test.
  149.      * @return whether a Locale's language is undetermined.
  150.      * @see Locale#toLanguageTag()
  151.      * @since 3.14.0
  152.      */
  153.     public static boolean isLanguageUndetermined(final Locale locale) {
  154.         return locale == null || UNDETERMINED.equals(locale.toLanguageTag());
  155.     }

  156.     /**
  157.      * Checks whether the given String is a UN M.49 numeric area code.
  158.      *
  159.      * @param str the String to check
  160.      * @return true, is the given String is a UN M.49 numeric area code.
  161.      */
  162.     private static boolean isNumericAreaCode(final String str) {
  163.         return StringUtils.isNumeric(str) && str.length() == 3;
  164.     }

  165.     /**
  166.      * Obtains the list of languages supported for a given country.
  167.      *
  168.      * <p>This method takes a country code and searches to find the
  169.      * languages available for that country. Variant locales are removed.</p>
  170.      *
  171.      * @param countryCode  the 2-letter country code, null returns empty
  172.      * @return an unmodifiable List of Locale objects, not null
  173.      */
  174.     public static List<Locale> languagesByCountry(final String countryCode) {
  175.         if (countryCode == null) {
  176.             return Collections.emptyList();
  177.         }
  178.         return cLanguagesByCountry.computeIfAbsent(countryCode,
  179.             k -> Collections.unmodifiableList(availableLocaleList(locale -> countryCode.equals(locale.getCountry()) && locale.getVariant().isEmpty())));
  180.     }

  181.     /**
  182.      * Obtains the list of locales to search through when performing
  183.      * a locale search.
  184.      *
  185.      * <pre>
  186.      * localeLookupList(Locale("fr", "CA", "xxx"))
  187.      *   = [Locale("fr", "CA", "xxx"), Locale("fr", "CA"), Locale("fr")]
  188.      * </pre>
  189.      *
  190.      * @param locale  the locale to start from
  191.      * @return the unmodifiable list of Locale objects, 0 being locale, not null
  192.      */
  193.     public static List<Locale> localeLookupList(final Locale locale) {
  194.         return localeLookupList(locale, locale);
  195.     }

  196.     /**
  197.      * Obtains the list of locales to search through when performing
  198.      * a locale search.
  199.      *
  200.      * <pre>
  201.      * localeLookupList(Locale("fr", "CA", "xxx"), Locale("en"))
  202.      *   = [Locale("fr", "CA", "xxx"), Locale("fr", "CA"), Locale("fr"), Locale("en"]
  203.      * </pre>
  204.      *
  205.      * <p>The result list begins with the most specific locale, then the
  206.      * next more general and so on, finishing with the default locale.
  207.      * The list will never contain the same locale twice.</p>
  208.      *
  209.      * @param locale  the locale to start from, null returns empty list
  210.      * @param defaultLocale  the default locale to use if no other is found
  211.      * @return the unmodifiable list of Locale objects, 0 being locale, not null
  212.      */
  213.     public static List<Locale> localeLookupList(final Locale locale, final Locale defaultLocale) {
  214.         final List<Locale> list = new ArrayList<>(4);
  215.         if (locale != null) {
  216.             list.add(locale);
  217.             if (!locale.getVariant().isEmpty()) {
  218.                 list.add(new Locale(locale.getLanguage(), locale.getCountry()));
  219.             }
  220.             if (!locale.getCountry().isEmpty()) {
  221.                 list.add(new Locale(locale.getLanguage(), StringUtils.EMPTY));
  222.             }
  223.             if (!list.contains(defaultLocale)) {
  224.                 list.add(defaultLocale);
  225.             }
  226.         }
  227.         return Collections.unmodifiableList(list);
  228.     }

  229.     /**
  230.      * Tries to parse a Locale from the given String.
  231.      * <p>
  232.      * See {@Link Locale} for the format.
  233.      * </p>
  234.      *
  235.      * @param str the String to parse as a Locale.
  236.      * @return a Locale parsed from the given String.
  237.      * @throws IllegalArgumentException if the given String can not be parsed.
  238.      * @see Locale
  239.      */
  240.     private static Locale parseLocale(final String str) {
  241.         if (isISO639LanguageCode(str)) {
  242.             return new Locale(str);
  243.         }
  244.         final int limit = 3;
  245.         final char separator = str.indexOf(UNDERSCORE) != -1 ? UNDERSCORE : DASH;
  246.         final String[] segments = str.split(String.valueOf(separator), 3);
  247.         final String language = segments[0];
  248.         if (segments.length == 2) {
  249.             final String country = segments[1];
  250.             if (isISO639LanguageCode(language) && isISO3166CountryCode(country) || isNumericAreaCode(country)) {
  251.                 return new Locale(language, country);
  252.             }
  253.         } else if (segments.length == limit) {
  254.             final String country = segments[1];
  255.             final String variant = segments[2];
  256.             if (isISO639LanguageCode(language) &&
  257.                     (country.isEmpty() || isISO3166CountryCode(country) || isNumericAreaCode(country)) &&
  258.                     !variant.isEmpty()) {
  259.                 return new Locale(language, country, variant);
  260.             }
  261.         }
  262.         throw new IllegalArgumentException("Invalid locale format: " + str);
  263.     }

  264.     /**
  265.      * Returns the given locale if non-{@code null}, otherwise {@link Locale#getDefault()}.
  266.      *
  267.      * @param locale a locale or {@code null}.
  268.      * @return the given locale if non-{@code null}, otherwise {@link Locale#getDefault()}.
  269.      * @since 3.12.0
  270.      */
  271.     public static Locale toLocale(final Locale locale) {
  272.         return locale != null ? locale : Locale.getDefault();
  273.     }

  274.     /**
  275.      * Converts a String to a Locale.
  276.      *
  277.      * <p>This method takes the string format of a locale and creates the
  278.      * locale object from it.</p>
  279.      *
  280.      * <pre>
  281.      *   LocaleUtils.toLocale("")           = new Locale("", "")
  282.      *   LocaleUtils.toLocale("en")         = new Locale("en", "")
  283.      *   LocaleUtils.toLocale("en_GB")      = new Locale("en", "GB")
  284.      *   LocaleUtils.toLocale("en-GB")      = new Locale("en", "GB")
  285.      *   LocaleUtils.toLocale("en_001")     = new Locale("en", "001")
  286.      *   LocaleUtils.toLocale("en_GB_xxx")  = new Locale("en", "GB", "xxx")   (#)
  287.      * </pre>
  288.      *
  289.      * <p>(#) The behavior of the JDK variant constructor changed between JDK1.3 and JDK1.4.
  290.      * In JDK1.3, the constructor upper cases the variant, in JDK1.4, it doesn't.
  291.      * Thus, the result from getVariant() may vary depending on your JDK.</p>
  292.      *
  293.      * <p>This method validates the input strictly.
  294.      * The language code must be lowercase.
  295.      * The country code must be uppercase.
  296.      * The separator must be an underscore or a dash.
  297.      * The length must be correct.
  298.      * </p>
  299.      *
  300.      * @param str  the locale String to convert, null returns null
  301.      * @return a Locale, null if null input
  302.      * @throws IllegalArgumentException if the string is an invalid format
  303.      * @see Locale#forLanguageTag(String)
  304.      */
  305.     public static Locale toLocale(final String str) {
  306.         if (str == null) {
  307.             // TODO Should this return the default locale?
  308.             return null;
  309.         }
  310.         if (str.isEmpty()) { // LANG-941 - JDK 8 introduced an empty locale where all fields are blank
  311.             return new Locale(StringUtils.EMPTY, StringUtils.EMPTY);
  312.         }
  313.         if (str.contains("#")) { // LANG-879 - Cannot handle Java 7 script & extensions
  314.             throw new IllegalArgumentException("Invalid locale format: " + str);
  315.         }
  316.         final int len = str.length();
  317.         if (len < 2) {
  318.             throw new IllegalArgumentException("Invalid locale format: " + str);
  319.         }
  320.         final char ch0 = str.charAt(0);
  321.         if (ch0 == UNDERSCORE || ch0 == DASH) {
  322.             if (len < 3) {
  323.                 throw new IllegalArgumentException("Invalid locale format: " + str);
  324.             }
  325.             final char ch1 = str.charAt(1);
  326.             final char ch2 = str.charAt(2);
  327.             if (!Character.isUpperCase(ch1) || !Character.isUpperCase(ch2)) {
  328.                 throw new IllegalArgumentException("Invalid locale format: " + str);
  329.             }
  330.             if (len == 3) {
  331.                 return new Locale(StringUtils.EMPTY, str.substring(1, 3));
  332.             }
  333.             if (len < 5) {
  334.                 throw new IllegalArgumentException("Invalid locale format: " + str);
  335.             }
  336.             if (str.charAt(3) != ch0) {
  337.                 throw new IllegalArgumentException("Invalid locale format: " + str);
  338.             }
  339.             return new Locale(StringUtils.EMPTY, str.substring(1, 3), str.substring(4));
  340.         }

  341.         return parseLocale(str);
  342.     }

  343.     /**
  344.      * {@link LocaleUtils} instances should NOT be constructed in standard programming.
  345.      * Instead, the class should be used as {@code LocaleUtils.toLocale("en_GB");}.
  346.      *
  347.      * <p>This constructor is public to permit tools that require a JavaBean instance
  348.      * to operate.</p>
  349.      *
  350.      * @deprecated TODO Make private in 4.0.
  351.      */
  352.     @Deprecated
  353.     public LocaleUtils() {
  354.         // empty
  355.     }

  356. }