// virtualx-engine/thirdparty/icu4c/common/ulocimp.h

// © 2016 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
/*
**********************************************************************
*   Copyright (C) 2004-2016, International Business Machines
*   Corporation and others.  All Rights Reserved.
**********************************************************************
*/

#ifndef ULOCIMP_H
#define ULOCIMP_H

#include "unicode/bytestream.h"
#include "unicode/uloc.h"

#include "charstr.h"

/**
 * Create an iterator (UEnumeration) over the specified keywords list.
 *
 * @param keywordList double-null terminated list of keywords. The list is
 *                    copied.
 * @param keywordListSize size in bytes of keywordList
 * @param status pointer to the error code
 * @return enumeration of the keyword list. It is owned by the caller
 *         (NOTE(review): presumably to be released with uenum_close() —
 *         confirm).
 * @internal ICU 3.0
 */
U_CAPI UEnumeration* U_EXPORT2
uloc_openKeywordList(const char *keywordList, int32_t keywordListSize, UErrorCode* status);

/**
 * Look up a resource bundle table item with fallback on the table level.
 * This is accessible so it can be called by C++ code.
 *
 * NOTE(review): the parameters are not documented in this header. Judging by
 * their names only: `path` and `locale` presumably select the resource
 * bundle; `tableKey`, `subTableKey` and `itemKey` presumably select the item
 * inside it; `pLength` presumably receives the length of the returned string;
 * `pErrorCode` is the error status. Confirm against the implementation
 * before relying on any of this.
 */
U_CAPI const UChar * U_EXPORT2
uloc_getTableStringWithFallback(
    const char *path,
    const char *locale,
    const char *tableKey,
    const char *subTableKey,
    const char *itemKey,
    int32_t *pLength,
    UErrorCode *pErrorCode);

/**
 * Returns true if `a` is a locale ID separator ('_' or '-'), false otherwise.
 *
 * The argument is parenthesized so that an expression whose operator binds
 * less tightly than `==` (for example `c & 0x7F` or `x ? y : z`) is compared
 * as a whole rather than being re-associated by the macro expansion.
 *
 * Note: `a` may still be evaluated twice, so do not pass an expression with
 * side effects (for example `*p++`).
 */
#define _isIDSeparator(a) ((a) == '_' || (a) == '-')

/*
 * NOTE(review): undocumented in this header. Judging by the name, this
 * presumably maps an obsolete country ID to its current equivalent. Confirm
 * against the implementation, including what is returned when oldID has no
 * replacement and who owns the returned string.
 */
U_CFUNC const char* 
uloc_getCurrentCountryID(const char* oldID);

/*
 * NOTE(review): undocumented in this header. Same signature as
 * uloc_getCurrentCountryID; presumably the equivalent mapping for language
 * IDs. Confirm against the implementation.
 */
U_CFUNC const char* 
uloc_getCurrentLanguageID(const char* oldID);

/*
 * NOTE(review): undocumented in this header. Judging by the signature, this
 * presumably writes the keywords found in localeID to `sink`, including
 * their values when `valuesToo` is true, and reports failures through
 * `status`. The meaning of `prev` cannot be determined from this header.
 * Confirm all of this against the implementation.
 */
U_CFUNC void
ulocimp_getKeywords(const char *localeID,
             char prev,
             icu::ByteSink& sink,
             UBool valuesToo,
             UErrorCode *status);

/*
 * The three functions below share one shape: they take a locale ID, return
 * an icu::CharString by value, and take the error code by reference rather
 * than by pointer. Unlike the other declarations in this header, they are
 * declared without U_CAPI / U_CFUNC.
 *
 * NOTE(review): undocumented in this header. Judging by the names, each
 * presumably returns the language, script or country field parsed from
 * localeID, and `pEnd` presumably receives the position where parsing of
 * that field stopped. Whether `pEnd` may be null is not visible here.
 * Confirm against the implementation.
 */
icu::CharString U_EXPORT2
ulocimp_getLanguage(const char *localeID,
                    const char **pEnd,
                    UErrorCode &status);

/* See the note above ulocimp_getLanguage; presumably the script field. */
icu::CharString U_EXPORT2
ulocimp_getScript(const char *localeID,
                  const char **pEnd,
                  UErrorCode &status);

/* See the note above ulocimp_getLanguage; presumably the country field. */
icu::CharString U_EXPORT2
ulocimp_getCountry(const char *localeID,
                   const char **pEnd,
                   UErrorCode &status);

/*
 * NOTE(review): the five functions below are undocumented in this header.
 * Each takes a locale ID, an icu::ByteSink and a UErrorCode pointer, and
 * returns void. Judging by the names, they are presumably sink-writing
 * counterparts of the similarly named uloc_* functions in unicode/uloc.h
 * (uloc_getName, uloc_getBaseName, uloc_canonicalize, uloc_getKeywordValue,
 * uloc_getParent). Confirm against the implementation.
 */

/* Presumably writes the full name of localeID to `sink` (see note above). */
U_CAPI void U_EXPORT2
ulocimp_getName(const char* localeID,
                icu::ByteSink& sink,
                UErrorCode* err);

/* Presumably writes the base name of localeID to `sink` (see note above). */
U_CAPI void U_EXPORT2
ulocimp_getBaseName(const char* localeID,
                    icu::ByteSink& sink,
                    UErrorCode* err);

/* Presumably writes the canonicalized localeID to `sink` (see note above). */
U_CAPI void U_EXPORT2
ulocimp_canonicalize(const char* localeID,
                     icu::ByteSink& sink,
                     UErrorCode* err);

/*
 * Presumably writes the value of keyword `keywordName` in localeID to `sink`
 * (see note above).
 */
U_CAPI void U_EXPORT2
ulocimp_getKeywordValue(const char* localeID,
                        const char* keywordName,
                        icu::ByteSink& sink,
                        UErrorCode* status);

/* Presumably writes the parent locale of localeID to `sink` (see note above). */
U_CAPI void U_EXPORT2
ulocimp_getParent(const char* localeID,
                  icu::ByteSink& sink,
                  UErrorCode* err);

/**
 * Writes a well-formed language tag for this locale ID.
 *
 * **Note**: When `strict` is false, any locale fields which do not satisfy the
 * BCP47 syntax requirement will be omitted from the result.  When `strict` is
 * true, this function sets `err` to U_ILLEGAL_ARGUMENT_ERROR if any locale
 * field does not satisfy the BCP47 syntax requirement.
 *
 * This function returns nothing; the language tag is delivered through
 * `sink`.
 *
 * @param localeID  the input locale ID
 * @param sink      the output sink receiving the BCP47 language
 *                  tag for this Locale.
 * @param strict    boolean value indicating if the function returns
 *                  an error for an ill-formed input locale ID.
 * @param err       error information if receiving the language
 *                  tag failed.
 *
 * @internal ICU 64
 */
U_CAPI void U_EXPORT2
ulocimp_toLanguageTag(const char* localeID,
                      icu::ByteSink& sink,
                      UBool strict,
                      UErrorCode* err);

/**
 * Writes a locale ID for the specified BCP47 language tag string.
 * If the specified language tag contains any ill-formed subtags,
 * the first such subtag and all following subtags are ignored.
 * <p>
 * This implements the 'Language-Tag' production of BCP 47, and so
 * supports legacy language tags (marked as “Type: grandfathered” in BCP 47)
 * (regular and irregular) as well as private use language tags.
 *
 * Private use tags are represented as 'x-whatever',
 * and legacy tags are converted to their canonical replacements where they exist.
 *
 * Note that a few legacy tags have no modern replacement;
 * these will be converted using the fallback described in
 * the first paragraph, so some information might be lost.
 *
 * This function returns nothing; the locale ID is delivered through `sink`.
 *
 * @param langtag   the input BCP47 language tag.
 * @param tagLen    the length of langtag, or -1 to call uprv_strlen().
 * @param sink      the output sink receiving a locale ID for the
 *                  specified BCP47 language tag.
 * @param parsedLength  if not NULL, receives the length of the part of
 *                      the input language tag that was successfully parsed.
 * @param err       error information if receiving the locale ID
 *                  failed.
 * @internal ICU 63
 */
U_CAPI void U_EXPORT2
ulocimp_forLanguageTag(const char* langtag,
                       int32_t tagLen,
                       icu::ByteSink& sink,
                       int32_t* parsedLength,
                       UErrorCode* err);

/**
 * Get the region to use for supplemental data lookup. The following sources
 * are tried in order, and the first one that yields a region is used:
 * (1) any region specified by locale tag "rg"; if none then
 * (2) any unicode_region_tag in the locale ID; if none then
 * (3) if inferRegion is true, the region suggested by
 * getLikelySubtags on the localeID.
 * If no region is found, returns length 0.
 *
 * @param localeID
 *     The complete locale ID (with keywords) from which
 *     to get the region to use for supplemental data.
 * @param inferRegion
 *     If true, will try to infer region from localeID if
 *     no other region is found.
 * @param region
 *     Buffer in which to put the region ID found; should
 *     have a capacity of at least ULOC_COUNTRY_CAPACITY.
 * @param regionCapacity
 *     The actual capacity of the region buffer.
 * @param status
 *     Pointer to in/out UErrorCode value for latest status.
 * @return
 *     The length of any region code found, or 0 if none.
 * @internal ICU 57
 */
U_CAPI int32_t U_EXPORT2
ulocimp_getRegionForSupplementalData(const char *localeID, UBool inferRegion,
                                     char *region, int32_t regionCapacity, UErrorCode* status);

/**
 * Add the likely subtags for a provided locale ID, per the algorithm described
 * in the following CLDR technical report:
 *
 *   http://www.unicode.org/reports/tr35/#Likely_Subtags
 *
 * If localeID is already in the maximal form, or there is no data available
 * for maximization, it will be written to the output sink unchanged.  For
 * example, "und-Zzzz" cannot be maximized, since there is no reasonable
 * maximization.
 *
 * Examples:
 *
 * "en" maximizes to "en_Latn_US"
 *
 * "de" maximizes to "de_Latn_DE"
 *
 * "sr" maximizes to "sr_Cyrl_RS"
 *
 * "sh" maximizes to "sr_Latn_RS" (Note this will not reverse.)
 *
 * "zh_Hani" maximizes to "zh_Hans_CN" (Note this will not reverse.)
 *
 * @param localeID The locale to maximize
 * @param sink The output sink receiving the maximized locale
 * @param err Error information if maximizing the locale failed.  If the length
 * of the localeID and the null-terminator is greater than the maximum allowed size,
 * or the localeID is not well-formed, the error code is U_ILLEGAL_ARGUMENT_ERROR.
 * @internal ICU 64
 */
U_CAPI void U_EXPORT2
ulocimp_addLikelySubtags(const char* localeID,
                         icu::ByteSink& sink,
                         UErrorCode* err);

/**
 * Minimize the subtags for a provided locale ID, per the algorithm described
 * in the following CLDR technical report:
 *
 *   http://www.unicode.org/reports/tr35/#Likely_Subtags
 *
 * If localeID is already in the minimal form, or there is no data available
 * for minimization, it will be written to the output sink unchanged.  Since
 * the minimization algorithm relies on proper maximization, see the comments
 * for ulocimp_addLikelySubtags for reasons why there might not be any data.
 *
 * Examples:
 *
 * "en_Latn_US" minimizes to "en"
 *
 * "de_Latn_DE" minimizes to "de"
 *
 * "sr_Cyrl_RS" minimizes to "sr"
 *
 * "zh_Hant_TW" minimizes to "zh_TW" (The region is preferred to the
 * script, and minimizing to "zh" would imply "zh_Hans_CN".)
 *
 * @param localeID The locale to minimize
 * @param sink The output sink receiving the minimized locale
 * @param favorScript favor to keep script if true, region if false.
 * @param err Error information if minimizing the locale failed.  If the length
 * of the localeID and the null-terminator is greater than the maximum allowed size,
 * or the localeID is not well-formed, the error code is U_ILLEGAL_ARGUMENT_ERROR.
 * @internal ICU 64
 */
U_CAPI void U_EXPORT2
ulocimp_minimizeSubtags(const char* localeID,
                        icu::ByteSink& sink,
                        bool favorScript,
                        UErrorCode* err);

/*
 * NOTE(review): undocumented in this header. Judging by the name and
 * signature, this presumably returns a pointer into localeID at the point
 * where its keyword section begins. What is returned when localeID has no
 * keywords is not visible here. Confirm against the implementation.
 */
U_CAPI const char * U_EXPORT2
locale_getKeywordsStart(const char *localeID);

/*
 * Language tag syntax predicates. All twelve share the same signature: a
 * character pointer `s`, a length `len`, and a UBool result.
 *
 * NOTE(review): none of these are documented in this header. Judging by the
 * names, each presumably reports whether the `len` bytes starting at `s` are
 * well-formed as the BCP 47 element named by the function (singular names
 * for one subtag, plural names for a sequence of subtags). How a negative
 * `len` is treated is not visible here. Confirm against the implementation.
 */
U_CFUNC UBool
ultag_isExtensionSubtags(const char* s, int32_t len);

U_CFUNC UBool
ultag_isLanguageSubtag(const char* s, int32_t len);

U_CFUNC UBool
ultag_isPrivateuseValueSubtags(const char* s, int32_t len);

U_CFUNC UBool
ultag_isRegionSubtag(const char* s, int32_t len);

U_CFUNC UBool
ultag_isScriptSubtag(const char* s, int32_t len);

U_CFUNC UBool
ultag_isTransformedExtensionSubtags(const char* s, int32_t len);

U_CFUNC UBool
ultag_isUnicodeExtensionSubtags(const char* s, int32_t len);

U_CFUNC UBool
ultag_isUnicodeLocaleAttribute(const char* s, int32_t len);

U_CFUNC UBool
ultag_isUnicodeLocaleAttributes(const char* s, int32_t len);

U_CFUNC UBool
ultag_isUnicodeLocaleKey(const char* s, int32_t len);

U_CFUNC UBool
ultag_isUnicodeLocaleType(const char* s, int32_t len);

U_CFUNC UBool
ultag_isVariantSubtags(const char* s, int32_t len);

/*
 * NOTE(review): undocumented in this header. Judging by the name and
 * signature, this presumably returns a pointer into localeID at the point
 * where a transformed-extension key ("tkey") starts. What is returned when
 * there is none is not visible here. Confirm against the implementation.
 */
U_CAPI const char * U_EXPORT2
ultag_getTKeyStart(const char *localeID);

/*
 * Keyword key/type conversion helpers.
 *
 * NOTE(review): none of these are documented in this header. Judging by the
 * names, they presumably convert a locale keyword key, or the type (value)
 * of a given key, between the legacy form and the BCP 47 form. For the two
 * *Type functions, `isKnownKey` and `isSpecialType` are presumably optional
 * output flags. What is returned when no mapping exists, and who owns the
 * returned string, is not visible here. Confirm against the implementation.
 */

/* Presumably legacy key -> BCP 47 key (see note above). */
U_CFUNC const char*
ulocimp_toBcpKey(const char* key);

/* Presumably BCP 47 key -> legacy key (see note above). */
U_CFUNC const char*
ulocimp_toLegacyKey(const char* key);

/* Presumably legacy type of `key` -> BCP 47 type (see note above). */
U_CFUNC const char*
ulocimp_toBcpType(const char* key, const char* type, UBool* isKnownKey, UBool* isSpecialType);

/* Presumably BCP 47 type of `key` -> legacy type (see note above). */
U_CFUNC const char*
ulocimp_toLegacyType(const char* key, const char* type, UBool* isKnownKey, UBool* isSpecialType);

/*
 * Function for testing purposes only.
 * NOTE(review): judging by the name and signature, this presumably returns
 * an array of locale names known to be canonicalized and stores the number
 * of entries in *length. Confirm against the implementation.
 */
U_CAPI const char* const* ulocimp_getKnownCanonicalizedLocaleForTest(int32_t* length);

// Function for testing purposes only.
// Return true if the value (localeName) is already canonicalized.
U_CAPI bool ulocimp_isCanonicalizedLocaleForTest(const char* localeName);

#endif
[Complex Text Layouts] Add third-party TextServer dependencies (ICU, HarfBuzz, Graphite). 2020-08-11 11:10:23 +02:00			`// © 2016 and later: Unicode, Inc. and others.`
			`// License & terms of use: http://www.unicode.org/copyright.html`
			`/*`
			`**********************************************************************`
			`* Copyright (C) 2004-2016, International Business Machines`
			`* Corporation and others. All Rights Reserved.`
			`**********************************************************************`
			`*/`

			`#ifndef ULOCIMP_H`
			`#define ULOCIMP_H`

			`#include "unicode/bytestream.h"`
			`#include "unicode/uloc.h"`

			`#include "charstr.h"`

			`/**`
			`* Create an iterator over the specified keywords list`
			`* @param keywordList double-null terminated list. Will be copied.`
			`* @param keywordListSize size in bytes of keywordList`
			`* @param status err code`
			`* @return enumeration (owned by caller) of the keyword list.`
			`* @internal ICU 3.0`
			`*/`
			`U_CAPI UEnumeration* U_EXPORT2`
			`uloc_openKeywordList(const char keywordList, int32_t keywordListSize, UErrorCode status);`

			`/**`
			`* Look up a resource bundle table item with fallback on the table level.`
			`* This is accessible so it can be called by C++ code.`
			`*/`
			`U_CAPI const UChar * U_EXPORT2`
			`uloc_getTableStringWithFallback(`
			`const char *path,`
			`const char *locale,`
			`const char *tableKey,`
			`const char *subTableKey,`
			`const char *itemKey,`
			`int32_t *pLength,`
			`UErrorCode *pErrorCode);`

			`/returns true if a is an ID separator false otherwise/`
			`#define _isIDSeparator(a) (a == '_' \|\| a == '-')`

			`U_CFUNC const char*`
			`uloc_getCurrentCountryID(const char* oldID);`

			`U_CFUNC const char*`
			`uloc_getCurrentLanguageID(const char* oldID);`

			`U_CFUNC void`
			`ulocimp_getKeywords(const char *localeID,`
			`char prev,`
			`icu::ByteSink& sink,`
			`UBool valuesToo,`
			`UErrorCode *status);`

			`icu::CharString U_EXPORT2`
			`ulocimp_getLanguage(const char *localeID,`
			`const char **pEnd,`
			`UErrorCode &status);`

			`icu::CharString U_EXPORT2`
			`ulocimp_getScript(const char *localeID,`
			`const char **pEnd,`
			`UErrorCode &status);`

			`icu::CharString U_EXPORT2`
			`ulocimp_getCountry(const char *localeID,`
			`const char **pEnd,`
			`UErrorCode &status);`

			`U_CAPI void U_EXPORT2`
			`ulocimp_getName(const char* localeID,`
			`icu::ByteSink& sink,`
			`UErrorCode* err);`

			`U_CAPI void U_EXPORT2`
			`ulocimp_getBaseName(const char* localeID,`
			`icu::ByteSink& sink,`
			`UErrorCode* err);`

			`U_CAPI void U_EXPORT2`
			`ulocimp_canonicalize(const char* localeID,`
			`icu::ByteSink& sink,`
			`UErrorCode* err);`

			`U_CAPI void U_EXPORT2`
			`ulocimp_getKeywordValue(const char* localeID,`
			`const char* keywordName,`
			`icu::ByteSink& sink,`
			`UErrorCode* status);`

ICU4C: Update to version 74.1 2023-11-01 07:56:12 +01:00			`U_CAPI void U_EXPORT2`
			`ulocimp_getParent(const char* localeID,`
			`icu::ByteSink& sink,`
			`UErrorCode* err);`

[Complex Text Layouts] Add third-party TextServer dependencies (ICU, HarfBuzz, Graphite). 2020-08-11 11:10:23 +02:00			`/**`
			`* Writes a well-formed language tag for this locale ID.`
			`*`
			* Note: When `strict` is false, any locale fields which do not satisfy the
			* BCP47 syntax requirement will be omitted from the result. When `strict` is
			* true, this function sets U_ILLEGAL_ARGUMENT_ERROR to the `err` if any locale
			`* fields do not satisfy the BCP47 syntax requirement.`
			`*`
			`* @param localeID the input locale ID`
			`* @param sink the output sink receiving the BCP47 language`
			`* tag for this Locale.`
			`* @param strict boolean value indicating if the function returns`
			`* an error for an ill-formed input locale ID.`
			`* @param err error information if receiving the language`
			`* tag failed.`
			`* @return The length of the BCP47 language tag.`
			`*`
			`* @internal ICU 64`
			`*/`
			`U_CAPI void U_EXPORT2`
			`ulocimp_toLanguageTag(const char* localeID,`
			`icu::ByteSink& sink,`
			`UBool strict,`
			`UErrorCode* err);`

			`/**`
			`* Returns a locale ID for the specified BCP47 language tag string.`
			`* If the specified language tag contains any ill-formed subtags,`
			`* the first such subtag and all following subtags are ignored.`
			`* <p>`
			`* This implements the 'Language-Tag' production of BCP 47, and so`
			`* supports legacy language tags (marked as “Type: grandfathered” in BCP 47)`
			`* (regular and irregular) as well as private use language tags.`
			`*`
			`* Private use tags are represented as 'x-whatever',`
			`* and legacy tags are converted to their canonical replacements where they exist.`
			`*`
			`* Note that a few legacy tags have no modern replacement;`
			`* these will be converted using the fallback described in`
			`* the first paragraph, so some information might be lost.`
			`*`
			`* @param langtag the input BCP47 language tag.`
			`* @param tagLen the length of langtag, or -1 to call uprv_strlen().`
			`* @param sink the output sink receiving a locale ID for the`
			`* specified BCP47 language tag.`
			`* @param parsedLength if not NULL, successfully parsed length`
			`* for the input language tag is set.`
			`* @param err error information if receiving the locald ID`
			`* failed.`
			`* @internal ICU 63`
			`*/`
			`U_CAPI void U_EXPORT2`
			`ulocimp_forLanguageTag(const char* langtag,`
			`int32_t tagLen,`
			`icu::ByteSink& sink,`
			`int32_t* parsedLength,`
			`UErrorCode* err);`

			`/**`
			`* Get the region to use for supplemental data lookup. Uses`
			`* (1) any region specified by locale tag "rg"; if none then`
			`* (2) any unicode_region_tag in the locale ID; if none then`
			`* (3) if inferRegion is true, the region suggested by`
			`* getLikelySubtags on the localeID.`
			`* If no region is found, returns length 0.`
			`*`
			`* @param localeID`
			`* The complete locale ID (with keywords) from which`
			`* to get the region to use for supplemental data.`
			`* @param inferRegion`
			`* If true, will try to infer region from localeID if`
			`* no other region is found.`
			`* @param region`
			`* Buffer in which to put the region ID found; should`
			`* have a capacity at least ULOC_COUNTRY_CAPACITY.`
			`* @param regionCapacity`
			`* The actual capacity of the region buffer.`
			`* @param status`
			`* Pointer to in/out UErrorCode value for latest status.`
			`* @return`
			`* The length of any region code found, or 0 if none.`
			`* @internal ICU 57`
			`*/`
			`U_CAPI int32_t U_EXPORT2`
			`ulocimp_getRegionForSupplementalData(const char *localeID, UBool inferRegion,`
			`char region, int32_t regionCapacity, UErrorCode status);`

			`/**`
			`* Add the likely subtags for a provided locale ID, per the algorithm described`
			`* in the following CLDR technical report:`
			`*`
			`* http://www.unicode.org/reports/tr35/#Likely_Subtags`
			`*`
			`* If localeID is already in the maximal form, or there is no data available`
			`* for maximization, it will be copied to the output buffer. For example,`
			`* "und-Zzzz" cannot be maximized, since there is no reasonable maximization.`
			`*`
			`* Examples:`
			`*`
			`* "en" maximizes to "en_Latn_US"`
			`*`
			`* "de" maximizes to "de_Latn_US"`
			`*`
			`* "sr" maximizes to "sr_Cyrl_RS"`
			`*`
			`* "sh" maximizes to "sr_Latn_RS" (Note this will not reverse.)`
			`*`
			`* "zh_Hani" maximizes to "zh_Hans_CN" (Note this will not reverse.)`
			`*`
			`* @param localeID The locale to maximize`
			`* @param sink The output sink receiving the maximized locale`
			`* @param err Error information if maximizing the locale failed. If the length`
			`* of the localeID and the null-terminator is greater than the maximum allowed size,`
			`* or the localeId is not well-formed, the error code is U_ILLEGAL_ARGUMENT_ERROR.`
			`* @internal ICU 64`
			`*/`
			`U_CAPI void U_EXPORT2`
			`ulocimp_addLikelySubtags(const char* localeID,`
			`icu::ByteSink& sink,`
			`UErrorCode* err);`

			`/**`
			`* Minimize the subtags for a provided locale ID, per the algorithm described`
			`* in the following CLDR technical report:`
			`*`
			`* http://www.unicode.org/reports/tr35/#Likely_Subtags`
			`*`
			`* If localeID is already in the minimal form, or there is no data available`
			`* for minimization, it will be copied to the output buffer. Since the`
			`* minimization algorithm relies on proper maximization, see the comments`
			`* for ulocimp_addLikelySubtags for reasons why there might not be any data.`
			`*`
			`* Examples:`
			`*`
			`* "en_Latn_US" minimizes to "en"`
			`*`
			`* "de_Latn_US" minimizes to "de"`
			`*`
			`* "sr_Cyrl_RS" minimizes to "sr"`
			`*`
			`* "zh_Hant_TW" minimizes to "zh_TW" (The region is preferred to the`
			`* script, and minimizing to "zh" would imply "zh_Hans_CN".)`
			`*`
			`* @param localeID The locale to minimize`
			`* @param sink The output sink receiving the maximized locale`
ICU4C: Update to version 74.1 2023-11-01 07:56:12 +01:00			`* @param favorScript favor to keep script if true, region if false.`
[Complex Text Layouts] Add third-party TextServer dependencies (ICU, HarfBuzz, Graphite). 2020-08-11 11:10:23 +02:00			`* @param err Error information if minimizing the locale failed. If the length`
			`* of the localeID and the null-terminator is greater than the maximum allowed size,`
			`* or the localeId is not well-formed, the error code is U_ILLEGAL_ARGUMENT_ERROR.`
			`* @internal ICU 64`
			`*/`
			`U_CAPI void U_EXPORT2`
			`ulocimp_minimizeSubtags(const char* localeID,`
			`icu::ByteSink& sink,`
ICU4C: Update to version 74.1 2023-11-01 07:56:12 +01:00			`bool favorScript,`
[Complex Text Layouts] Add third-party TextServer dependencies (ICU, HarfBuzz, Graphite). 2020-08-11 11:10:23 +02:00			`UErrorCode* err);`

			`U_CAPI const char * U_EXPORT2`
			`locale_getKeywordsStart(const char *localeID);`

			`U_CFUNC UBool`
			`ultag_isExtensionSubtags(const char* s, int32_t len);`

			`U_CFUNC UBool`
			`ultag_isLanguageSubtag(const char* s, int32_t len);`

			`U_CFUNC UBool`
			`ultag_isPrivateuseValueSubtags(const char* s, int32_t len);`

			`U_CFUNC UBool`
			`ultag_isRegionSubtag(const char* s, int32_t len);`

			`U_CFUNC UBool`
			`ultag_isScriptSubtag(const char* s, int32_t len);`

			`U_CFUNC UBool`
			`ultag_isTransformedExtensionSubtags(const char* s, int32_t len);`

			`U_CFUNC UBool`
			`ultag_isUnicodeExtensionSubtags(const char* s, int32_t len);`

			`U_CFUNC UBool`
			`ultag_isUnicodeLocaleAttribute(const char* s, int32_t len);`

			`U_CFUNC UBool`
			`ultag_isUnicodeLocaleAttributes(const char* s, int32_t len);`

			`U_CFUNC UBool`
			`ultag_isUnicodeLocaleKey(const char* s, int32_t len);`

			`U_CFUNC UBool`
			`ultag_isUnicodeLocaleType(const char* s, int32_t len);`

			`U_CFUNC UBool`
			`ultag_isVariantSubtags(const char* s, int32_t len);`

ICU: Update to version 69.1, improve ICU data export process. 2021-04-22 14:08:59 +02:00			`U_CAPI const char * U_EXPORT2`
			`ultag_getTKeyStart(const char *localeID);`

[Complex Text Layouts] Add third-party TextServer dependencies (ICU, HarfBuzz, Graphite). 2020-08-11 11:10:23 +02:00			`U_CFUNC const char*`
			`ulocimp_toBcpKey(const char* key);`

			`U_CFUNC const char*`
			`ulocimp_toLegacyKey(const char* key);`

			`U_CFUNC const char*`
			`ulocimp_toBcpType(const char* key, const char* type, UBool* isKnownKey, UBool* isSpecialType);`

			`U_CFUNC const char*`
			`ulocimp_toLegacyType(const char* key, const char* type, UBool* isKnownKey, UBool* isSpecialType);`

			`/* Function for testing purpose */`
			`U_CAPI const char* const* ulocimp_getKnownCanonicalizedLocaleForTest(int32_t* length);`

			`// Return true if the value is already canonicalized.`
			`U_CAPI bool ulocimp_isCanonicalizedLocaleForTest(const char* localeName);`

			`#endif`