initial commit, 4.5 stable
Some checks failed
🔗 GHA / 📊 Static checks (push) Has been cancelled
🔗 GHA / 🤖 Android (push) Has been cancelled
🔗 GHA / 🍏 iOS (push) Has been cancelled
🔗 GHA / 🐧 Linux (push) Has been cancelled
🔗 GHA / 🍎 macOS (push) Has been cancelled
🔗 GHA / 🏁 Windows (push) Has been cancelled
🔗 GHA / 🌐 Web (push) Has been cancelled
Some checks failed
🔗 GHA / 📊 Static checks (push) Has been cancelled
🔗 GHA / 🤖 Android (push) Has been cancelled
🔗 GHA / 🍏 iOS (push) Has been cancelled
🔗 GHA / 🐧 Linux (push) Has been cancelled
🔗 GHA / 🍎 macOS (push) Has been cancelled
🔗 GHA / 🏁 Windows (push) Has been cancelled
🔗 GHA / 🌐 Web (push) Has been cancelled
This commit is contained in:
152
thirdparty/icu4c/common/uscript.cpp
vendored
Normal file
152
thirdparty/icu4c/common/uscript.cpp
vendored
Normal file
@@ -0,0 +1,152 @@
|
||||
// © 2016 and later: Unicode, Inc. and others.
|
||||
// License & terms of use: http://www.unicode.org/copyright.html
|
||||
/*
|
||||
**********************************************************************
|
||||
* Copyright (C) 1997-2014, International Business Machines
|
||||
* Corporation and others. All Rights Reserved.
|
||||
**********************************************************************
|
||||
*
|
||||
* File USCRIPT.C
|
||||
*
|
||||
* Modification History:
|
||||
*
|
||||
* Date Name Description
|
||||
* 07/06/2001 Ram Creation.
|
||||
******************************************************************************
|
||||
*/
|
||||
|
||||
#include "unicode/uchar.h"
|
||||
#include "unicode/uscript.h"
|
||||
#include "unicode/uloc.h"
|
||||
#include "charstr.h"
|
||||
#include "cmemory.h"
|
||||
#include "cstring.h"
|
||||
#include "ulocimp.h"
|
||||
|
||||
static const UScriptCode JAPANESE[3] = { USCRIPT_KATAKANA, USCRIPT_HIRAGANA, USCRIPT_HAN };
|
||||
static const UScriptCode KOREAN[2] = { USCRIPT_HANGUL, USCRIPT_HAN };
|
||||
static const UScriptCode HAN_BOPO[2] = { USCRIPT_HAN, USCRIPT_BOPOMOFO };
|
||||
|
||||
static int32_t
|
||||
setCodes(const UScriptCode *src, int32_t length,
|
||||
UScriptCode *dest, int32_t capacity, UErrorCode *err) {
|
||||
int32_t i;
|
||||
if(U_FAILURE(*err)) { return 0; }
|
||||
if(length > capacity) {
|
||||
*err = U_BUFFER_OVERFLOW_ERROR;
|
||||
return length;
|
||||
}
|
||||
for(i = 0; i < length; ++i) {
|
||||
dest[i] = src[i];
|
||||
}
|
||||
return length;
|
||||
}
|
||||
|
||||
static int32_t
|
||||
setOneCode(UScriptCode script, UScriptCode *scripts, int32_t capacity, UErrorCode *err) {
|
||||
if(U_FAILURE(*err)) { return 0; }
|
||||
if(1 > capacity) {
|
||||
*err = U_BUFFER_OVERFLOW_ERROR;
|
||||
return 1;
|
||||
}
|
||||
scripts[0] = script;
|
||||
return 1;
|
||||
}
|
||||
|
||||
static int32_t
|
||||
getCodesFromLocale(const char *locale,
|
||||
UScriptCode *scripts, int32_t capacity, UErrorCode *err) {
|
||||
if (U_FAILURE(*err)) { return 0; }
|
||||
icu::CharString lang;
|
||||
icu::CharString script;
|
||||
if (locale == nullptr) {
|
||||
locale = uloc_getDefault();
|
||||
}
|
||||
ulocimp_getSubtags(locale, &lang, &script, nullptr, nullptr, nullptr, *err);
|
||||
if (U_FAILURE(*err)) { return 0; }
|
||||
// Multi-script languages, equivalent to the LocaleScript data
|
||||
// that we used to load from locale resource bundles.
|
||||
if (lang == "ja") {
|
||||
return setCodes(JAPANESE, UPRV_LENGTHOF(JAPANESE), scripts, capacity, err);
|
||||
}
|
||||
if (lang == "ko") {
|
||||
return setCodes(KOREAN, UPRV_LENGTHOF(KOREAN), scripts, capacity, err);
|
||||
}
|
||||
if (lang == "zh" && script == "Hant") {
|
||||
return setCodes(HAN_BOPO, UPRV_LENGTHOF(HAN_BOPO), scripts, capacity, err);
|
||||
}
|
||||
// Explicit script code.
|
||||
if (!script.isEmpty()) {
|
||||
UScriptCode scriptCode = static_cast<UScriptCode>(u_getPropertyValueEnum(UCHAR_SCRIPT, script.data()));
|
||||
if(scriptCode != USCRIPT_INVALID_CODE) {
|
||||
if(scriptCode == USCRIPT_SIMPLIFIED_HAN || scriptCode == USCRIPT_TRADITIONAL_HAN) {
|
||||
scriptCode = USCRIPT_HAN;
|
||||
}
|
||||
return setOneCode(scriptCode, scripts, capacity, err);
|
||||
}
|
||||
}
|
||||
return 0;
|
||||
}
|
||||
|
||||
/* TODO: this is a bad API and should be deprecated, ticket #11141 */
|
||||
U_CAPI int32_t U_EXPORT2
|
||||
uscript_getCode(const char* nameOrAbbrOrLocale,
|
||||
UScriptCode* fillIn,
|
||||
int32_t capacity,
|
||||
UErrorCode* err){
|
||||
UBool triedCode;
|
||||
UErrorCode internalErrorCode;
|
||||
int32_t length;
|
||||
|
||||
if(U_FAILURE(*err)) {
|
||||
return 0;
|
||||
}
|
||||
if(nameOrAbbrOrLocale==nullptr ||
|
||||
(fillIn == nullptr ? capacity != 0 : capacity < 0)) {
|
||||
*err = U_ILLEGAL_ARGUMENT_ERROR;
|
||||
return 0;
|
||||
}
|
||||
|
||||
triedCode = false;
|
||||
const char* lastSepPtr = uprv_strrchr(nameOrAbbrOrLocale, '-');
|
||||
if (lastSepPtr==nullptr) {
|
||||
lastSepPtr = uprv_strrchr(nameOrAbbrOrLocale, '_');
|
||||
}
|
||||
// Favor interpretation of nameOrAbbrOrLocale as a script alias if either
|
||||
// 1. nameOrAbbrOrLocale does not contain -/_. Handles Han, Mro, Nko, etc.
|
||||
// 2. The last instance of -/_ is at offset 3, and the portion after that is
|
||||
// longer than 4 characters (i.e. not a script or region code). This handles
|
||||
// Old_Hungarian, Old_Italic, etc. ("old" is a valid language code)
|
||||
// 3. The last instance of -/_ is at offset 7, and the portion after that is
|
||||
// 3 characters. This handles New_Tai_Lue ("new" is a valid language code).
|
||||
if (lastSepPtr==nullptr
|
||||
|| (lastSepPtr-nameOrAbbrOrLocale == 3 && uprv_strlen(nameOrAbbrOrLocale) > 8)
|
||||
|| (lastSepPtr-nameOrAbbrOrLocale == 7 && uprv_strlen(nameOrAbbrOrLocale) == 11) ) {
|
||||
/* try long and abbreviated script names first */
|
||||
UScriptCode code = (UScriptCode) u_getPropertyValueEnum(UCHAR_SCRIPT, nameOrAbbrOrLocale);
|
||||
if(code!=USCRIPT_INVALID_CODE) {
|
||||
return setOneCode(code, fillIn, capacity, err);
|
||||
}
|
||||
triedCode = true;
|
||||
}
|
||||
internalErrorCode = U_ZERO_ERROR;
|
||||
length = getCodesFromLocale(nameOrAbbrOrLocale, fillIn, capacity, err);
|
||||
if(U_FAILURE(*err) || length != 0) {
|
||||
return length;
|
||||
}
|
||||
icu::CharString likely = ulocimp_addLikelySubtags(nameOrAbbrOrLocale, internalErrorCode);
|
||||
if(U_SUCCESS(internalErrorCode) && internalErrorCode != U_STRING_NOT_TERMINATED_WARNING) {
|
||||
length = getCodesFromLocale(likely.data(), fillIn, capacity, err);
|
||||
if(U_FAILURE(*err) || length != 0) {
|
||||
return length;
|
||||
}
|
||||
}
|
||||
if(!triedCode) {
|
||||
/* still not found .. try long and abbreviated script names again */
|
||||
UScriptCode code = (UScriptCode) u_getPropertyValueEnum(UCHAR_SCRIPT, nameOrAbbrOrLocale);
|
||||
if(code!=USCRIPT_INVALID_CODE) {
|
||||
return setOneCode(code, fillIn, capacity, err);
|
||||
}
|
||||
}
|
||||
return 0;
|
||||
}
|
Reference in New Issue
Block a user