#include <string.h>
#include "unicode/utypes.h"
#include "unicode/uscript.h"
#include "unicode/uchar.h"
#include "cintltst.h"
#include "cucdapi.h"
#define LENGTHOF(array) (int32_t)(sizeof(array)/sizeof(array[0]))
void TestUScriptCodeAPI(){
int i =0;
int numErrors =0;
{
const char* testNames[]={
"en", "en_US", "sr", "ta" , "te_IN",
"hi", "he", "ar",
"Hani", "Hang","Hebr","Hira",
"Knda","Kana","Khmr","Lao",
"Latn",
"Mlym", "Mong",
"CYRILLIC","DESERET","DEVANAGARI","ETHIOPIC","GEORGIAN",
"GOTHIC", "GREEK", "GUJARATI", "COMMON", "INHERITED",
"malayalam", "mongolian", "myanmar", "ogham", "old-italic",
"oriya", "runic", "sinhala", "syriac","tamil",
"telugu", "thaana", "thai", "tibetan",
"tagb", "arabic",
"asfdasd", "5464", "12235",
"zyyy", "YI",
'\0'
};
UScriptCode expected[] ={
USCRIPT_LATIN, USCRIPT_LATIN, USCRIPT_CYRILLIC, USCRIPT_TAMIL, USCRIPT_TELUGU,
USCRIPT_DEVANAGARI, USCRIPT_HEBREW, USCRIPT_ARABIC,
USCRIPT_HAN, USCRIPT_HANGUL, USCRIPT_HEBREW, USCRIPT_HIRAGANA,
USCRIPT_KANNADA, USCRIPT_KATAKANA, USCRIPT_KHMER, USCRIPT_LAO,
USCRIPT_LATIN,
USCRIPT_MALAYALAM, USCRIPT_MONGOLIAN,
USCRIPT_CYRILLIC, USCRIPT_DESERET, USCRIPT_DEVANAGARI, USCRIPT_ETHIOPIC, USCRIPT_GEORGIAN,
USCRIPT_GOTHIC, USCRIPT_GREEK, USCRIPT_GUJARATI, USCRIPT_COMMON, USCRIPT_INHERITED,
USCRIPT_MALAYALAM, USCRIPT_MONGOLIAN, USCRIPT_MYANMAR, USCRIPT_OGHAM, USCRIPT_OLD_ITALIC,
USCRIPT_ORIYA, USCRIPT_RUNIC, USCRIPT_SINHALA, USCRIPT_SYRIAC, USCRIPT_TAMIL,
USCRIPT_TELUGU, USCRIPT_THAANA, USCRIPT_THAI, USCRIPT_TIBETAN,
USCRIPT_TAGBANWA, USCRIPT_ARABIC,
USCRIPT_INVALID_CODE, USCRIPT_INVALID_CODE, USCRIPT_INVALID_CODE,
USCRIPT_COMMON, USCRIPT_YI,
};
UErrorCode err = U_ZERO_ERROR;
const int32_t capacity = 10;
for( ; testNames[i]!='\0'; i++){
UScriptCode script[10]={USCRIPT_INVALID_CODE};
uscript_getCode(testNames[i],script,capacity, &err);
if( script[0] != expected[i]){
log_err("Error getting script code Got: %i Expected: %i for name %s\n",
script[0],expected[i],testNames[i]);
numErrors++;
}
}
if(numErrors >0 ){
log_data_err("Errors uchar_getScriptCode() : %i \n",numErrors);
}
}
{
UErrorCode err = U_ZERO_ERROR;
int32_t capacity=0;
int32_t j;
UScriptCode jaCode[]={USCRIPT_KATAKANA, USCRIPT_HIRAGANA, USCRIPT_HAN };
UScriptCode script[10]={USCRIPT_INVALID_CODE};
int32_t num = uscript_getCode("ja",script,capacity, &err);
if(err==U_BUFFER_OVERFLOW_ERROR){
err = U_ZERO_ERROR;
capacity = 10;
num = uscript_getCode("ja",script,capacity, &err);
if(num!=(sizeof(jaCode)/sizeof(UScriptCode))){
log_err("Errors uscript_getScriptCode() for Japanese locale: num=%d, expected %d \n",
num, (sizeof(jaCode)/sizeof(UScriptCode)));
}
for(j=0;j<sizeof(jaCode)/sizeof(UScriptCode);j++) {
if(script[j]!=jaCode[j]) {
log_err("Japanese locale: code #%d was %d (%s) but expected %d (%s)\n", j,
script[j], uscript_getName(script[j]),
jaCode[j], uscript_getName(jaCode[j]));
}
}
}else{
log_data_err("Errors in uscript_getScriptCode() expected error : %s got: %s \n",
"U_BUFFER_OVERFLOW_ERROR",
u_errorName(err));
}
}
{
UScriptCode testAbbr[]={
USCRIPT_CYRILLIC, USCRIPT_DESERET, USCRIPT_DEVANAGARI, USCRIPT_ETHIOPIC, USCRIPT_GEORGIAN,
USCRIPT_GOTHIC, USCRIPT_GREEK, USCRIPT_GUJARATI,
};
const char* expectedNames[]={
"Cyrillic","Deseret","Devanagari","Ethiopic","Georgian",
"Gothic", "Greek", "Gujarati",
'\0'
};
i=0;
while(i<sizeof(testAbbr)/sizeof(UScriptCode)){
const char* name = uscript_getName(testAbbr[i]);
if(name == NULL) {
log_data_err("Couldn't get script name\n");
return;
}
numErrors=0;
if(strcmp(expectedNames[i],name)!=0){
log_err("Error getting abbreviations Got: %s Expected: %s\n",name,expectedNames[i]);
numErrors++;
}
if(numErrors > 0){
if(numErrors >0 ){
log_err("Errors uchar_getScriptAbbr() : %i \n",numErrors);
}
}
i++;
}
}
{
UScriptCode testAbbr[]={
USCRIPT_HAN, USCRIPT_HANGUL, USCRIPT_HEBREW, USCRIPT_HIRAGANA,
USCRIPT_KANNADA, USCRIPT_KATAKANA, USCRIPT_KHMER, USCRIPT_LAO,
USCRIPT_LATIN,
USCRIPT_MALAYALAM, USCRIPT_MONGOLIAN,
};
const char* expectedAbbr[]={
"Hani", "Hang","Hebr","Hira",
"Knda","Kana","Khmr","Laoo",
"Latn",
"Mlym", "Mong",
'\0'
};
i=0;
while(i<sizeof(testAbbr)/sizeof(UScriptCode)){
const char* name = uscript_getShortName(testAbbr[i]);
numErrors=0;
if(strcmp(expectedAbbr[i],name)!=0){
log_err("Error getting abbreviations Got: %s Expected: %s\n",name,expectedAbbr[i]);
numErrors++;
}
if(numErrors > 0){
if(numErrors >0 ){
log_err("Errors uchar_getScriptAbbr() : %i \n",numErrors);
}
}
i++;
}
}
{
uint32_t codepoints[] = {
0x0000FF9D,
0x0000FFBE,
0x0000FFC7,
0x0000FFCF,
0x0000FFD7,
0x0000FFDC,
0x00010300,
0x00010330,
0x0001034A,
0x00010400,
0x00010428,
0x0001D167,
0x0001D17B,
0x0001D185,
0x0001D1AA,
0x00020000,
0x00000D02,
0x00000D00,
0x00000000,
0x0001D169,
0x0001D182,
0x0001D18B,
0x0001D1AD,
};
UScriptCode expected[] = {
USCRIPT_KATAKANA ,
USCRIPT_HANGUL ,
USCRIPT_HANGUL ,
USCRIPT_HANGUL ,
USCRIPT_HANGUL ,
USCRIPT_HANGUL ,
USCRIPT_OLD_ITALIC,
USCRIPT_GOTHIC ,
USCRIPT_GOTHIC ,
USCRIPT_DESERET ,
USCRIPT_DESERET ,
USCRIPT_INHERITED,
USCRIPT_INHERITED,
USCRIPT_INHERITED,
USCRIPT_INHERITED,
USCRIPT_HAN ,
USCRIPT_MALAYALAM,
USCRIPT_UNKNOWN,
USCRIPT_COMMON,
USCRIPT_INHERITED ,
USCRIPT_INHERITED ,
USCRIPT_INHERITED ,
USCRIPT_INHERITED ,
};
UScriptCode code = USCRIPT_INVALID_CODE;
UErrorCode status = U_ZERO_ERROR;
UBool passed = TRUE;
for(i=0; i<LENGTHOF(codepoints); ++i){
code = uscript_getScript(codepoints[i],&status);
if(U_SUCCESS(status)){
if( code != expected[i] ||
code != (UScriptCode)u_getIntPropertyValue(codepoints[i], UCHAR_SCRIPT)
) {
log_err("uscript_getScript for codepoint \\U%08X failed\n",codepoints[i]);
passed = FALSE;
}
}else{
log_err("uscript_getScript for codepoint \\U%08X failed. Error: %s\n",
codepoints[i],u_errorName(status));
break;
}
}
if(passed==FALSE){
log_err("uscript_getScript failed.\n");
}
}
{
UScriptCode code= USCRIPT_INVALID_CODE;
UErrorCode status = U_ZERO_ERROR;
code = uscript_getScript(0x001D169,&status);
if(code != USCRIPT_INHERITED){
log_err("\\U001D169 is not contained in USCRIPT_INHERITED");
}
}
{
UScriptCode code= USCRIPT_INVALID_CODE;
UErrorCode status = U_ZERO_ERROR;
int32_t err = 0;
for(i = 0; i<=0x10ffff; i++){
code = uscript_getScript(i,&status);
if(code == USCRIPT_INVALID_CODE){
err++;
log_err("uscript_getScript for codepoint \\U%08X failed.\n", i);
}
}
if(err>0){
log_err("uscript_getScript failed for %d codepoints\n", err);
}
}
{
for(i=0; (UScriptCode)i< USCRIPT_CODE_LIMIT; i++){
const char* name = uscript_getName((UScriptCode)i);
if(name==NULL || strcmp(name,"")==0){
log_err("uscript_getName failed for code %i: name is NULL or \"\"\n",i);
}
}
}
{
static const char* expectedLong[] = {
"Balinese", "Batk", "Blis", "Brah", "Cham", "Cirt", "Cyrs", "Egyd", "Egyh", "Egyp",
"Geok", "Hans", "Hant", "Hmng", "Hung", "Inds", "Java", "Kayah_Li", "Latf", "Latg",
"Lepcha", "Lina", "Mand", "Maya", "Mero", "Nko", "Orkh", "Perm", "Phags_Pa", "Phoenician",
"Plrd", "Roro", "Sara", "Syre", "Syrj", "Syrn", "Teng", "Vai", "Visp", "Cuneiform",
"Zxxx", "Unknown",
"Carian", "Jpan", "Lana", "Lycian", "Lydian", "Ol_Chiki", "Rejang", "Saurashtra", "Sgnw", "Sundanese",
"Moon", "Mtei",
"Armi", "Avst", "Cakm", "Kore",
"Kthi", "Mani", "Phli", "Phlp", "Phlv", "Prti", "Samr", "Tavt",
"Zmth", "Zsym",
};
static const char* expectedShort[] = {
"Bali", "Batk", "Blis", "Brah", "Cham", "Cirt", "Cyrs", "Egyd", "Egyh", "Egyp",
"Geok", "Hans", "Hant", "Hmng", "Hung", "Inds", "Java", "Kali", "Latf", "Latg",
"Lepc", "Lina", "Mand", "Maya", "Mero", "Nkoo", "Orkh", "Perm", "Phag", "Phnx",
"Plrd", "Roro", "Sara", "Syre", "Syrj", "Syrn", "Teng", "Vaii", "Visp", "Xsux",
"Zxxx", "Zzzz",
"Cari", "Jpan", "Lana", "Lyci", "Lydi", "Olck", "Rjng", "Saur", "Sgnw", "Sund",
"Moon", "Mtei",
"Armi", "Avst", "Cakm", "Kore",
"Kthi", "Mani", "Phli", "Phlp", "Phlv", "Prti", "Samr", "Tavt",
"Zmth", "Zsym",
};
int32_t j = 0;
for(i=USCRIPT_BALINESE; (UScriptCode)i<USCRIPT_CODE_LIMIT; i++, j++){
const char* name = uscript_getName((UScriptCode)i);
if(name==NULL || strcmp(name,expectedLong[j])!=0){
log_err("uscript_getName failed for code %i: %s!=%s\n", i, name, expectedLong[j]);
}
name = uscript_getShortName((UScriptCode)i);
if(name==NULL || strcmp(name,expectedShort[j])!=0){
log_err("uscript_getShortName failed for code %i: %s!=%s\n", i, name, expectedShort[j]);
}
}
for(i=0; i<LENGTHOF(expectedLong); i++){
UScriptCode fillIn[5] = {USCRIPT_INVALID_CODE};
UErrorCode status = U_ZERO_ERROR;
int32_t len = 0;
len = uscript_getCode(expectedShort[i], fillIn, LENGTHOF(fillIn), &status);
if(U_FAILURE(status)){
log_err("uscript_getCode failed for script name %s. Error: %s\n",expectedShort[i], u_errorName(status));
}
if(len>1){
log_err("uscript_getCode did not return expected number of codes for script %s. EXPECTED: 1 GOT: %i\n", expectedShort[i], len);
}
if(fillIn[0]!= (UScriptCode)(USCRIPT_BALINESE+i)){
log_err("uscript_getCode did not return expected code for script %s. EXPECTED: %i GOT: %i\n", expectedShort[i], (USCRIPT_BALINESE+i), fillIn[0] );
}
}
}
}
void TestBinaryValues() {
static const char *const falseValues[]={ "N", "No", "F", "False" };
static const char *const trueValues[]={ "Y", "Yes", "T", "True" };
int32_t i;
for(i=0; i<LENGTHOF(falseValues); ++i) {
if(FALSE!=u_getPropertyValueEnum(UCHAR_ALPHABETIC, falseValues[i])) {
log_err("u_getPropertyValueEnum(UCHAR_ALPHABETIC, \"%s\")!=FALSE\n", falseValues[i]);
}
}
for(i=0; i<LENGTHOF(trueValues); ++i) {
if(TRUE!=u_getPropertyValueEnum(UCHAR_ALPHABETIC, trueValues[i])) {
log_err("u_getPropertyValueEnum(UCHAR_ALPHABETIC, \"%s\")!=TRUE\n", trueValues[i]);
}
}
}