// © 2016 and later: Unicode, Inc. and others. // License & terms of use: http://www.unicode.org/copyright.html /******************************************************************** * COPYRIGHT: * Copyright (c) 1998-2016, International Business Machines Corporation and * others. All Rights Reserved. ********************************************************************/ /* * File udatatst.c * * Modification History: * * Date Name Description * 02/22/2000 Madhu Creation ****************************************************************************** */ #include "unicode/utypes.h" #include "unicode/putil.h" #include "unicode/udata.h" #include "unicode/ucal.h" #include "unicode/uchar.h" #include "unicode/ucnv.h" #include "unicode/ures.h" #include "unicode/ustring.h" #include "unicode/uclean.h" #include "cmemory.h" #include "cstring.h" #include "filestrm.h" #include "udatamem.h" #include "cintltst.h" #include "ubrkimpl.h" #include "toolutil.h" /* for uprv_fileExists() */ #include #include /* includes for TestSwapData() */ #include "udataswp.h" /* swapping implementations in common */ #include "uresdata.h" #include "ucnv_io.h" #include "uprops.h" #include "ucase.h" #include "ucol_imp.h" #include "ucol_swp.h" #include "ucnv_bld.h" #include "sprpimpl.h" #include "rbbidata.h" /* swapping implementation in i18n */ #include "uspoof_impl.h" U_CAPI int32_t U_EXPORT2 unorm2_swap(const UDataSwapper *ds, const void *inData, int32_t length, void *outData, UErrorCode *pErrorCode); /* other definitions and prototypes */ #if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION static void TestUDataOpen(void); static void TestUDataOpenChoiceDemo1(void); static void TestUDataOpenChoiceDemo2(void); static void TestUDataGetInfo(void); static void TestUDataGetMemory(void); static void TestErrorConditions(void); static void TestAppData(void); static void TestSwapData(void); #endif static void TestUDataSetAppData(void); static void TestICUDataName(void); static void PointerTableOfContents(void); static void SetBadCommonData(void); static void TestUDataFileAccess(void); #if !UCONFIG_NO_FORMATTING && !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION static void TestTZDataDir(void); #endif void addUDataTest(TestNode** root); void addUDataTest(TestNode** root) { #if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION addTest(root, &TestUDataOpen, "udatatst/TestUDataOpen" ); addTest(root, &TestUDataOpenChoiceDemo1, "udatatst/TestUDataOpenChoiceDemo1"); addTest(root, &TestUDataOpenChoiceDemo2, "udatatst/TestUDataOpenChoiceDemo2"); addTest(root, &TestUDataGetInfo, "udatatst/TestUDataGetInfo" ); addTest(root, &TestUDataGetMemory, "udatatst/TestUDataGetMemory" ); addTest(root, &TestErrorConditions, "udatatst/TestErrorConditions"); addTest(root, &TestAppData, "udatatst/TestAppData" ); addTest(root, &TestSwapData, "udatatst/TestSwapData" ); #endif addTest(root, &TestUDataSetAppData, "udatatst/TestUDataSetAppData" ); addTest(root, &TestICUDataName, "udatatst/TestICUDataName" ); addTest(root, &PointerTableOfContents, "udatatst/PointerTableOfContents" ); addTest(root, &SetBadCommonData, "udatatst/SetBadCommonData" ); addTest(root, &TestUDataFileAccess, "udatatst/TestUDataFileAccess" ); #if !UCONFIG_NO_FORMATTING && !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION addTest(root, &TestTZDataDir, "udatatst/TestTZDataDir" ); #endif } #if 0 static void lots_of_mallocs() { int q; for(q=1;q<100;q++) { free(malloc(q)); malloc(q*2); } } #endif #if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION static void TestUDataOpen(){ UDataMemory *result; UErrorCode status=U_ZERO_ERROR; const char* memMap[][2]={ {"root", "res"}, {"cnvalias", "icu"}, {"unames", "icu"}, {"ibm-37_P100-1995", "cnv"} }; const char* name = "test"; const char* type = "icu"; const char dirSepString[] = {U_FILE_SEP_CHAR, 0}; const char pathSepString[] = {U_PATH_SEP_CHAR, 0}; char* path=(char*)malloc(sizeof(char) * (strlen(ctest_dataOutDir()) + strlen(U_ICUDATA_NAME) + strlen("/build/tmp/..")+1 ) ); char *icuDataFilePath = 0; const char* testPath=loadTestData(&status); if(U_FAILURE(status)) { log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status)); free(path); return; } /* lots_of_mallocs(); */ log_verbose("Testing udata_open(%s)\n", testPath); result=udata_open(testPath, type, name, &status); if(U_FAILURE(status)){ log_data_err("FAIL: udata_open() failed for path = %s, name=%s, type=%s, \n errorcode=%s\n", testPath, name, type, myErrorName(status)); } else { log_verbose("PASS: udata_open worked\n"); udata_close(result); } { strcat(strcpy(path, ctest_dataOutDir()), U_ICUDATA_NAME); /* If the ICU system common data file is present in this confiugration, * verify that udata_open can explicitly fetch items from it. * If packaging mode == dll, the file may not exist. So, if the file is * missing, skip this test without error. */ icuDataFilePath = (char *)uprv_malloc(strlen(path) + 10); strcpy(icuDataFilePath, path); strcat(icuDataFilePath, ".dat"); /* lots_of_mallocs(); */ if (uprv_fileExists(icuDataFilePath)) { int i; log_verbose("Testing udata_open() on %s\n", icuDataFilePath); for(i=0; isize>=20 && pInfo->isBigEndian==U_IS_BIG_ENDIAN && pInfo->charsetFamily==U_CHARSET_FAMILY && pInfo->dataFormat[0]==0x43 && /* dataFormat="CvAl" */ pInfo->dataFormat[1]==0x76 && pInfo->dataFormat[2]==0x41 && pInfo->dataFormat[3]==0x6c && pInfo->formatVersion[0]==3 ) { log_verbose("The data from \"%s.%s\" IS acceptable using the verifing function isAcceptable1()\n", name, type); return TRUE; } else { log_verbose("The data from \"%s.%s\" IS NOT acceptable using the verifing function isAcceptable1():-\n" "\tsize = %d\n" "\tisBigEndian = %d\n" "\tcharsetFamily = %d\n" "\tformatVersion[0] = %d\n" "\tdataVersion[0] = %d\n" "\tdataFormat = %c%c%c%c\n", name, type, pInfo->size, pInfo->isBigEndian, pInfo->charsetFamily, pInfo->formatVersion[0], pInfo->dataVersion[0], pInfo->dataFormat[0], pInfo->dataFormat[1], pInfo->dataFormat[2], pInfo->dataFormat[3]); log_verbose("Call another verifing function to accept the data\n"); return FALSE; } } static UBool U_CALLCONV isAcceptable2(void *context, const char *type, const char *name, const UDataInfo *pInfo){ (void)context; // suppress compiler warnings about unused variable UVersionInfo unicodeVersion; u_getUnicodeVersion(unicodeVersion); if( pInfo->size>=20 && pInfo->isBigEndian==U_IS_BIG_ENDIAN && pInfo->charsetFamily==U_CHARSET_FAMILY && pInfo->dataFormat[0]==0x75 && /* dataFormat="unam" */ pInfo->dataFormat[1]==0x6e && pInfo->dataFormat[2]==0x61 && pInfo->dataFormat[3]==0x6d && pInfo->formatVersion[0]==1 && pInfo->dataVersion[0]==unicodeVersion[0] ) { log_verbose("The data from \"%s.%s\" IS acceptable using the verifing function isAcceptable2()\n", name, type); return TRUE; } else { log_verbose("The data from \"%s.%s\" IS NOT acceptable using the verifing function isAcceptable2()\n", name, type); return FALSE; } } static UBool U_CALLCONV isAcceptable3(void *context, const char *type, const char *name, const UDataInfo *pInfo){ (void)context; // suppress compiler warnings about unused variable if( pInfo->size>=20 && pInfo->isBigEndian==U_IS_BIG_ENDIAN && pInfo->charsetFamily==U_CHARSET_FAMILY && pInfo->dataFormat[0]==0x54 && /* dataFormat="test" */ pInfo->dataFormat[1]==0x65 && pInfo->dataFormat[2]==0x73 && pInfo->dataFormat[3]==0x74 && pInfo->formatVersion[0]==1 && pInfo->dataVersion[0]==1 ) { log_verbose("The data from \"%s.%s\" IS acceptable using the verifing function isAcceptable3()\n", name, type); return TRUE; } else { log_verbose("The data from \"%s.%s\" IS NOT acceptable using the verifing function isAcceptable3()\n", name, type); return FALSE; } } #if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION static void TestUDataOpenChoiceDemo1() { UDataMemory *result; UErrorCode status=U_ZERO_ERROR; const char* name[]={ "cnvalias", "unames", "test", "nam" }; const char* type="icu"; const char* testPath="testdata"; const char* fullTestDataPath = loadTestData(&status); if(U_FAILURE(status)) { log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status)); return; } result=udata_openChoice(NULL, "icu", name[0], isAcceptable1, NULL, &status); if(U_FAILURE(status)){ log_data_err("FAIL: udata_openChoice() failed name=%s, type=%s, \n errorcode=%s\n", name[0], type, myErrorName(status)); } else { log_verbose("PASS: udata_openChoice worked\n"); udata_close(result); } status=U_ZERO_ERROR; result=udata_openChoice(NULL, type, name[1], isAcceptable1, NULL, &status); if(U_FAILURE(status)){ status=U_ZERO_ERROR; result=udata_openChoice(NULL, type, name[1], isAcceptable2, NULL, &status); if(U_FAILURE(status)){ log_data_err("FAIL: udata_openChoice() failed name=%s, type=%s, \n errorcode=%s\n", name[1], type, myErrorName(status)); } } else { log_err("FAIL: udata_openChoice() unexpectedly passed. name=%s, type=%s, \n errorcode=%s\n", name[1], type, myErrorName(status)); } if(U_SUCCESS(status)){ udata_close(result); } status=U_ZERO_ERROR; result=udata_openChoice(testPath, type, name[2], isAcceptable1, NULL, &status); if(U_FAILURE(status)){ status=U_ZERO_ERROR; result=udata_openChoice(testPath, type, name[2], isAcceptable3, NULL, &status); if(U_FAILURE(status)){ log_data_err("FAIL: udata_openChoice() failed path=%s name=%s, type=%s, \n errorcode=%s\n", testPath, name[2], type, myErrorName(status)); } } else { log_err("FAIL: udata_openChoice() unexpectedly passed. name=%s, type=%s, \n errorcode=%s\n", name[2], type, myErrorName(status)); } if(U_SUCCESS(status)){ udata_close(result); } status=U_ZERO_ERROR; type="typ"; result=udata_openChoice(fullTestDataPath, type, name[3], isAcceptable1, NULL, &status); if(status != U_INVALID_FORMAT_ERROR){ // Android-changed: Android does not try to load ICU data from other files. See gDataFileAccess = UDATA_NO_FILES in udata.cpp. // log_err("FAIL: udata_openChoice() did not fail as expected. name=%s, type=%s, \n errorcode=%s\n", name[3], type, myErrorName(status)); log_data_err("FAIL: udata_openChoice() did not fail as expected. name=%s, type=%s, \n errorcode=%s\n", name[3], type, myErrorName(status)); } status=U_USELESS_COLLATOR_ERROR; result=udata_openChoice(fullTestDataPath, type, name[3], isAcceptable1, NULL, &status); if(status != U_USELESS_COLLATOR_ERROR){ // Android-changed: Android does not try to load ICU data from other files. See gDataFileAccess = UDATA_NO_FILES in udata.cpp. // log_err("FAIL: udata_openChoice() did not fail as expected. name=%s, type=%s, \n errorcode=%s\n", name[3], type, myErrorName(status)); log_data_err("FAIL: udata_openChoice() did not fail as expected. name=%s, type=%s, \n errorcode=%s\n", name[3], type, myErrorName(status)); } } static UBool U_CALLCONV isAcceptable(void *context, const char *type, const char *name, const UDataInfo *pInfo){ if( pInfo->size>=20 && pInfo->isBigEndian==U_IS_BIG_ENDIAN && pInfo->charsetFamily==U_CHARSET_FAMILY && pInfo->dataFormat[0]==0x54 && /* dataFormat="test" */ pInfo->dataFormat[1]==0x65 && pInfo->dataFormat[2]==0x73 && pInfo->dataFormat[3]==0x74 && pInfo->formatVersion[0]==1 && pInfo->dataVersion[0]==1 && *((int*)context) == 2 ) { log_verbose("The data from\"%s.%s\" IS acceptable using the verifing function isAcceptable()\n", name, type); return TRUE; } else { log_verbose("The data from \"%s.%s\" IS NOT acceptable using the verifing function isAcceptable()\n", name, type); return FALSE; } } /* This test checks to see if the isAcceptable function is being called correctly. */ static void TestUDataOpenChoiceDemo2() { UDataMemory *result; UErrorCode status=U_ZERO_ERROR; int i; int p=2; const char* name="test"; const char* type="icu"; const char* path = loadTestData(&status); if(U_FAILURE(status)) { log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status)); return; } result=udata_openChoice(path, type, name, isAcceptable, &p, &status); if(U_FAILURE(status)){ log_data_err("failed to load data at p=%s t=%s n=%s, isAcceptable", path, type, name); } if(U_SUCCESS(status) ) { udata_close(result); } p=0; for(i=0;i<2; i++){ result=udata_openChoice(path, type, name, isAcceptable, &p, &status); if(p<2) { if(U_FAILURE(status) && status==U_INVALID_FORMAT_ERROR){ log_verbose("Loads the data but rejects it as expected %s\n", myErrorName(status)); status=U_ZERO_ERROR; p++; } else { log_data_err("FAIL: failed to either load the data or to reject the loaded data. ERROR=%s\n", myErrorName(status) ); } } else if(p == 2) { if(U_FAILURE(status)) { log_data_err("FAIL: failed to load the data and accept it. ERROR=%s\n", myErrorName(status) ); } else { log_verbose("Loads the data and accepts it for p==2 as expected\n"); udata_close(result); } } } } static void TestUDataGetInfo() { UDataMemory *result; /* UDataInfo cf. udata.h */ static UDataInfo dataInfo={ 30, /*sizeof(UDataInfo),*/ 0, U_IS_BIG_ENDIAN, U_CHARSET_FAMILY, sizeof(UChar), 0, {0x54, 0x65, 0x73, 0x74}, /* dataFormat="Test" */ {9, 0, 0, 0}, /* formatVersion */ {4, 0, 0, 0} /* dataVersion */ }; UErrorCode status=U_ZERO_ERROR; const char* name="cnvalias"; const char* name2="test"; const char* type="icu"; const char* testPath=loadTestData(&status); if(U_FAILURE(status)) { log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status)); return; } log_verbose("Testing udata_getInfo() for cnvalias.icu\n"); result=udata_open(NULL, "icu", name, &status); if(U_FAILURE(status)){ log_data_err("FAIL: udata_open() failed for path = NULL, name=%s, type=%s, \n errorcode=%s\n", name, type, myErrorName(status)); return; } udata_getInfo(result, &dataInfo); if(dataInfo.size==20 && dataInfo.size!=30 && dataInfo.isBigEndian==U_IS_BIG_ENDIAN && dataInfo.charsetFamily==U_CHARSET_FAMILY && dataInfo.dataFormat[0]==0x43 && dataInfo.dataFormat[0]!=0x54 && /* dataFormat="CvAl" and not "Test". The values are set for cnvalias.dat*/ dataInfo.dataFormat[1]==0x76 && dataInfo.dataFormat[1]!=0x65 && dataInfo.dataFormat[2]==0x41 && dataInfo.dataFormat[2]!=0x73 && dataInfo.dataFormat[3]==0x6c && dataInfo.dataFormat[3]!=0x74 && dataInfo.formatVersion[0]!=9 && /*formatVersion is also set to the one for cnvalias*/ dataInfo.dataVersion[0]!=4 && /*dataVersion*/ dataInfo.dataVersion[1]!=0 ){ log_verbose("PASS: udata_getInfo() filled in the right values\n"); } else { log_err("FAIL: udata_getInfo() filled in the wrong values\n"); } udata_close(result); log_verbose("Testing udata_getInfo() for test.icu\n"); result=udata_open(testPath, type, name2, &status); if(U_FAILURE(status)) { log_data_err("FAIL: udata_open() failed for path=%s name2=%s, type=%s, \n errorcode=%s\n", testPath, name2, type, myErrorName(status)); return; } udata_getInfo(result, &dataInfo); if(dataInfo.size==20 && dataInfo.isBigEndian==U_IS_BIG_ENDIAN && dataInfo.charsetFamily==U_CHARSET_FAMILY && dataInfo.dataFormat[0]==0x54 && /* dataFormat="Test". The values are set for test.dat*/ dataInfo.dataFormat[1]==0x65 && dataInfo.dataFormat[2]==0x73 && dataInfo.dataFormat[3]==0x74 && dataInfo.formatVersion[0]==1 && /*formatVersion is also set to the one for test*/ dataInfo.dataVersion[0]==1 && /*dataVersion*/ dataInfo.dataVersion[1]==0 ) { log_verbose("PASS: udata_getInfo() filled in the right values\n"); } else { log_err("FAIL: udata_getInfo() filled in the wrong values\n"); } udata_close(result); } static void TestUDataGetMemory() { UDataMemory *result; const int32_t *table=NULL; uint16_t* intValue=0; UErrorCode status=U_ZERO_ERROR; const char* name="cnvalias"; const char* type; const char* name2="test"; const char* testPath = loadTestData(&status); if(U_FAILURE(status)) { log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status)); return; } type="icu"; log_verbose("Testing udata_getMemory() for \"cnvalias.icu\"\n"); result=udata_openChoice(NULL, type, name, isAcceptable1, NULL, &status); if(U_FAILURE(status)){ log_data_err("FAIL: udata_openChoice() failed for name=%s, type=%s, \n errorcode=%s\n", name, type, myErrorName(status)); return; } table=(const int32_t *)udata_getMemory(result); /* The alias table may list more converters than what's actually available now. [grhoten] */ if(ucnv_countAvailable() > table[1]) /*???*/ log_err("FAIL: udata_getMemory() failed ucnv_countAvailable returned = %d, expected = %d\n", ucnv_countAvailable(), table[1+2*(*table)]); udata_close(result); type="icu"; log_verbose("Testing udata_getMemory for \"test.icu\"()\n"); result=udata_openChoice(testPath, type, name2, isAcceptable3, NULL, &status); if(U_FAILURE(status)){ log_data_err("FAIL: udata_openChoice() failed for path=%s name=%s, type=%s, \n errorcode=%s\n", testPath, name2, type, myErrorName(status)); return; } intValue=(uint16_t *)udata_getMemory(result); /*printf("%d ..... %s", *(intValue), intValue+1));*/ if( *intValue != 2000 || strcmp((char*)(intValue+1), "YEAR") != 0 ) log_err("FAIL: udata_getMemory() failed: intValue :- Expected:2000 Got:%d \n\tstringValue:- Expected:YEAR Got:%s\n", *intValue, (intValue+1)); udata_close(result); } static void TestErrorConditions(){ UDataMemory *result=NULL; UErrorCode status=U_ZERO_ERROR; uint16_t* intValue=0; static UDataInfo dataInfo={ 30, /*sizeof(UDataInfo),*/ 0, U_IS_BIG_ENDIAN, U_CHARSET_FAMILY, sizeof(UChar), 0, {0x54, 0x65, 0x73, 0x74}, /* dataFormat="Test" */ {9, 0, 0, 0}, /* formatVersion */ {4, 0, 0, 0} /* dataVersion */ }; const char* name = "test"; const char* type="icu"; const char *testPath = loadTestData(&status); if(U_FAILURE(status)) { log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status)); return; } status = U_ILLEGAL_ARGUMENT_ERROR; /*Try udata_open with status != U_ZERO_ERROR*/ log_verbose("Testing udata_open() with status != U_ZERO_ERROR\n"); result=udata_open(testPath, type, name, &status); if(result != NULL){ log_data_err("FAIL: udata_open() is supposed to fail for path = %s, name=%s, type=%s, \n errorcode !=U_ZERO_ERROR\n", testPath, name, type); udata_close(result); } else { log_verbose("PASS: udata_open with errorCode != U_ZERO_ERROR failed as expected\n"); } /*Try udata_open with data name=NULL*/ log_verbose("Testing udata_open() with data name=NULL\n"); status=U_ZERO_ERROR; result=udata_open(testPath, type, NULL, &status); if(U_FAILURE(status)){ if(status != U_ILLEGAL_ARGUMENT_ERROR || result != NULL){ log_err("FAIL: udata_open() with name=NULL should return NULL and errocode U_ILLEGAL_ARGUMENT_ERROR, GOT: errorcode=%s\n", myErrorName(status)); }else{ log_verbose("PASS: udata_open with name=NULL failed as expected and errorcode = %s as expected\n", myErrorName(status)); } }else{ log_err("FAIL: udata_open() with data name=NULL is supposed to fail for path = %s, name=NULL type=%s errorcode=U_ZERO_ERROR \n", testPath, type); udata_close(result); } /*Try udata_openChoice with status != U_ZERO_ERROR*/ log_verbose("Testing udata_openChoice() with status != U_ZERO_ERROR\n"); status=U_ILLEGAL_ARGUMENT_ERROR; result=udata_openChoice(testPath, type, name, isAcceptable3, NULL, &status); if(result != NULL){ log_err("FAIL: udata_openChoice() is supposed to fail for path = %s, name=%s, type=%s, \n errorcode != U_ZERO_ERROR\n", testPath, name, type); udata_close(result); } else { log_verbose("PASS: udata_openChoice() with errorCode != U_ZERO_ERROR failed as expected\n"); } /*Try udata_open with data name=NULL*/ log_verbose("Testing udata_openChoice() with data name=NULL\n"); status=U_ZERO_ERROR; result=udata_openChoice(testPath, type, NULL, isAcceptable3, NULL, &status); if(U_FAILURE(status)){ if(status != U_ILLEGAL_ARGUMENT_ERROR || result != NULL){ log_err("FAIL: udata_openChoice() with name=NULL should return NULL and errocode U_ILLEGAL_ARGUMENT_ERROR, GOT: errorcode=%s\n", myErrorName(status)); }else{ log_verbose("PASS: udata_openChoice with name=NULL failed as expected and errorcode = %s as expected\n", myErrorName(status)); } }else{ log_err("FAIL: udata_openChoice() with data name=NULL is supposed to fail for path = %s, name=NULL type=%s errorcode=U_ZERO_ERROR \n", testPath, type); udata_close(result); } /*Try udata_getMemory with UDataMemory=NULL*/ log_verbose("Testing udata_getMemory with UDataMemory=NULL\n"); intValue=(uint16_t*)udata_getMemory(NULL); if(intValue != NULL){ log_err("FAIL: udata_getMemory with UDataMemory = NULL is supposed to fail\n"); } /*Try udata_getInfo with UDataMemory=NULL*/ status=U_ZERO_ERROR; udata_getInfo(NULL, &dataInfo); if(dataInfo.size != 0){ log_err("FAIL : udata_getInfo with UDataMemory = NULL us supposed to fail\n"); } /*Try udata_openChoice with a non existing binary file*/ log_verbose("Testing udata_openChoice() with a non existing binary file\n"); result=udata_openChoice(testPath, "tst", "nonexist", isAcceptable3, NULL, &status); if(status==U_FILE_ACCESS_ERROR){ log_verbose("Opening udata_openChoice with non-existing file handled correctly.\n"); status=U_ZERO_ERROR; } else { log_err("calling udata_open with non-existing file not handled correctly\n. Expected: U_FILE_ACCESS_ERROR, Got: %s\n", myErrorName(status)); if(U_SUCCESS(status)) { udata_close(result); } } if(result != NULL){ log_err("calling udata_open with non-existing file didn't return a null value\n"); } else { log_verbose("calling udat_open with non-existing file returned null as expected\n"); } } /* Test whether apps and ICU can each have their own root.res */ static void TestAppData() { UResourceBundle *icu, *app; UResourceBundle *tmp = NULL; UResourceBundle *tmp2 = NULL; const UChar *appString; const UChar *icuString; int32_t len; UErrorCode status = U_ZERO_ERROR; char testMsgBuf[256]; const char* testPath=loadTestData(&status); if(U_FAILURE(status)) { log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status)); return; } icu = ures_open(NULL, "root", &status); if(U_FAILURE(status)) { log_data_err("%s:%d: Couldn't open root ICU bundle- %s", __FILE__, __LINE__, u_errorName(status)); return; } /* log_info("Open icu root: %s size_%d\n", u_errorName(status), ures_getSize(icu)); */ status = U_ZERO_ERROR; app = ures_open(testPath, "root", &status); if(U_FAILURE(status)) { log_data_err("%s:%d: Couldn't open app ICU bundle [%s]- %s", __FILE__, __LINE__, testPath, u_errorName(status)); return; } /* log_info("Open app: %s, size %d\n", u_errorName(status), ures_getSize(app)); */ tmp = ures_getByKey(icu, "Version", tmp, &status); if(U_FAILURE(status)) { log_err("%s:%d: Couldn't get Version string from ICU root bundle- %s", __FILE__, __LINE__, u_errorName(status)); return; } icuString = ures_getString(tmp, &len, &status); if(U_FAILURE(status)) { log_err("%s:%d: Couldn't get string from Version string from ICU root bundle- %s", __FILE__, __LINE__, u_errorName(status)); return; } /* log_info("icuString=%p - %s\n", icuString, austrdup(icuString)); */ tmp2 = ures_getByKey(app, "Version", tmp2, &status); if(U_FAILURE(status)) { log_err("%s:%d: Couldn't get Version string from App root bundle- %s", __FILE__, __LINE__, u_errorName(status)); return; } appString = ures_getString(tmp2, &len, &status); if(U_FAILURE(status)) { log_err("%s:%d: Couldn't get string from Version string from App root bundle- %s", __FILE__, __LINE__, u_errorName(status)); return; } /* log_info("appString=%p - %s\n", appString, austrdup(appString)); */ if(!u_strcmp(icuString, appString)) { log_err("%s:%d: Error! Expected ICU and App root version strings to be DIFFERENT but they are both %s and %s\n", __FILE__, __LINE__, austrdup(icuString), austrdup(appString)); } else { log_verbose("%s:%d: appstr=%s, icustr=%s\n", __FILE__, __LINE__, u_austrcpy(testMsgBuf, appString), u_austrcpy(testMsgBuf, icuString)); } ures_close(tmp); ures_close(tmp2); ures_close(icu); ures_close(app); } #endif static void TestICUDataName() { UVersionInfo icuVersion; char expectDataName[20]; unsigned int expectLen = 8; char typeChar = '?'; /* Print out the version # we have .. */ log_verbose("utypes.h says U_ICUDATA_NAME = %s\n", U_ICUDATA_NAME); /* Build up the version # we expect to get */ u_getVersion(icuVersion); switch(U_CHARSET_FAMILY) { case U_ASCII_FAMILY: switch((int)U_IS_BIG_ENDIAN) { case 1: typeChar = 'b'; break; case 0: typeChar = 'l'; break; default: log_err("Expected 1 or 0 for U_IS_BIG_ENDIAN, got %d!\n", (int)U_IS_BIG_ENDIAN); /* return; */ } break; case U_EBCDIC_FAMILY: typeChar = 'e'; break; } /* Only major number is needed. */ sprintf(expectDataName, "%s%d%c", "icudt", (int)icuVersion[0], typeChar); log_verbose("Expected: %s\n", expectDataName); if(uprv_strlen(expectDataName) != expectLen) { log_err("*Expected* length is wrong (test err?), should be %d is %d\n", expectLen, uprv_strlen(expectDataName)); } if(uprv_strlen(U_ICUDATA_NAME) != expectLen) { log_err("U_ICUDATA_NAME length should be %d is %d\n", expectLen, uprv_strlen(U_ICUDATA_NAME)); } if(uprv_strcmp(U_ICUDATA_NAME, expectDataName)) { log_err("U_ICUDATA_NAME should be %s but is %s\n", expectDataName, U_ICUDATA_NAME); } /* ICUDATA_NAME comes from the build system on *nix */ #ifdef ICUDATA_NAME if(uprv_strcmp(U_ICUDATA_NAME, ICUDATA_NAME)) { log_err("ICUDATA_NAME and U_ICUDATA_NAME don't match: " "ICUDATA_NAME=%s, U_ICUDATA_NAME=%s. Check configure.in, icudefs.mk.in, utypes.h...\n", ICUDATA_NAME, U_ICUDATA_NAME); } else { log_verbose("ICUDATA_NAME=%s (from icudefs.mk), U_ICUDATA_NAME=%s (from utypes.h)\n", ICUDATA_NAME, U_ICUDATA_NAME); } #endif } /* test data swapping ------------------------------------------------------- */ #if U_PLATFORM == U_PF_OS400 /* See comments in genccode.c on when this special implementation can be removed. */ static const struct { double bogus; const char *bytes; } gOffsetTOCAppDataItem1={ 0.0, /* alignment bytes */ "\x00\x14" /* sizeof(UDataInfo) *//* MappedData { */ "\xda" "\x27" /* } */ "\x00\x14" /* sizeof(UDataInfo) *//* UDataInfo { */ "\0\0" "\1" /* U_IS_BIG_ENDIAN */ "\1" /* U_CHARSET_FAMILY */ "\2" /* U_SIZEOF_WHAR_T */ "\0" "\x31\x31\x31\x31" "\0\0\0\0" "\0\0\0\0" /* } */ }; #else static const struct { double bogus; MappedData bytes1; UDataInfo bytes2; uint8_t bytes3; } gOffsetTOCAppDataItem1={ 0.0, /* alignment bytes */ { sizeof(UDataInfo), 0xda, 0x27 }, /* MappedData */ {sizeof(UDataInfo), 0, U_IS_BIG_ENDIAN, U_CHARSET_FAMILY, sizeof(UChar), 0, {0x31, 0x31, 0x31, 0x31}, /* dataFormat="1111" */ {0, 0, 0, 0}, /* formatVersion */ {0, 0, 0, 0}}, /* dataVersion */ 0 }; #endif static const UChar gOffsetTOCGarbage[] = { /* "I have been very naughty!" */ 0x49, 0x20, 0x68, 0x61, 0x76, 0x65, 0x20, 0x62, 0x65, 0x65, 0x6E, 0x20, 0x76, 0x65, 0x72, 0x79, 0x20, 0x6E, 0x61, 0x75, 0x67, 0x68, 0x74, 0x79, 0x21 }; /* Original source: icu/source/tools/genccode */ static const struct { uint16_t headerSize; uint8_t magic1, magic2; UDataInfo info; char padding[8]; uint32_t count, reserved; const struct { const char *const name; const void *const data; } toc[3]; } gOffsetTOCAppData_dat = { 32, /* headerSize */ 0xda, /* magic1, (see struct MappedData in udata.c) */ 0x27, /* magic2 */ { /*UDataInfo */ sizeof(UDataInfo), /* size */ 0, /* reserved */ U_IS_BIG_ENDIAN, U_CHARSET_FAMILY, sizeof(UChar), 0, /* reserved */ { /* data format identifier */ 0x54, 0x6f, 0x43, 0x50}, /* "ToCP" */ {1, 0, 0, 0}, /* format version major, minor, milli, micro */ {0, 0, 0, 0} /* dataVersion */ }, {0,0,0,0,0,0,0,0}, /* Padding[8] */ 3, /* count */ 0, /* Reserved */ { /* TOC structure */ { "OffsetTOCAppData/a/b", &gOffsetTOCAppDataItem1 }, { "OffsetTOCAppData/gOffsetTOCAppDataItem1", &gOffsetTOCAppDataItem1 }, { "OffsetTOCAppData/gOffsetTOCGarbage", &gOffsetTOCGarbage } } }; /* Unfortunately, dictionaries are in a C++ header */ U_CAPI int32_t U_EXPORT2 udict_swap(const UDataSwapper *ds, const void *inData, int32_t length, void *outData, UErrorCode *pErrorCode); /* test cases for maximum data swapping code coverage */ static const struct { const char *name, *type; UDataSwapFn *swapFn; } swapCases[]={ /* resource bundles */ /* resource bundle with many data types */ {"*testtypes", "res", ures_swap}, /* resource bundle with collation data */ {"ja", "res", ures_swap}, /* resource bundle with options-only collation data */ {"ru", "res", ures_swap}, {"el", "res", ures_swap}, /* ICU's root */ {"root", "res", ures_swap}, /* Test a 32-bit key table. This is large. */ {"*testtable32", "res", ures_swap}, /* ICU 4.2 resource bundle - data format 1.2 (little-endian ASCII) */ {"*old_l_testtypes", "res", ures_swap}, /* same for big-endian EBCDIC */ {"*old_e_testtypes", "res", ures_swap}, #if !UCONFIG_NO_COLLATION /* standalone collation data files */ {"ucadata", "icu", ucol_swap}, #if 0 /* Starting with ICU 53, the "inverse UCA" data is integrated into ucadata.icu. */ {"invuca", "icu", ucol_swapInverseUCA}, #endif #endif #if !UCONFIG_NO_LEGACY_CONVERSION /* conversion table files */ /* SBCS conversion table file without extension */ {"ibm-913_P100-2000", "cnv", ucnv_swap}, /* EBCDIC_STATEFUL conversion table file with extension */ {"ibm-1390_P110-2003", "cnv", ucnv_swap}, /* DBCS extension-only conversion table file */ {"ibm-16684_P110-2003", "cnv", ucnv_swap}, /* EUC-TW (3-byte) conversion table file without extension */ {"ibm-964_P110-1999", "cnv", ucnv_swap}, /* GB 18030 (4-byte) conversion table file without extension */ {"gb18030", "cnv", ucnv_swap}, /* MBCS conversion table file with extension */ {"*test4x", "cnv", ucnv_swap}, /* * MBCS conversion table file without extension, * to test swapping and preflighting of UTF-8-friendly mbcsIndex[]. */ {"jisx-212", "cnv", ucnv_swap}, #endif #if !UCONFIG_NO_CONVERSION /* alias table */ {"cnvalias", "icu", ucnv_swapAliases}, #endif #if !UCONFIG_NO_IDNA {"rfc3491", "spp", usprep_swap}, #endif #if !UCONFIG_NO_BREAK_ITERATION {"char", "brk", ubrk_swap}, {"thaidict", "dict",udict_swap}, #endif #if 0 /* * Starting with ICU 4.8, the Unicode property (value) aliases data * is hardcoded in the ICU4C common library. * The swapper was moved to the toolutil library for swapping for ICU4J. */ /* Unicode properties */ {"pnames", "icu", upname_swap}, #endif #if 0 /* * Starting with ICU4C 3.4, the core Unicode properties files * (uprops.icu, ucase.icu, ubidi.icu, unorm.icu) * are hardcoded in the common DLL and therefore not included * in the data package any more. * Their swapping code is moved from the common DLL to the icuswap tool so that * we need not jump through hoops (like adding snapshots of these files * to testdata) for code coverage in tests. * See Jitterbug 4497. * * ICU4C 4.4 adds normalization data files again, e.g., nfkc.nrm. */ {"uprops", "icu", uprops_swap}, {"ucase", "icu", ucase_swap}, {"ubidi", "icu", ubidi_swap}, #endif #if !UCONFIG_NO_NORMALIZATION && !UCONFIG_ONLY_COLLATION {"nfkc", "nrm", unorm2_swap}, #if !UCONFIG_NO_REGULAR_EXPRESSIONS {"confusables", "cfu", uspoof_swap}, /* spoof data missing without regex */ #endif #endif {"unames", "icu", uchar_swapNames} /* the last item should not be #if'ed so that it can reliably omit the last comma */ }; /* Large enough for the largest swappable data item. */ #define SWAP_BUFFER_SIZE 1800000 static void U_CALLCONV printError(void *context, const char *fmt, va_list args) { (void)context; // suppress compiler warnings about unused variable vlog_info("[swap] ", fmt, args); log_err("\n"); /* Register error */ } static void TestSwapCase(UDataMemory *pData, const char *name, UDataSwapFn *swapFn, uint8_t *buffer, uint8_t *buffer2) { UDataSwapper *ds; const void *inData, *inHeader; int32_t length, dataLength, length2, headerLength; UErrorCode errorCode; UErrorCode badStatus; UBool inEndian, oppositeEndian; uint8_t inCharset, oppositeCharset; /* First we check that swapFn handles failures as expected. */ errorCode = U_UNSUPPORTED_ERROR; length = swapFn(NULL, NULL, 0, buffer, &errorCode); if (length != 0 || errorCode != U_UNSUPPORTED_ERROR) { log_err("%s() did not fail as expected - %s\n", name, u_errorName(errorCode)); } errorCode = U_ZERO_ERROR; length = swapFn(NULL, NULL, 0, buffer, &errorCode); if (length != 0 || errorCode != U_ILLEGAL_ARGUMENT_ERROR) { log_err("%s() did not fail as expected with bad arguments - %s\n", name, u_errorName(errorCode)); } /* Continue with the rest of the tests. */ errorCode = U_ZERO_ERROR; inData=udata_getMemory(pData); /* * get the data length if possible, to verify that swapping and preflighting * handles the entire data */ dataLength=udata_getLength(pData); /* * get the header and its length * all of the swap implementation functions require the header to be included */ inHeader=udata_getRawMemory(pData); headerLength=(int32_t)((const char *)inData-(const char *)inHeader); /* first swap to opposite endianness but same charset family */ errorCode=U_ZERO_ERROR; ds=udata_openSwapperForInputData(inHeader, headerLength, !U_IS_BIG_ENDIAN, U_CHARSET_FAMILY, &errorCode); if(U_FAILURE(errorCode)) { log_err("udata_openSwapperForInputData(%s->!isBig+same charset) failed - %s\n", name, u_errorName(errorCode)); return; } inEndian=ds->inIsBigEndian; inCharset=ds->inCharset; oppositeEndian=!inEndian; oppositeCharset= inCharset==U_ASCII_FAMILY ? U_EBCDIC_FAMILY : U_ASCII_FAMILY; /* make this test work with data files that are built for a different platform */ if(inEndian!=U_IS_BIG_ENDIAN || inCharset!=U_CHARSET_FAMILY) { udata_closeSwapper(ds); ds=udata_openSwapper(inEndian, inCharset, oppositeEndian, inCharset, &errorCode); if(U_FAILURE(errorCode)) { log_err("udata_openSwapper(%s->!isBig+same charset) failed - %s\n", name, u_errorName(errorCode)); return; } } /* Check error checking of swappable data not specific to this swapper. This should always fail. */ badStatus = U_ZERO_ERROR; length=swapFn(ds, &gOffsetTOCAppData_dat, -1, NULL, &badStatus); if(badStatus != U_UNSUPPORTED_ERROR) { log_err("swapFn(%s->!isBig+same charset) unexpectedly succeeded on bad data - %s\n", name, u_errorName(errorCode)); udata_closeSwapper(ds); return; } /* Now allow errors to be printed */ ds->printError=printError; /* preflight the length */ length=swapFn(ds, inHeader, -1, NULL, &errorCode); if(U_FAILURE(errorCode)) { log_err("swapFn(preflight %s->!isBig+same charset) failed - %s\n", name, u_errorName(errorCode)); udata_closeSwapper(ds); return; } /* compare the preflighted length against the data length */ if(dataLength>=0 && (length+15)<(headerLength+dataLength)) { log_err("swapFn(preflight %s->!isBig+same charset) length too small: %d < data length %d\n", name, length, (headerLength+dataLength)); udata_closeSwapper(ds); return; } /* swap, not in-place */ length2=swapFn(ds, inHeader, length, buffer, &errorCode); udata_closeSwapper(ds); if(U_FAILURE(errorCode)) { log_err("swapFn(%s->!isBig+same charset) failed - %s\n", name, u_errorName(errorCode)); return; } /* compare the swap length against the preflighted length */ if(length2!=length) { log_err("swapFn(%s->!isBig+same charset) length differs from preflighting: %d != preflighted %d\n", name, length2, length); return; } /* next swap to opposite charset family */ ds=udata_openSwapper(oppositeEndian, inCharset, oppositeEndian, oppositeCharset, &errorCode); if(U_FAILURE(errorCode)) { log_err("udata_openSwapper(%s->!isBig+other charset) failed - %s\n", name, u_errorName(errorCode)); return; } ds->printError=printError; /* swap in-place */ length2=swapFn(ds, buffer, length, buffer, &errorCode); udata_closeSwapper(ds); if(U_FAILURE(errorCode)) { log_err("swapFn(%s->!isBig+other charset) failed - %s\n", name, u_errorName(errorCode)); return; } /* compare the swap length against the original length */ if(length2!=length) { log_err("swapFn(%s->!isBig+other charset) length differs from original: %d != original %d\n", name, length2, length); return; } /* finally swap to original platform values */ ds=udata_openSwapper(oppositeEndian, oppositeCharset, inEndian, inCharset, &errorCode); if(U_FAILURE(errorCode)) { log_err("udata_openSwapper(%s->back to original) failed - %s\n", name, u_errorName(errorCode)); return; } ds->printError=printError; /* swap, not in-place */ length2=swapFn(ds, buffer, length, buffer2, &errorCode); udata_closeSwapper(ds); if(U_FAILURE(errorCode)) { log_err("swapFn(%s->back to original) failed - %s\n", name, u_errorName(errorCode)); return; } /* compare the swap length against the original length */ if(length2!=length) { log_err("swapFn(%s->back to original) length differs from original: %d != original %d\n", name, length2, length); return; } /* compare the final contents with the original */ if(0!=uprv_memcmp(inHeader, buffer2, length)) { const uint8_t *original; uint8_t diff[8]; int32_t i, j; log_err("swapFn(%s->back to original) contents differs from original\n", name); /* find the first difference */ original=(const uint8_t *)inHeader; for(i=0; ilength) { length2=length; } /* print the original bytes */ uprv_memset(diff, 0, sizeof(diff)); for(j=i; jprintError=printErrorToString; ds->printErrorContext=name; udata_printError(ds, "This %s a %s", "is", "test"); udata_closeSwapper(ds); if (strcmp(name, "This is a test") != 0) { log_err("udata_printError can't properly print error messages. Got = %s\n", name); } errorCode = U_USELESS_COLLATOR_ERROR; ds=udata_openSwapperForInputData(NULL, 0, !U_IS_BIG_ENDIAN, U_ASCII_FAMILY, &errorCode); if (ds != NULL || errorCode != U_USELESS_COLLATOR_ERROR) { log_err("udata_openSwapperForInputData should have returned NULL with bad argument\n", name); } errorCode=U_ZERO_ERROR; ds=udata_openSwapperForInputData(NULL, 0, !U_IS_BIG_ENDIAN, U_ASCII_FAMILY, &errorCode); if (ds != NULL || errorCode != U_ILLEGAL_ARGUMENT_ERROR) { log_err("udata_openSwapperForInputData should have returned NULL with bad argument\n", name); } errorCode=U_ZERO_ERROR; memset(buffer, 0, sizeof(2*SWAP_BUFFER_SIZE)); ds=udata_openSwapperForInputData(buffer, 2*SWAP_BUFFER_SIZE, !U_IS_BIG_ENDIAN, U_ASCII_FAMILY, &errorCode); if (ds != NULL || errorCode != U_UNSUPPORTED_ERROR) { log_err("udata_openSwapperForInputData should have returned NULL with bad argument\n", name); } errorCode=U_ZERO_ERROR; /* Test argument checking. ucol_swap is normally tested via ures_swap, and isn't normally called directly. */ #if !UCONFIG_NO_COLLATION ucol_swap(NULL, NULL, -1, NULL, &errorCode); if (errorCode != U_ILLEGAL_ARGUMENT_ERROR) { log_err("ucol_swap did not fail as expected\n", name); } errorCode=U_ZERO_ERROR; #endif for(i=0; i