| /******************************************************************** |
| * COPYRIGHT: |
| * Copyright (c) 1997-2001, International Business Machines Corporation and |
| * others. All Rights Reserved. |
| ********************************************************************/ |
| /******************************************************************************** |
| * |
| * File CU_CAPITST.C |
| * |
| * Modification History: |
| * Name Description |
| * Madhu Katragadda Ported for C API |
| ********************************************************************************* |
| */ |
| #include <stdio.h> |
| #include "ccapitst.h" |
| #include "unicode/uloc.h" |
| #include "unicode/ucnv.h" |
| #include "unicode/ucnv_err.h" |
| #include "cintltst.h" |
| #include "unicode/utypes.h" |
| #include "unicode/ustring.h" |
| #include "cstring.h" |
| #include "cmemory.h" |
| |
| #define NUM_CODEPAGE 1 |
| #define MAX_FILE_LEN 1024*20 |
| #define UCS_FILE_NAME_SIZE 512 |
| |
| /*returns an action other than the one provided*/ |
| static UConverterFromUCallback otherUnicodeAction(UConverterFromUCallback MIA); |
| static UConverterToUCallback otherCharAction(UConverterToUCallback MIA); |
| |
| static void TestCCSID(void); |
| static void TestJ932(void); |
| |
| void addTestConvert(TestNode** root); |
| |
| void addTestConvert(TestNode** root) |
| { |
| addTest(root, &TestConvert, "tsconv/ccapitst/TestConvert"); |
| addTest(root, &TestAlias, "tsconv/ccapitst/TestAlias"); |
| addTest(root, &TestConvertSafeClone, "tsconv/ccapitst/TestConvertSafeClone"); |
| addTest(root, &TestCCSID, "tsconv/ccapitst/TestCCSID"); |
| addTest(root, &TestJ932, "tsconv/ccapitst/TestJ932"); |
| } |
| |
| static void TestConvert() |
| { |
| char myptr[4]; |
| char save[4]; |
| int32_t testLong1 = 0; |
| uint16_t rest = 0; |
| int32_t len = 0; |
| int32_t x = 0; |
| FILE* ucs_file_in = NULL; |
| UChar BOM = 0x0000; |
| UChar myUChar = 0x0000; |
| char* mytarget; /* [MAX_FILE_LEN] */ |
| char* mytarget_1; |
| char* mytarget_use; |
| UChar* consumedUni = NULL; |
| char* consumed = NULL; |
| char* output_cp_buffer; /* [MAX_FILE_LEN] */ |
| UChar* ucs_file_buffer; /* [MAX_FILE_LEN] */ |
| UChar* ucs_file_buffer_use; |
| UChar* my_ucs_file_buffer; /* [MAX_FILE_LEN] */ |
| UChar* my_ucs_file_buffer_1; |
| int8_t ii = 0; |
| int32_t j = 0; |
| uint16_t codepage_index = 0; |
| uint16_t count; |
| int32_t cp = 0; |
| UErrorCode err = U_ZERO_ERROR; |
| const char* available_conv; |
| char ucs_file_name[UCS_FILE_NAME_SIZE]; |
| UConverterFromUCallback MIA1, MIA1_2; |
| UConverterToUCallback MIA2, MIA2_2; |
| const void *MIA1Context, *MIA1Context2, *MIA2Context, *MIA2Context2; |
| UConverter* someConverters[5]; |
| UConverter* myConverter = 0; |
| UChar* displayname = 0; |
| |
| const char* locale; |
| |
| UChar* uchar1 = 0; |
| UChar* uchar2 = 0; |
| UChar* uchar3 = 0; |
| int32_t targetcapacity2; |
| int32_t targetcapacity; |
| int32_t targetsize; |
| int32_t disnamelen; |
| |
| const UChar* tmp_ucs_buf; |
| const UChar* tmp_consumedUni=NULL; |
| const char* tmp_mytarget_use; |
| const char* tmp_consumed; |
| |
| int flushCount = 0; |
| |
| /****************************************************************** |
| Checking Unicode -> ksc |
| ******************************************************************/ |
| |
| const char* CodePagesToTest[NUM_CODEPAGE] = |
| { |
| "ibm-949_P110-2000" |
| |
| |
| }; |
| const uint16_t CodePageNumberToTest[NUM_CODEPAGE] = |
| { |
| 949 |
| }; |
| |
| |
| const int8_t CodePagesMinChars[NUM_CODEPAGE] = |
| { |
| 1 |
| |
| }; |
| |
| const int8_t CodePagesMaxChars[NUM_CODEPAGE] = |
| { |
| 2 |
| |
| }; |
| |
| const uint16_t CodePagesSubstitutionChars[NUM_CODEPAGE] = |
| { |
| 0xAFFE |
| }; |
| |
| const char* CodePagesTestFiles[NUM_CODEPAGE] = |
| { |
| "uni-text.bin" |
| }; |
| |
| |
| const UConverterPlatform CodePagesPlatform[NUM_CODEPAGE] = |
| { |
| UCNV_IBM |
| |
| }; |
| |
| const char* CodePagesLocale[NUM_CODEPAGE] = |
| { |
| "ko_KR" |
| }; |
| |
| UConverterFromUCallback oldFromUAction = NULL; |
| UConverterToUCallback oldToUAction = NULL; |
| const void* oldFromUContext = NULL; |
| const void* oldToUContext = NULL; |
| |
| /* Allocate memory */ |
| mytarget = (char*) malloc(MAX_FILE_LEN * sizeof(mytarget[0])); |
| output_cp_buffer = (char*) malloc(MAX_FILE_LEN * sizeof(output_cp_buffer[0])); |
| ucs_file_buffer = (UChar*) malloc(MAX_FILE_LEN * sizeof(ucs_file_buffer[0])); |
| my_ucs_file_buffer = (UChar*) malloc(MAX_FILE_LEN * sizeof(my_ucs_file_buffer[0])); |
| |
| ucs_file_buffer_use = ucs_file_buffer; |
| mytarget_1=mytarget; |
| mytarget_use = mytarget; |
| my_ucs_file_buffer_1=my_ucs_file_buffer; |
| |
| /* flush the converter cache to get a consistent state before the flushing is tested */ |
| flushCount = ucnv_flushCache(); |
| |
| /*Calling all the UnicodeConverterCPP API and checking functionality*/ |
| |
| /*Tests ucnv_getAvailableName(), getAvialableCount()*/ |
| |
| log_verbose("Testing ucnv_countAvailable()..."); |
| |
| testLong1=ucnv_countAvailable(); |
| log_verbose("Number of available Codepages: %d\n", testLong1); |
| |
| log_verbose("\n---Testing ucnv_getAvailableName.."); /*need to check this out */ |
| |
| available_conv = ucnv_getAvailableName(testLong1); |
| /*test ucnv_getAvailableName with err condition*/ |
| log_verbose("\n---Testing ucnv_getAvailableName..with index < 0 "); |
| available_conv = ucnv_getAvailableName(-1); |
| if(available_conv != NULL){ |
| log_err("ucnv_getAvailableName() with index < 0) should return NULL\n"); |
| } |
| |
| /* Test ucnv_countAliases() etc. */ |
| count = ucnv_countAliases("utf-8", &err); |
| if(U_FAILURE(err)) { |
| log_err("FAILURE! ucnv_countAliases(\"utf-8\") -> %s\n", myErrorName(err)); |
| } else if(count <= 0) { |
| log_err("FAILURE! ucnv_countAliases(\"utf-8\") -> %d aliases\n", count); |
| } else { |
| /* try to get the aliases individually */ |
| const char *alias; |
| alias = ucnv_getAlias("utf-8", 0, &err); |
| if(U_FAILURE(err)) { |
| log_err("FAILURE! ucnv_getAlias(\"utf-8\", 0) -> %s\n", myErrorName(err)); |
| } else if(uprv_strcmp("UTF-8", alias) != 0) { |
| log_err("FAILURE! ucnv_getAlias(\"utf-8\", 0) -> %s instead of UTF-8\n", alias); |
| } else { |
| uint16_t aliasNum; |
| for(aliasNum = 0; aliasNum < count; ++aliasNum) { |
| alias = ucnv_getAlias("utf-8", aliasNum, &err); |
| if(U_FAILURE(err)) { |
| log_err("FAILURE! ucnv_getAlias(\"utf-8\", %d) -> %s\n", aliasNum, myErrorName(err)); |
| } else if(uprv_strlen(alias) > 20) { |
| /* sanity check */ |
| log_err("FAILURE! ucnv_getAlias(\"utf-8\", %d) -> alias %s insanely long, corrupt?!\n", aliasNum, alias); |
| } else { |
| log_verbose("alias %d for utf-8: %s\n", aliasNum, alias); |
| } |
| } |
| if(U_SUCCESS(err)) { |
| /* try to fill an array with all aliases */ |
| const char **aliases; |
| aliases=(const char **)uprv_malloc(count * sizeof(const char *)); |
| if(aliases != 0) { |
| ucnv_getAliases("utf-8", aliases, &err); |
| if(U_FAILURE(err)) { |
| log_err("FAILURE! ucnv_getAliases(\"utf-8\") -> %s\n", myErrorName(err)); |
| } else { |
| for(aliasNum = 0; aliasNum < count; ++aliasNum) { |
| /* compare the pointers with the ones returned individually */ |
| alias = ucnv_getAlias("utf-8", aliasNum, &err); |
| if(U_FAILURE(err)) { |
| log_err("FAILURE! ucnv_getAlias(\"utf-8\", %d) -> %s\n", aliasNum, myErrorName(err)); |
| } else if(aliases[aliasNum] != alias) { |
| log_err("FAILURE! ucnv_getAliases(\"utf-8\")[%d] != ucnv_getAlias(\"utf-8\", %d)\n", aliasNum, aliasNum); |
| } |
| } |
| } |
| uprv_free((char **)aliases); |
| } |
| } |
| } |
| } |
| /*Testing ucnv_openU()*/ |
| { |
| UChar converterName[]={ 0x0069, 0x0062, 0x006d, 0x002d, 0x0039, 0x0034, 0x0033, 0x0000}; /*ibm-943*/ |
| const char *illegalNameChars={ "ibm-943 ibm-943 ibm-943 ibm-943 ibm-943 ibm-943 ibm-943 ibm-943 ibm-943 ibm-943"}; |
| UChar illegalName[100]; |
| UConverter *converter=NULL; |
| err=U_ZERO_ERROR; |
| converter=ucnv_openU(converterName, &err); |
| if(U_FAILURE(err)){ |
| log_err("FAILURE! ucnv_openU(ibm-943, err) failed. %s\n", myErrorName(err)); |
| } |
| ucnv_close(converter); |
| err=U_ZERO_ERROR; |
| converter=ucnv_openU(NULL, &err); |
| if(U_FAILURE(err)){ |
| log_err("FAILURE! ucnv_openU(NULL, err) failed. %s\n", myErrorName(err)); |
| } |
| ucnv_close(converter); |
| /*testing with error value*/ |
| err=U_ILLEGAL_ARGUMENT_ERROR; |
| converter=ucnv_openU(converterName, &err); |
| if(!(converter == NULL)){ |
| log_err("FAILURE! ucnv_openU(ibm-943, U_ILLEGAL_ARGUMENT_ERROR) is expected to fail\n"); |
| } |
| ucnv_close(converter); |
| err=U_ZERO_ERROR; |
| u_uastrcpy(illegalName, ""); |
| u_uastrcpy(illegalName, illegalNameChars); |
| ucnv_openU(illegalName, &err); |
| if(!(err==U_ILLEGAL_ARGUMENT_ERROR)){ |
| log_err("FAILURE! ucnv_openU(illegalName, err) is expected to fail\n"); |
| } |
| err=U_ZERO_ERROR; |
| |
| } |
| log_verbose("Testing ucnv_open() with converter name greater than 7 characters\n"); |
| { |
| UConverter *cnv=NULL; |
| err=U_ZERO_ERROR; |
| cnv=ucnv_open("ibm-949,Madhu", &err); |
| if(U_FAILURE(err)){ |
| log_err("FAILURE! ucnv_open(\"ibm-949,Madhu\", err) failed. %s\n", myErrorName(err)); |
| } |
| ucnv_close(cnv); |
| |
| } |
| /*Testing ucnv_convert()*/ |
| { |
| int32_t targetLimit=0, sourceLimit=0, i=0, targetCapacity=0; |
| const uint8_t source[]={ 0x00, 0x04, 0x05, 0x06, 0xa2, 0xb4, 0x00}; |
| const uint8_t expectedTarget[]={ 0x00, 0x37, 0x2d, 0x2e, 0x0e, 0x49, 0x62, 0x0f, 0x00}; |
| char *target=0; |
| sourceLimit=sizeof(source)/sizeof(source[0]); |
| err=U_ZERO_ERROR; |
| targetLimit=0; |
| |
| targetCapacity=ucnv_convert("ibm-1364", "ibm-1363", NULL, targetLimit , (const char*)source, sourceLimit, &err); |
| if(err == U_BUFFER_OVERFLOW_ERROR){ |
| err=U_ZERO_ERROR; |
| targetLimit=targetCapacity+1; |
| target=(char*)malloc(sizeof(char) * targetLimit); |
| targetCapacity=ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, sourceLimit, &err); |
| } |
| if(U_FAILURE(err)){ |
| log_err("FAILURE! ucnv_convert(ibm-1363->ibm-1364) failed. %s\n", myErrorName(err)); |
| } |
| else { |
| for(i=0; i<targetCapacity; i++){ |
| if(target[i] != expectedTarget[i]){ |
| log_err("FAIL: ucnv_convert(ibm-1363->ibm-1364) failed.at index \n i=%d, Expected: %lx Got: %lx\n", i, (UChar)expectedTarget[i], (uint8_t)target[i]); |
| } |
| } |
| /*Test error conditions*/ |
| i=ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, 0, &err); |
| if(i !=0){ |
| log_err("FAILURE! ucnv_convert() with sourceLimit=0 is expected to return 0\n"); |
| } |
| ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, -1, &err); |
| if(!(U_FAILURE(err) && err==U_ILLEGAL_ARGUMENT_ERROR)){ |
| log_err("FAILURE! ucnv_convert() with sourceLimit=-1 is expected to fail\n"); |
| } |
| sourceLimit=sizeof(source)/sizeof(source[0]); |
| i=ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, sourceLimit, &err); |
| if(i !=0 ){ |
| log_err("FAILURE! ucnv_convert() with err=U_ILLEGAL_ARGUMENT_ERROR is expected to return 0\n"); |
| } |
| err=U_ZERO_ERROR; |
| sourceLimit=sizeof(source)/sizeof(source[0]); |
| targetLimit=0; |
| i=ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, sourceLimit, &err); |
| if(!(U_FAILURE(err) && err==U_BUFFER_OVERFLOW_ERROR)){ |
| log_err("FAILURE! ucnv_convert() with targetLimit=0 is expected to throw U_BUFFER_OVERFLOW_ERROR\n"); |
| } |
| err=U_ZERO_ERROR; |
| free(target); |
| ucnv_flushCache(); |
| } |
| } |
| |
| /*Testing ucnv_open()*/ |
| /* Note: These converters have been chosen because they do NOT |
| encode the Latin characters (U+0041, ...), and therefore are |
| highly unlikely to be chosen as system default codepages */ |
| |
| someConverters[0] = ucnv_open("ibm-1047", &err); |
| if (U_FAILURE(err)) { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| |
| someConverters[1] = ucnv_open("ibm-1047", &err); |
| if (U_FAILURE(err)) { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| |
| someConverters[2] = ucnv_open("ibm-1047", &err); |
| if (U_FAILURE(err)) { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| |
| someConverters[3] = ucnv_open("ibm-834", &err); |
| if (U_FAILURE(err)) { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| |
| someConverters[4] = ucnv_open("ibm-949", &err); |
| if (U_FAILURE(err)) { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| |
| |
| /* Testing ucnv_flushCache() */ |
| log_verbose("\n---Testing ucnv_flushCache...\n"); |
| if ((flushCount=ucnv_flushCache())==0) |
| log_verbose("Flush cache ok\n"); |
| else |
| log_err("Flush Cache failed [line %d], expect 0 got %d \n", __LINE__, flushCount); |
| |
| /*testing ucnv_close() and ucnv_flushCache() */ |
| ucnv_close(someConverters[0]); |
| ucnv_close(someConverters[1]); |
| ucnv_close(someConverters[2]); |
| ucnv_close(someConverters[3]); |
| |
| if ((flushCount=ucnv_flushCache())==2) |
| log_verbose("Flush cache ok\n"); /*because first, second and third are same */ |
| else |
| log_err("Flush Cache failed line %d, got %d expected 2 or there is an error in ucnv_close()\n", |
| __LINE__, |
| flushCount); |
| |
| ucnv_close(someConverters[4]); |
| if ( (flushCount=ucnv_flushCache())==1) |
| log_verbose("Flush cache ok\n"); |
| else |
| log_err("Flush Cache failed line %d, expected 1 got %d \n", __LINE__, flushCount); |
| |
| /*Testing ucnv_openCCSID and ucnv_open with error conditions*/ |
| log_verbose("\n---Testing ucnv_open with err ! = U_ZERO_ERROR...\n"); |
| err=U_ILLEGAL_ARGUMENT_ERROR; |
| if(ucnv_open(NULL, &err) != NULL){ |
| log_err("ucnv_open with err != U_ZERO_ERROR is supposed to fail\n"); |
| } |
| if(ucnv_openCCSID(1051, UCNV_IBM, &err) != NULL){ |
| log_err("ucnv_open with err != U_ZERO_ERROR is supposed to fail\n"); |
| } |
| err=U_ZERO_ERROR; |
| |
| /* Testing ucnv_openCCSID(), ucnv_open(), ucnv_getName() */ |
| log_verbose("\n---Testing ucnv_open default...\n"); |
| someConverters[0] = ucnv_open(NULL,&err); |
| someConverters[1] = ucnv_open(NULL,&err); |
| someConverters[2] = ucnv_open("utf8", &err); |
| someConverters[3] = ucnv_openCCSID(949,UCNV_IBM,&err); |
| ucnv_close(ucnv_openCCSID(1051, UCNV_IBM, &err)); /* test for j350; ucnv_close(NULL) is safe */ |
| if (U_FAILURE(err)){ log_err("FAILURE! %s\n", myErrorName(err));} |
| |
| /* Testing ucnv_getName()*/ |
| /*default code page */ |
| ucnv_getName(someConverters[0], &err); |
| if(U_FAILURE(err)) { |
| log_err("getName[0] failed\n"); |
| } else { |
| log_verbose("getName(someConverters[0]) returned %s\n", ucnv_getName(someConverters[0], &err)); |
| } |
| ucnv_getName(someConverters[1], &err); |
| if(U_FAILURE(err)) { |
| log_err("getName[1] failed\n"); |
| } else { |
| log_verbose("getName(someConverters[1]) returned %s\n", ucnv_getName(someConverters[1], &err)); |
| } |
| |
| /*Testing ucnv_getDefaultName() and ucnv_setDefaultNAme()*/ |
| { |
| const char* defaultName=ucnv_getDefaultName(); |
| log_verbose("getDefaultName returned %s\n", defaultName); |
| |
| /*change the default name by setting it */ |
| ucnv_setDefaultName("changed"); |
| if(strcmp(ucnv_getDefaultName(), "changed")==0) |
| log_verbose("setDefaultName o.k"); |
| else |
| log_err("setDefaultName failed"); |
| /*set the default name back*/ |
| ucnv_setDefaultName(defaultName); |
| } |
| |
| ucnv_close(someConverters[0]); |
| ucnv_close(someConverters[1]); |
| ucnv_close(someConverters[2]); |
| ucnv_close(someConverters[3]); |
| |
| |
| for (codepage_index=0; codepage_index < NUM_CODEPAGE; ++codepage_index) |
| { |
| int32_t i = 0; |
| |
| strcpy(ucs_file_name, ctest_getTestDirectory()); |
| strcat(ucs_file_name, CodePagesTestFiles[codepage_index]); |
| |
| ucs_file_in = fopen(ucs_file_name,"rb"); |
| if (!ucs_file_in) |
| { |
| log_err("Couldn't open the Unicode file [%s]... Exiting...\n", ucs_file_name); |
| return; |
| } |
| |
| /*Creates a converter and testing ucnv_openCCSID(u_int code_page, platform, errstatus*/ |
| |
| /* myConverter =ucnv_openCCSID(CodePageNumberToTest[codepage_index],UCNV_IBM, &err); */ |
| /* ucnv_flushCache(); */ |
| myConverter =ucnv_open( "ibm-949", &err); |
| if (!myConverter || U_FAILURE(err)) |
| { |
| log_err("Error creating the convertor \n"); |
| |
| return; |
| } |
| |
| /*testing for ucnv_getName() */ |
| log_verbose("Testing ucnv_getName()...\n"); |
| ucnv_getName(myConverter, &err); |
| if(U_FAILURE(err)) |
| log_err("Error in getName\n"); |
| else |
| { |
| log_verbose("getName o.k. %s\n", ucnv_getName(myConverter, &err)); |
| } |
| if (uprv_stricmp(ucnv_getName(myConverter, &err), CodePagesToTest[codepage_index])) |
| log_err("getName failed\n"); |
| else |
| log_verbose("getName ok\n"); |
| /*Test getName with error condition*/ |
| { |
| const char* name=0; |
| err=U_ILLEGAL_ARGUMENT_ERROR; |
| log_verbose("Testing ucnv_getName with err != U_ZERO_ERROR"); |
| name=ucnv_getName(myConverter, &err); |
| if(name != NULL){ |
| log_err("ucnv_getName() with err != U_ZERO_ERROR is expected to fail"); |
| } |
| err=U_ZERO_ERROR; |
| } |
| |
| |
| /*Tests ucnv_getMaxCharSize() and ucnv_getMinCharSize()*/ |
| |
| log_verbose("Testing ucnv_getMaxCharSize()...\n"); |
| if (ucnv_getMaxCharSize(myConverter)==CodePagesMaxChars[codepage_index]) |
| log_verbose("Max byte per character OK\n"); |
| else |
| log_err("Max byte per character failed\n"); |
| |
| log_verbose("\n---Testing ucnv_getMinCharSize()...\n"); |
| if (ucnv_getMinCharSize(myConverter)==CodePagesMinChars[codepage_index]) |
| log_verbose("Min byte per character OK\n"); |
| else |
| log_err("Min byte per character failed\n"); |
| |
| |
| /*Testing for ucnv_getSubstChars() and ucnv_setSubstChars()*/ |
| log_verbose("\n---Testing ucnv_getSubstChars...\n"); |
| ii=4; |
| ucnv_getSubstChars(myConverter, myptr, &ii, &err); |
| |
| for(x=0;x<ii;x++) |
| rest = (uint16_t)(((unsigned char)rest << 8) + (unsigned char)myptr[x]); |
| if (rest==CodePagesSubstitutionChars[codepage_index]) |
| log_verbose("Substitution character ok\n"); |
| else |
| log_err("Substitution character failed.\n"); |
| |
| log_verbose("\n---Testing ucnv_setSubstChars RoundTrip Test ...\n"); |
| ucnv_setSubstChars(myConverter, myptr, ii, &err); |
| if (U_FAILURE(err)) |
| { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| ucnv_getSubstChars(myConverter,save, &ii, &err); |
| if (U_FAILURE(err)) |
| { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| |
| if (strncmp(save, myptr, ii)) |
| log_err("Saved substitution character failed\n"); |
| else |
| log_verbose("Saved substitution character ok\n"); |
| |
| /*Testing for ucnv_getSubstChars() and ucnv_setSubstChars() with error conditions*/ |
| log_verbose("\n---Testing ucnv_getSubstChars.. with len < minBytesPerChar\n"); |
| ii=1; |
| ucnv_getSubstChars(myConverter, myptr, &ii, &err); |
| if(err != U_INDEX_OUTOFBOUNDS_ERROR){ |
| log_err("ucnv_getSubstChars() with len < minBytesPerChar should throw U_INDEX_OUTOFBOUNDS_ERROR Got %s\n", myErrorName(err)); |
| } |
| err=U_ZERO_ERROR; |
| ii=4; |
| ucnv_getSubstChars(myConverter, myptr, &ii, &err); |
| log_verbose("\n---Testing ucnv_setSubstChars.. with len < minBytesPerChar\n"); |
| ucnv_setSubstChars(myConverter, myptr, 0, &err); |
| if(err != U_ILLEGAL_ARGUMENT_ERROR){ |
| log_err("ucnv_setSubstChars() with len < minBytesPerChar should throw U_ILLEGAL_ARGUMENT_ERROR Got %s\n", myErrorName(err)); |
| } |
| log_verbose("\n---Testing ucnv_setSubstChars.. with err != U_ZERO_ERROR \n"); |
| strcpy(myptr, "abc"); |
| ucnv_setSubstChars(myConverter, myptr, ii, &err); |
| err=U_ZERO_ERROR; |
| ucnv_getSubstChars(myConverter, save, &ii, &err); |
| if(strncmp(save, myptr, ii) == 0){ |
| log_err("uncv_setSubstChars() with err != U_ZERO_ERROR shouldn't set the SubstChars and just return\n"); |
| } |
| log_verbose("\n---Testing ucnv_getSubstChars.. with err != U_ZERO_ERROR \n"); |
| err=U_ZERO_ERROR; |
| strcpy(myptr, "abc"); |
| ucnv_setSubstChars(myConverter, myptr, ii, &err); |
| err=U_ILLEGAL_ARGUMENT_ERROR; |
| ucnv_getSubstChars(myConverter, save, &ii, &err); |
| if(strncmp(save, myptr, ii) == 0){ |
| log_err("uncv_setSubstChars() with err != U_ZERO_ERROR shouldn't fill the SubstChars in the buffer, it just returns\n"); |
| } |
| err=U_ZERO_ERROR; |
| /*------*/ |
| |
| /*resetState ucnv_reset()*/ |
| log_verbose("\n---Testing ucnv_reset()..\n"); |
| ucnv_reset(myConverter); |
| { |
| UChar32 c; |
| const uint8_t in[]={ 0x1b, 0x25, 0x42, 0x31, 0x32, 0x61, 0xc0, 0x80, 0xe0, 0x80, 0x80, 0xf0, 0x80, 0x80, 0x80}; |
| const char *source=(const char *)in, *limit=(const char *)in+sizeof(in); |
| UConverter *cnv=ucnv_open("ISO_2022", &err); |
| if(U_FAILURE(err)) { |
| log_err("Unable to open a iso-2022 converter: %s\n", u_errorName(err)); |
| } |
| c=ucnv_getNextUChar(cnv, &source, limit, &err); |
| if((U_FAILURE(err) || c != (UChar32)0x0031)) { |
| log_err("ucnv_getNextUChar() failed: %s\n", u_errorName(err)); |
| } |
| ucnv_reset(cnv); |
| ucnv_close(cnv); |
| |
| } |
| |
| /*getDisplayName*/ |
| log_verbose("\n---Testing ucnv_getDisplayName()...\n"); |
| locale=CodePagesLocale[codepage_index]; |
| displayname=(UChar*)malloc(1 * sizeof(UChar)); |
| len=0; |
| disnamelen = ucnv_getDisplayName(myConverter,locale,displayname, len, &err); |
| if(err==U_BUFFER_OVERFLOW_ERROR) |
| { |
| err=U_ZERO_ERROR; |
| displayname=(UChar*)realloc(displayname, (disnamelen+1) * sizeof(UChar)); |
| ucnv_getDisplayName(myConverter,locale,displayname,disnamelen+1, &err); |
| if(U_FAILURE(err)) |
| { |
| log_err("getDisplayName failed the error is %s\n", myErrorName(err)); |
| } |
| else |
| log_verbose(" getDisplayName o.k.\n"); |
| } |
| /*test ucnv_getDiaplayName with error condition*/ |
| log_verbose("\n---Testing ucnv_getDisplayName()...\n"); |
| err= U_ILLEGAL_ARGUMENT_ERROR; |
| len=ucnv_getDisplayName(myConverter,locale,displayname,disnamelen+1, &err); |
| if( len !=0 ){ |
| log_err("ucnv_getDisplayName() with err != U_ZERO_ERROR is supposed to return 0\n"); |
| } |
| err=U_ZERO_ERROR; |
| |
| /* testing ucnv_setFromUCallBack() and ucnv_getFromUCallBack()*/ |
| ucnv_getFromUCallBack(myConverter, &MIA1, &MIA1Context); |
| |
| log_verbose("\n---Testing ucnv_setFromUCallBack...\n"); |
| ucnv_setFromUCallBack(myConverter, otherUnicodeAction(MIA1), &BOM, &oldFromUAction, &oldFromUContext, &err); |
| if (U_FAILURE(err) || oldFromUAction != MIA1 || oldFromUContext != MIA1Context) |
| { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| |
| ucnv_getFromUCallBack(myConverter, &MIA1_2, &MIA1Context2); |
| if (MIA1_2 != otherUnicodeAction(MIA1) || MIA1Context2 != &BOM) |
| log_err("get From UCallBack failed\n"); |
| else |
| log_verbose("get From UCallBack ok\n"); |
| |
| log_verbose("\n---Testing getFromUCallBack Roundtrip...\n"); |
| ucnv_setFromUCallBack(myConverter,MIA1, MIA1Context, &oldFromUAction, &oldFromUContext, &err); |
| if (U_FAILURE(err) || oldFromUAction != otherUnicodeAction(MIA1) || oldFromUContext != &BOM) |
| { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| |
| ucnv_getFromUCallBack(myConverter, &MIA1_2, &MIA1Context2); |
| if (MIA1_2 != MIA1 || MIA1Context2 != MIA1Context) |
| log_err("get From UCallBack action failed\n"); |
| else |
| log_verbose("get From UCallBack action ok\n"); |
| |
| /*testing ucnv_setToUCallBack with error conditions*/ |
| err=U_ILLEGAL_ARGUMENT_ERROR; |
| log_verbose("\n---Testing setFromUCallBack. with err != U_ZERO_ERROR..\n"); |
| ucnv_setFromUCallBack(myConverter, otherUnicodeAction(MIA1), &BOM, &oldFromUAction, &oldFromUContext, &err); |
| ucnv_getFromUCallBack(myConverter, &MIA1_2, &MIA1Context2); |
| if(MIA1_2 == otherUnicodeAction(MIA1) || MIA1Context2 == &BOM){ |
| log_err("To setFromUCallBack with err != U_ZERO_ERROR is supposed to fail\n"); |
| } |
| err=U_ZERO_ERROR; |
| |
| |
| /*testing ucnv_setToUCallBack() and ucnv_getToUCallBack()*/ |
| ucnv_getToUCallBack(myConverter, &MIA2, &MIA2Context); |
| |
| log_verbose("\n---Testing setTo UCallBack...\n"); |
| ucnv_setToUCallBack(myConverter,otherCharAction(MIA2), &BOM, &oldToUAction, &oldToUContext, &err); |
| if (U_FAILURE(err) || oldToUAction != MIA2 || oldToUContext != MIA2Context) |
| { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| |
| ucnv_getToUCallBack(myConverter, &MIA2_2, &MIA2Context2); |
| if (MIA2_2 != otherCharAction(MIA2) || MIA2Context2 != &BOM) |
| log_err("To UCallBack failed\n"); |
| else |
| log_verbose("To UCallBack ok\n"); |
| |
| log_verbose("\n---Testing setTo UCallBack Roundtrip...\n"); |
| ucnv_setToUCallBack(myConverter,MIA2, MIA2Context, &oldToUAction, &oldToUContext, &err); |
| if (U_FAILURE(err) || oldToUAction != otherCharAction(MIA2) || oldToUContext != &BOM) |
| { log_err("FAILURE! %s\n", myErrorName(err)); } |
| |
| ucnv_getToUCallBack(myConverter, &MIA2_2, &MIA2Context2); |
| if (MIA2_2 != MIA2 || MIA2Context2 != MIA2Context) |
| log_err("To UCallBack failed\n"); |
| else |
| log_verbose("To UCallBack ok\n"); |
| |
| /*testing ucnv_setToUCallBack with error conditions*/ |
| err=U_ILLEGAL_ARGUMENT_ERROR; |
| log_verbose("\n---Testing setToUCallBack. with err != U_ZERO_ERROR..\n"); |
| ucnv_setToUCallBack(myConverter,otherCharAction(MIA2), NULL, &oldToUAction, &oldToUContext, &err); |
| ucnv_getToUCallBack(myConverter, &MIA2_2, &MIA2Context2); |
| if (MIA2_2 == otherCharAction(MIA2) || MIA2Context2 == &BOM){ |
| log_err("To setToUCallBack with err != U_ZERO_ERROR is supposed to fail\n"); |
| } |
| err=U_ZERO_ERROR; |
| |
| |
| /*getcodepageid testing ucnv_getCCSID() */ |
| log_verbose("\n----Testing getCCSID....\n"); |
| cp = ucnv_getCCSID(myConverter,&err); |
| if (U_FAILURE(err)) |
| { |
| log_err("FAILURE!..... %s\n", myErrorName(err)); |
| } |
| if (cp != CodePageNumberToTest[codepage_index]) |
| log_err("Codepage number test failed\n"); |
| else |
| log_verbose("Codepage number test OK\n"); |
| |
| /*testing ucnv_getCCSID() with err != U_ZERO_ERROR*/ |
| err=U_ILLEGAL_ARGUMENT_ERROR; |
| if( ucnv_getCCSID(myConverter,&err) != -1){ |
| log_err("ucnv_getCCSID() with err != U_ZERO_ERROR is supposed to fail\n"); |
| } |
| err=U_ZERO_ERROR; |
| |
| /*getCodepagePlatform testing ucnv_getPlatform()*/ |
| log_verbose("\n---Testing getCodepagePlatform ..\n"); |
| if (CodePagesPlatform[codepage_index]!=ucnv_getPlatform(myConverter, &err)) |
| log_err("Platform codepage test failed\n"); |
| else |
| log_verbose("Platform codepage test ok\n"); |
| |
| if (U_FAILURE(err)) |
| { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| /*testing ucnv_getPlatform() with err != U_ZERO_ERROR*/ |
| err= U_ILLEGAL_ARGUMENT_ERROR; |
| if(ucnv_getPlatform(myConverter, &err) != UCNV_UNKNOWN){ |
| log_err("ucnv)getPlatform with err != U_ZERO_ERROR is supposed to fail\n"); |
| } |
| err=U_ZERO_ERROR; |
| |
| |
| /*Reads the BOM*/ |
| fread(&BOM, sizeof(UChar), 1, ucs_file_in); |
| if (BOM!=0xFEFF && BOM!=0xFFFE) |
| { |
| log_err("File Missing BOM...Bailing!\n"); |
| return; |
| } |
| |
| |
| /*Reads in the file*/ |
| while(!feof(ucs_file_in)&&(i+=fread(ucs_file_buffer+i, sizeof(UChar), 1, ucs_file_in))) |
| { |
| myUChar = ucs_file_buffer[i-1]; |
| |
| ucs_file_buffer[i-1] = (UChar)((BOM==0xFEFF)?myUChar:((myUChar >> 8) | (myUChar << 8))); /*adjust if BIG_ENDIAN*/ |
| } |
| |
| myUChar = ucs_file_buffer[i-1]; |
| ucs_file_buffer[i-1] = (UChar)((BOM==0xFEFF)?myUChar:((myUChar >> 8) | (myUChar << 8))); /*adjust if BIG_ENDIAN Corner Case*/ |
| |
| |
| /*testing ucnv_fromUChars() and ucnv_toUChars() */ |
| /*uchar1---fromUChar--->output_cp_buffer --toUChar--->uchar2*/ |
| |
| uchar1=(UChar*)malloc(sizeof(UChar) * (i+1)); |
| u_uastrcpy(uchar1,""); |
| u_strncpy(uchar1,ucs_file_buffer,i); |
| uchar1[i] = 0; |
| |
| uchar3=(UChar*)malloc(sizeof(UChar)*(i+1)); |
| u_uastrcpy(uchar3,""); |
| u_strncpy(uchar3,ucs_file_buffer,i); |
| uchar3[i] = 0; |
| |
| /*Calls the Conversion Routine */ |
| testLong1 = MAX_FILE_LEN; |
| log_verbose("\n---Testing ucnv_fromUChars()\n"); |
| targetcapacity = ucnv_fromUChars(myConverter, output_cp_buffer, testLong1, uchar1, -1, &err); |
| if (U_FAILURE(err)) |
| { |
| log_err("\nFAILURE...%s\n", myErrorName(err)); |
| } |
| else |
| log_verbose(" ucnv_fromUChars() o.k.\n"); |
| |
| /*test the conversion routine */ |
| log_verbose("\n---Testing ucnv_toUChars()\n"); |
| /*call it first time for trapping the targetcapacity and size needed to allocate memory for the buffer uchar2 */ |
| targetcapacity2=0; |
| targetsize = ucnv_toUChars(myConverter, |
| NULL, |
| targetcapacity2, |
| output_cp_buffer, |
| strlen(output_cp_buffer), |
| &err); |
| /*if there is an buffer overflow then trap the values and pass them and make the actual call*/ |
| |
| if(err==U_BUFFER_OVERFLOW_ERROR) |
| { |
| err=U_ZERO_ERROR; |
| uchar2=(UChar*)malloc((targetsize+1) * sizeof(UChar)); |
| targetsize = ucnv_toUChars(myConverter, |
| uchar2, |
| targetsize+1, |
| output_cp_buffer, |
| strlen(output_cp_buffer), |
| &err); |
| |
| if(U_FAILURE(err)) |
| log_err("ucnv_toUChars() FAILED %s\n", myErrorName(err)); |
| else |
| log_verbose(" ucnv_toUChars() o.k.\n"); |
| |
| if(u_strcmp(uchar1,uchar2)!=0) |
| log_err("equality test failed with conversion routine\n"); |
| } |
| else |
| { |
| log_err("ERR: calling toUChars: Didn't get U_BUFFER_OVERFLOW .. expected it.\n"); |
| } |
| /*Testing ucnv_fromUChars and ucnv_toUChars with error conditions*/ |
| err=U_ILLEGAL_ARGUMENT_ERROR; |
| log_verbose("\n---Testing ucnv_fromUChars() with err != U_ZERO_ERROR\n"); |
| targetcapacity = ucnv_fromUChars(myConverter, output_cp_buffer, testLong1, uchar1, -1, &err); |
| if (targetcapacity !=0) { |
| log_err("\nFAILURE: ucnv_fromUChars with err != U_ZERO_ERROR is expected to fail and return 0\n"); |
| } |
| err=U_ZERO_ERROR; |
| log_verbose("\n---Testing ucnv_fromUChars() with converter=NULL\n"); |
| targetcapacity = ucnv_fromUChars(NULL, output_cp_buffer, testLong1, uchar1, -1, &err); |
| if (targetcapacity !=0 || err != U_ILLEGAL_ARGUMENT_ERROR) { |
| log_err("\nFAILURE: ucnv_fromUChars with converter=NULL is expected to fail\n"); |
| } |
| err=U_ZERO_ERROR; |
| log_verbose("\n---Testing ucnv_fromUChars() with sourceLength = 0\n"); |
| targetcapacity = ucnv_fromUChars(myConverter, output_cp_buffer, testLong1, uchar1, 0, &err); |
| if (targetcapacity !=0) { |
| log_err("\nFAILURE: ucnv_fromUChars with sourceLength 0 is expected to return 0\n"); |
| } |
| log_verbose("\n---Testing ucnv_fromUChars() with targetLength = 0\n"); |
| targetcapacity = ucnv_fromUChars(myConverter, output_cp_buffer, 0, uchar1, -1, &err); |
| if (err != U_BUFFER_OVERFLOW_ERROR) { |
| log_err("\nFAILURE: ucnv_fromUChars with targetLength 0 is expected to fail and throw U_BUFFER_OVERFLOW_ERROR\n"); |
| } |
| /*toUChars with error conditions*/ |
| targetsize = ucnv_toUChars(myConverter, uchar2, targetsize, output_cp_buffer, strlen(output_cp_buffer), &err); |
| if(targetsize != 0){ |
| log_err("\nFAILURE: ucnv_toUChars with err != U_ZERO_ERROR is expected to fail and return 0\n"); |
| } |
| err=U_ZERO_ERROR; |
| targetsize = ucnv_toUChars(myConverter, uchar2, -1, output_cp_buffer, strlen(output_cp_buffer), &err); |
| if(targetsize != 0 || err != U_ILLEGAL_ARGUMENT_ERROR){ |
| log_err("\nFAILURE: ucnv_toUChars with targetsize < 0 is expected to throw U_ILLEGAL_ARGUMENT_ERROR and return 0\n"); |
| } |
| err=U_ZERO_ERROR; |
| targetsize = ucnv_toUChars(myConverter, uchar2, 0, output_cp_buffer, 0, &err); |
| if (targetsize !=0) { |
| log_err("\nFAILURE: ucnv_toUChars with sourceLength 0 is expected to return 0\n"); |
| } |
| targetcapacity2=0; |
| targetsize = ucnv_toUChars(myConverter, NULL, targetcapacity2, output_cp_buffer, strlen(output_cp_buffer), &err); |
| if (err != U_STRING_NOT_TERMINATED_WARNING) { |
| log_err("\nFAILURE: ucnv_toUChars(targetLength)->%s instead of U_STRING_NOT_TERMINATED_WARNING\n", |
| u_errorName(err)); |
| } |
| err=U_ZERO_ERROR; |
| /*-----*/ |
| |
| |
| /*testing for ucnv_fromUnicode() and ucnv_toUnicode() */ |
| /*Clean up re-usable vars*/ |
| j=0; |
| log_verbose("Testing ucnv_fromUnicode().....\n"); |
| tmp_ucs_buf=ucs_file_buffer_use; |
| ucnv_fromUnicode(myConverter, &mytarget_1, |
| mytarget + MAX_FILE_LEN, |
| &tmp_ucs_buf, |
| ucs_file_buffer_use+i, |
| NULL, |
| TRUE, |
| &err); |
| consumedUni = (UChar*)tmp_consumedUni; |
| |
| if (U_FAILURE(err)) |
| { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| else |
| log_verbose("ucnv_fromUnicode() o.k.\n"); |
| |
| /*Uni1 ----ToUnicode----> Cp2 ----FromUnicode---->Uni3 */ |
| log_verbose("Testing ucnv_toUnicode().....\n"); |
| tmp_mytarget_use=mytarget_use; |
| tmp_consumed = consumed; |
| ucnv_toUnicode(myConverter, &my_ucs_file_buffer_1, |
| my_ucs_file_buffer + MAX_FILE_LEN, |
| &tmp_mytarget_use, |
| mytarget_use + (mytarget_1 - mytarget), |
| NULL, |
| FALSE, |
| &err); |
| consumed = (char*)tmp_consumed; |
| if (U_FAILURE(err)) |
| { |
| log_err("FAILURE! %s\n", myErrorName(err)); |
| } |
| else |
| log_verbose("ucnv_toUnicode() o.k.\n"); |
| |
| |
| log_verbose("\n---Testing RoundTrip ...\n"); |
| |
| |
| u_strncpy(uchar3, my_ucs_file_buffer,i); |
| uchar3[i] = 0; |
| |
| if(u_strcmp(uchar1,uchar3)==0) |
| log_verbose("Equality test o.k.\n"); |
| else |
| log_err("Equality test failed\n"); |
| |
| /*sanity compare */ |
| if(uchar2 == NULL) |
| { |
| log_err("uchar2 was NULL (ccapitst.c line %d), couldn't do sanity check\n", __LINE__); |
| } |
| else |
| { |
| if(u_strcmp(uchar2, uchar3)==0) |
| log_verbose("Equality test o.k.\n"); |
| else |
| log_err("Equality test failed\n"); |
| } |
| |
| fclose(ucs_file_in); |
| ucnv_close(myConverter); |
| free(displayname); |
| if (uchar1 != 0) free(uchar1); |
| if (uchar2 != 0) free(uchar2); |
| if (uchar3 != 0) free(uchar3); |
| } |
| |
| free((void*)mytarget); |
| free((void*)output_cp_buffer); |
| free((void*)ucs_file_buffer); |
| free((void*)my_ucs_file_buffer); |
| } |
| |
| static UConverterFromUCallback otherUnicodeAction(UConverterFromUCallback MIA) |
| { |
| return (MIA==(UConverterFromUCallback)UCNV_FROM_U_CALLBACK_STOP)?(UConverterFromUCallback)UCNV_FROM_U_CALLBACK_SUBSTITUTE:(UConverterFromUCallback)UCNV_FROM_U_CALLBACK_STOP; |
| } |
| |
| |
| static UConverterToUCallback otherCharAction(UConverterToUCallback MIA) |
| { |
| return (MIA==(UConverterToUCallback)UCNV_TO_U_CALLBACK_STOP)?(UConverterToUCallback)UCNV_TO_U_CALLBACK_SUBSTITUTE:(UConverterToUCallback)UCNV_TO_U_CALLBACK_STOP; |
| } |
| |
| /** |
| * Test the converter alias API, specifically the fuzzy matching of |
| * alias names and the alias table integrity. Make sure each |
| * converter has at least one alias (itself), and that its listed |
| * aliases map back to itself. Check some hard-coded UTF-8 and |
| * ISO_2022 aliases to make sure they work. |
| */ |
| static void TestAlias() { |
| int32_t i, ncnv; |
| UErrorCode status = U_ZERO_ERROR; |
| |
| /* Predetermined aliases that we expect to map back to ISO_2022 |
| * and UTF-8. UPDATE THIS DATA AS NECESSARY. */ |
| const char* ISO_2022_NAMES[] = |
| {"ISO_2022", "iso-2022", "2022", |
| "cp2022", "iso2022", "iso_2022"}; |
| int32_t ISO_2022_NAMES_LENGTH = |
| sizeof(ISO_2022_NAMES) / sizeof(ISO_2022_NAMES[0]); |
| const char *UTF8_NAMES[] = |
| { "UTF-8", "utf-8", "utf8", "ibm-1208", |
| "utf_8", "ibm1208", "cp1208" }; |
| int32_t UTF8_NAMES_LENGTH = |
| sizeof(UTF8_NAMES) / sizeof(UTF8_NAMES[0]); |
| |
| struct { |
| const char *name; |
| const char *alias; |
| } CONVERTERS_NAMES[] = { |
| { "UTF-32BE", "UTF32_BigEndian" }, |
| { "UTF-32LE", "UTF32_LittleEndian" }, |
| { "UTF-32", "ISO-10646-UCS-4" }, |
| { "UTF-32", "UTF32_PlatformEndian" }, |
| { "UTF-32", "ucs-4" } |
| }; |
| int32_t CONVERTERS_NAMES_LENGTH = sizeof(CONVERTERS_NAMES) / sizeof(*CONVERTERS_NAMES); |
| |
| /* When there are bugs in gencnval or in ucnv_io, converters can |
| appear to have no aliases. */ |
| ncnv = ucnv_countAvailable(); |
| log_verbose("%d converters\n", ncnv); |
| for (i=0; i<ncnv; ++i) { |
| const char *name = ucnv_getAvailableName(i); |
| const char *alias0; |
| uint16_t na = ucnv_countAliases(name, &status); |
| uint16_t j; |
| |
| if (na == 0) { |
| log_err("FAIL: Converter \"%s\" (i=%d)" |
| " has no aliases; expect at least one\n", |
| name, i); |
| continue; |
| } |
| |
| alias0 = ucnv_getAlias(name, 0, &status); |
| for (j=1; j<na; ++j) { |
| const char *alias = ucnv_getAlias(name, j, &status); |
| /* Make sure each alias maps back to the the same list of |
| aliases. Assume that if alias 0 is the same, the whole |
| list is the same (this should always be true). */ |
| const char *mapBack; |
| |
| if (alias == NULL) { |
| log_err("FAIL: Converter \"%s\" -> " |
| "alias[%d]=NULL\n", |
| name, j); |
| continue; |
| } |
| |
| mapBack = ucnv_getAlias(alias, 0, &status); |
| |
| if (mapBack == NULL) { |
| log_err("FAIL: Converter \"%s\" -> " |
| "alias[%d]=\"%s\" -> " |
| "alias[0]=NULL, exp. \"%s\"\n", |
| name, j, alias, alias0); |
| continue; |
| } |
| |
| if (0 != uprv_strcmp(alias0, mapBack)) { |
| log_err("FAIL: Converter \"%s\" -> " |
| "alias[%d]=\"%s\" -> " |
| "alias[0]=\"%s\", exp. \"%s\"\n", |
| name, j, alias, mapBack, alias0); |
| } |
| } |
| } |
| |
| /* Check a list of predetermined aliases that we expect to map |
| * back to ISO_2022 and UTF-8. */ |
| for (i=1; i<ISO_2022_NAMES_LENGTH; ++i) { |
| const char* mapBack = ucnv_getAlias(ISO_2022_NAMES[i], 0, &status); |
| if (0 != uprv_strcmp(mapBack, ISO_2022_NAMES[0])) { |
| log_err("FAIL: \"%s\" -> \"%s\", expect ISO_2022\n", |
| ISO_2022_NAMES[i], mapBack); |
| } |
| } |
| |
| for (i=1; i<UTF8_NAMES_LENGTH; ++i) { |
| const char* mapBack = ucnv_getAlias(UTF8_NAMES[i], 0, &status); |
| if (0 != uprv_strcmp(mapBack, UTF8_NAMES[0])) { |
| log_err("FAIL: \"%s\" -> \"%s\", expect UTF-8\n", |
| UTF8_NAMES[i], mapBack); |
| } |
| } |
| |
| /* |
| * Check a list of predetermined aliases that we expect to map |
| * back to predermined converter names. |
| */ |
| |
| for (i = 0; i < CONVERTERS_NAMES_LENGTH; ++i) { |
| const char* mapBack = ucnv_getAlias(CONVERTERS_NAMES[i].alias, 0, &status); |
| if (0 != uprv_strcmp(mapBack, CONVERTERS_NAMES[i].name)) { |
| log_err("FAIL: \"%s\" -> \"%s\", expect %s\n", |
| CONVERTERS_NAMES[i].alias, mapBack, CONVERTERS_NAMES[i].name); |
| } |
| } |
| } |
| |
| static void TestConvertSafeClone() |
| { |
| #define CLONETEST_CONVERTER_COUNT 8 |
| |
| char charBuffer [21]; /* Leave at an odd number for alignment testing */ |
| uint8_t buffer [CLONETEST_CONVERTER_COUNT] [U_CNV_SAFECLONE_BUFFERSIZE]; |
| int32_t bufferSize = U_CNV_SAFECLONE_BUFFERSIZE; |
| UConverter * someConverters [CLONETEST_CONVERTER_COUNT]; |
| UConverter * someClonedConverters [CLONETEST_CONVERTER_COUNT]; |
| UConverter * cnv; |
| UErrorCode err = U_ZERO_ERROR; |
| |
| char *pCharBuffer; |
| const char *pConstCharBuffer; |
| const char *charBufferLimit = charBuffer + sizeof(charBuffer)/sizeof(*charBuffer); |
| UChar uniBuffer [] = {0x0058, 0x0059, 0x005A}; /* "XYZ" */ |
| UChar uniCharBuffer [20]; |
| char charSourceBuffer [] = { 0x1b, 0x24, 0x42 }; |
| const char *pCharSource = charSourceBuffer; |
| const char *pCharSourceLimit = charSourceBuffer + sizeof(charSourceBuffer); |
| UChar *pUCharTarget = uniCharBuffer; |
| UChar *pUCharTargetLimit = uniCharBuffer + sizeof(uniCharBuffer)/sizeof(*uniCharBuffer); |
| const UChar * pUniBuffer; |
| const UChar *uniBufferLimit = uniBuffer + sizeof(uniBuffer)/sizeof(*uniBuffer); |
| int index; |
| |
| /* one 'regular' & all the 'private stateful' converters */ |
| someConverters[0] = ucnv_open("ibm-1047", &err); |
| someConverters[1] = ucnv_open("ISO_2022", &err); |
| someConverters[2] = ucnv_open("SCSU", &err); |
| someConverters[3] = ucnv_open("HZ", &err); |
| someConverters[4] = ucnv_open("lmbcs", &err); |
| someConverters[5] = ucnv_open("ISCII,version=0",&err); |
| someConverters[6] = ucnv_open("ISO_2022,locale=kr,version=1",&err); |
| someConverters[7] = ucnv_open("ISO_2022,locale=jp,version=1",&err); |
| |
| /* Check the various error & informational states: */ |
| |
| /* Null status - just returns NULL */ |
| if (0 != ucnv_safeClone(someConverters[0], buffer[0], &bufferSize, 0)) |
| { |
| log_err("FAIL: Cloned converter failed to deal correctly with null status\n"); |
| } |
| /* error status - should return 0 & keep error the same */ |
| err = U_MEMORY_ALLOCATION_ERROR; |
| if (0 != ucnv_safeClone(someConverters[0], buffer[0], &bufferSize, &err) || err != U_MEMORY_ALLOCATION_ERROR) |
| { |
| log_err("FAIL: Cloned converter failed to deal correctly with incoming error status\n"); |
| } |
| err = U_ZERO_ERROR; |
| |
| /* Null buffer size pointer - just returns NULL & set error to U_ILLEGAL_ARGUMENT_ERROR*/ |
| if (0 != ucnv_safeClone(someConverters[0], buffer[0], 0, &err) || err != U_ILLEGAL_ARGUMENT_ERROR) |
| { |
| log_err("FAIL: Cloned converter failed to deal correctly with null bufferSize pointer\n"); |
| } |
| err = U_ZERO_ERROR; |
| |
| /* buffer size pointer is 0 - fill in pbufferSize with a size */ |
| bufferSize = 0; |
| if (0 != ucnv_safeClone(someConverters[0], buffer[0], &bufferSize, &err) || U_FAILURE(err) || bufferSize <= 0) |
| { |
| log_err("FAIL: Cloned converter failed a sizing request ('preflighting')\n"); |
| } |
| /* Verify our define is large enough */ |
| if (U_CNV_SAFECLONE_BUFFERSIZE < bufferSize) |
| { |
| log_err("FAIL: Pre-calculated buffer size is too small\n"); |
| } |
| /* Verify we can use this run-time calculated size */ |
| if (0 == (cnv = ucnv_safeClone(someConverters[0], buffer[0], &bufferSize, &err)) || U_FAILURE(err)) |
| { |
| log_err("FAIL: Converter can't be cloned with run-time size\n"); |
| } |
| if (cnv) |
| ucnv_close(cnv); |
| /* size one byte too small - should allocate & let us know */ |
| --bufferSize; |
| if (0 == (cnv = ucnv_safeClone(someConverters[0], 0, &bufferSize, &err)) || err != U_SAFECLONE_ALLOCATED_ERROR) |
| { |
| log_err("FAIL: Cloned converter failed to deal correctly with too-small buffer size\n"); |
| } |
| if (cnv) |
| ucnv_close(cnv); |
| err = U_ZERO_ERROR; |
| bufferSize = U_CNV_SAFECLONE_BUFFERSIZE; |
| |
| /* Null buffer pointer - return converter & set error to U_SAFECLONE_ALLOCATED_ERROR */ |
| if (0 == (cnv = ucnv_safeClone(someConverters[0], 0, &bufferSize, &err)) || err != U_SAFECLONE_ALLOCATED_ERROR) |
| { |
| log_err("FAIL: Cloned converter failed to deal correctly with null buffer pointer\n"); |
| } |
| if (cnv) |
| ucnv_close(cnv); |
| err = U_ZERO_ERROR; |
| |
| /* Null converter - return NULL & set U_ILLEGAL_ARGUMENT_ERROR */ |
| if (0 != ucnv_safeClone(0, buffer[0], &bufferSize, &err) || err != U_ILLEGAL_ARGUMENT_ERROR) |
| { |
| log_err("FAIL: Cloned converter failed to deal correctly with null converter pointer\n"); |
| } |
| |
| err = U_ZERO_ERROR; |
| |
| /* Do these cloned converters work at all - shuffle UChars to chars & back again..*/ |
| |
| for (index = 0; index < CLONETEST_CONVERTER_COUNT; index++) |
| { |
| bufferSize = U_CNV_SAFECLONE_BUFFERSIZE; |
| someClonedConverters[index] = ucnv_safeClone(someConverters[index], buffer[index], &bufferSize, &err); |
| pCharBuffer = charBuffer; |
| pUniBuffer = uniBuffer; |
| |
| ucnv_fromUnicode(someClonedConverters[index], |
| &pCharBuffer, |
| charBufferLimit, |
| &pUniBuffer, |
| uniBufferLimit, |
| NULL, |
| TRUE, |
| &err); |
| if(U_FAILURE(err)){ |
| log_err("FAIL: cloned converter failed to do fromU conversion. Error: %s\n",u_errorName(err)); |
| } |
| ucnv_toUnicode(someClonedConverters[index], |
| &pUCharTarget, |
| pUCharTargetLimit, |
| &pCharSource, |
| pCharSourceLimit, |
| NULL, |
| TRUE, |
| &err |
| ); |
| |
| if(U_FAILURE(err)){ |
| log_err("FAIL: cloned converter failed to do toU conversion. Error: %s\n",u_errorName(err)); |
| } |
| |
| pConstCharBuffer = charBuffer; |
| if (uniBuffer [0] != ucnv_getNextUChar(someClonedConverters[index], &pConstCharBuffer, pCharBuffer, &err)) |
| { |
| log_err("FAIL: Cloned converter failed to do conversion. Error: %s\n",u_errorName(err)); |
| } |
| ucnv_close(someClonedConverters[index]); |
| ucnv_close(someConverters[index]); |
| } |
| } |
| |
| static void TestCCSID() { |
| UConverter *cnv; |
| UErrorCode errorCode; |
| int32_t ccsids[]={ 37, 850, 943, 949, 950, 1047, 1252, 33722 }; |
| int32_t i, ccsid; |
| |
| for(i=0; i<(int32_t)(sizeof(ccsids)/sizeof(int32_t)); ++i) { |
| ccsid=ccsids[i]; |
| |
| errorCode=U_ZERO_ERROR; |
| cnv=ucnv_openCCSID(ccsid, UCNV_IBM, &errorCode); |
| if(U_FAILURE(errorCode)) { |
| log_err("error: ucnv_openCCSID(%ld) failed (%s)\n", ccsid, u_errorName(errorCode)); |
| continue; |
| } |
| |
| if(ccsid!=ucnv_getCCSID(cnv, &errorCode)) { |
| log_err("error: ucnv_getCCSID(ucnv_openCCSID(%ld))=%ld\n", ccsid, ucnv_getCCSID(cnv, &errorCode)); |
| } |
| |
| if(UCNV_IBM!=ucnv_getPlatform(cnv, &errorCode)) { |
| log_err("error: ucnv_getPlatform(ucnv_openCCSID(%ld))=%ld!=UCNV_IBM\n", ccsid, ucnv_getPlatform(cnv, &errorCode)); |
| } |
| |
| ucnv_close(cnv); |
| } |
| } |
| |
| /* jitterbug 932: ucnv_convert() bugs --------------------------------------- */ |
| |
| /* CHUNK_SIZE defined in common\ucnv.c: */ |
| #define CHUNK_SIZE 5*1024 |
| |
| static void bug1(void); |
| static void bug2(void); |
| static void bug3(void); |
| |
| static void |
| TestJ932(void) |
| { |
| bug1(); /* Unicode intermediate buffer straddle bug */ |
| bug2(); /* pre-flighting size incorrect caused by simple overflow */ |
| bug3(); /* pre-flighting size incorrect caused by expansion overflow */ |
| } |
| |
| /* |
| * jitterbug 932: test chunking boundary conditions in |
| |
| int32_t ucnv_convert(const char *toConverterName, |
| const char *fromConverterName, |
| char *target, |
| int32_t targetSize, |
| const char *source, |
| int32_t sourceSize, |
| UErrorCode * err) |
| |
| * See discussions on the icu mailing list in |
| * 2001-April with the subject "converter 'flush' question". |
| * |
| * Bug report and test code provided by Edward J. Batutis. |
| */ |
| static void bug1() |
| { |
| static char char_in[CHUNK_SIZE+32]; |
| static char char_out[CHUNK_SIZE*2]; |
| |
| /* GB 18030 equivalent of U+10000 is 90308130 */ |
| static const char test_seq[]={ (char)0x90u, 0x30, (char)0x81u, 0x30 }; |
| |
| UErrorCode err = U_ZERO_ERROR; |
| int32_t i, test_seq_len = sizeof(test_seq); |
| |
| /* |
| * causes straddle bug in Unicode intermediate buffer by sliding the test sequence forward |
| * until the straddle bug appears. I didn't want to hard-code everything so this test could |
| * be expanded - however this is the only type of straddle bug I can think of at the moment - |
| * a high surrogate in the last position of the Unicode intermediate buffer. Apparently no |
| * other Unicode sequences cause a bug since combining sequences are not supported by the |
| * converters. |
| */ |
| |
| for (i = test_seq_len; i >= 0; i--) { |
| /* put character sequence into input buffer */ |
| uprv_memset(char_in, 0x61, sizeof(char_in)); /* GB 18030 'a' */ |
| uprv_memcpy(char_in + (CHUNK_SIZE - i), test_seq, test_seq_len); |
| |
| /* do the conversion */ |
| ucnv_convert("us-ascii", /* out */ |
| "gb18030", /* in */ |
| char_out, |
| sizeof(char_out), |
| char_in, |
| sizeof(char_in), |
| &err); |
| |
| /* bug1: */ |
| if (err == U_TRUNCATED_CHAR_FOUND) { |
| /* this happens when surrogate pair straddles the intermediate buffer in |
| * T_UConverter_fromCodepageToCodepage */ |
| log_err("error j932 bug 1: expected success, got U_TRUNCATED_CHAR_FOUND\n"); |
| } |
| } |
| } |
| |
| /* bug2: pre-flighting loop bug: simple overflow causes bug */ |
| static void bug2() |
| { |
| /* US-ASCII "1234567890" */ |
| static const char source[]={ 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37, 0x38, 0x39 }; |
| static char target[5]; |
| |
| UErrorCode err = U_ZERO_ERROR; |
| int32_t size; |
| |
| /* do the conversion */ |
| size = ucnv_convert("iso-8859-1", /* out */ |
| "us-ascii", /* in */ |
| target, |
| sizeof(target), |
| source, |
| sizeof(source), |
| &err); |
| |
| if ( size != 10 ) { |
| /* bug2: size is 5, should be 10 */ |
| log_err("error j932 bug 2: got preflighting size %d instead of 10\n", size); |
| } |
| } |
| |
| /* |
| * bug3: when the characters expand going from source to target codepage |
| * you get bug3 in addition to bug2 |
| */ |
| static void bug3() |
| { |
| static char char_in[CHUNK_SIZE*4]; |
| static char target[5]; |
| UErrorCode err = U_ZERO_ERROR; |
| int32_t size; |
| |
| /* |
| * first get the buggy size from bug2 then |
| * compare it to buggy size with an expansion |
| */ |
| uprv_memset(char_in, 0x61, sizeof(char_in)); /* US-ASCII 'a' */ |
| |
| /* do the conversion */ |
| size = ucnv_convert("lmbcs", /* out */ |
| "us-ascii", /* in */ |
| target, |
| sizeof(target), |
| char_in, |
| sizeof(char_in), |
| &err); |
| |
| if ( size != sizeof(char_in) ) { |
| /* |
| * bug2: size is 0x2805 (CHUNK_SIZE*2+5 - maybe 5 is the size of the overflow buffer |
| * in the converter?), should be CHUNK_SIZE*4 |
| * |
| * Markus 2001-05-18: 5 is the size of our target[] here, ucnv_convert() did not reset targetSize... |
| */ |
| log_err("error j932 bug 2/3a: expected preflighting size 0x%04x, got 0x%04x\n", sizeof(char_in), size); |
| } |
| |
| /* |
| * now do the conversion with expansion |
| * ascii 0x08 expands to 0x0F 0x28 in lmbcs |
| */ |
| uprv_memset(char_in, 8, sizeof(char_in)); |
| err = U_ZERO_ERROR; |
| |
| /* do the conversion */ |
| size = ucnv_convert("lmbcs", /* out */ |
| "us-ascii", /* in */ |
| target, |
| sizeof(target), |
| char_in, |
| sizeof(char_in), |
| &err); |
| |
| /* expect 2X expansion */ |
| if ( size != sizeof(char_in) * 2 ) { |
| /* |
| * bug3: |
| * bug2 would lead us to expect 0x2805, but it isn't that either, it is 0x3c05: |
| */ |
| log_err("error j932 bug 3b: expected 0x%04x, got 0x%04x\n", sizeof(char_in) * 2, size); |
| } |
| } |