source/test/cintltst/ucnvseltst.c - external/github.com/unicode-org/icu - Git at Google

 /********************************************************************
  * Copyright (c) 1997-2008, International Business Machines
  * Corporation and others. All Rights Reserved.
  ********************************************************************
  *
  * File UCNVSELTST.C
  *
  * Modification History:
  *        Name                     Description
  *     MOHAMED ELDAWY               Creation
  ********************************************************************
  */

 /* C API AND FUNCTIONALITY TEST FOR CONVERTER SELECTOR (ucnvsel.h)*/

 #include "ucnvseltst.h"

 #include <stdio.h>

 #include "unicode/utypes.h"
 #include "unicode/ucnvsel.h"
 #include "unicode/ustring.h"
 #include "cmemory.h"
 #include "cstring.h"

 #define FILENAME_BUFFER 1024

 #define TDSRCPATH  ".."U_FILE_SEP_STRING"test"U_FILE_SEP_STRING"testdata"U_FILE_SEP_STRING

 static FILE *fopenOrError(const char *filename) {
     int32_t needLen;
     FILE *f;
     char fnbuf[FILENAME_BUFFER];
     const char* directory= ctest_dataSrcDir();
     needLen = uprv_strlen(directory)+uprv_strlen(TDSRCPATH)+uprv_strlen(filename)+1;
     if(needLen > FILENAME_BUFFER) {
         log_err("FAIL: Could not load %s. Filename buffer overflow, needed %d but buffer is %d\n",
                 filename, needLen, FILENAME_BUFFER);
         return NULL;
     }

     strcpy(fnbuf, directory);
     strcat(fnbuf, TDSRCPATH);
     strcat(fnbuf, filename);

     f = fopen(fnbuf, "rb");

     if(f == NULL) {
         log_data_err("FAIL: Could not load %s [%s]\n", fnbuf, filename);
     }
     return f;
 }

 void addCnvSelTest(TestNode** root)
 {
     addTest(root, &TestConversionUTF16, "tsconv/ucnvseltst/TestConversionUTF16");
     addTest(root, &TestConversionUTF8, "tsconv/ucnvseltst/TestConversionUTF8");
     addTest(root, &TestSerializationAndUnserialization, "tsconv/ucnvseltst/TestSerializationAndUnserialization");
 }

 /*
  * there doesn't seem to be a fn in ucnv to get the index of a converter
  * given one of its aliases!
  */
 int32_t findIndex (const char* converterName) {
   UErrorCode status = U_ZERO_ERROR;
   int32_t i;
   for (i = 0 ; i < ucnv_countAvailable() ; i++) {
     uint16_t alias_index;
     const char* convName = ucnv_getAvailableName(i);
     if(ucnv_compareNames(convName, converterName) == 0) {
       return i;
     }

     for (alias_index = 0 ; alias_index < ucnv_countAliases(convName, & status) ; alias_index++) {
       const char* aliasName = ucnv_getAlias(convName, alias_index, & status);
       if(ucnv_compareNames(aliasName, converterName) == 0) {
         return i;
       }
     }
   }
   return -1;
 }

 /*
  * fill a boolean array with whether the conversion succeeded
  * or not
  */
 void fillBool(UEnumeration* res, UBool* toFill, int32_t toFillLen) {
   UErrorCode status = U_ZERO_ERROR;
   int32_t i;
   for(i = 0 ; i < toFillLen ; i++)
     toFill[i] = FALSE;
   for(i = 0 ; i < uenum_count(res,&status) ; i++) {
     const char* name = uenum_next(res,NULL, &status);
     toFill[findIndex(name)] = TRUE;
   }
 }


 void verifyResultUTF8(const char* const s, const char** encodings, int32_t num_encodings, UEnumeration* res, const USet* excludedEncodings, const UConverterUnicodeSet   whichSet) {
   UBool* resultsFromSystem;
   UBool* resultsManually;
   int32_t i;
   resultsFromSystem = (UBool*) uprv_malloc(ucnv_countAvailable() * sizeof(UBool));
   resultsManually = (UBool*) uprv_malloc(ucnv_countAvailable() * sizeof(UBool));
   for(i = 0 ; i < ucnv_countAvailable() ; i++)
     resultsFromSystem[i] = resultsManually[i] = FALSE;


   for(i = 0 ; i < num_encodings ; i++) {
     UErrorCode status = U_ZERO_ERROR;
     /* get unicode set for that converter */
     USet* unicode_point_set;
     UConverter* test_converter;
     int32_t offset;
     int32_t length;
     UChar32 next;

     unicode_point_set = uset_open(1, 0);
     test_converter = ucnv_open(encodings[i], &status);
     ucnv_getUnicodeSet(test_converter, unicode_point_set,
                        whichSet, &status);


     offset = 0;
     length = uprv_strlen(s);

     resultsManually[findIndex(encodings[i])] = TRUE;
     next = 0;

     while(offset<length) {
       U8_NEXT(s, offset, length, next)
       if (next >= 0 && uset_contains(excludedEncodings, next)==FALSE && uset_contains(unicode_point_set, next)==FALSE) {
         resultsManually[findIndex(encodings[i])] = FALSE;
         break;
       }
     }
     uset_close(unicode_point_set);

     ucnv_close(test_converter);
   }

   /* fill the bool for the selector results! */
   fillBool(res, resultsFromSystem, ucnv_countAvailable());
   for(i = 0 ; i < ucnv_countAvailable() ; i++) {
     if(resultsManually[i] != resultsFromSystem[i]) {
       log_err("failure in converter selector converter %s had conflicting results manual: %d, system %d\n",ucnv_getAvailableName(i), resultsManually[i], resultsFromSystem[i]);
       exit(1);
     }
   }
   uprv_free(resultsFromSystem);
   uprv_free(resultsManually);
 }


 static void TestConversionUTF8()
 {
   /*
    * test cases are separated by a -1
    * each line is one test case including encodings to check for
    * I'd like to generate this array randomly but not sure if this is an allowed practice in ICU
    */
   int32_t encodingsTestCases[] = {  90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, -1,
                                     1, 3, 7, 9, 11, 13, 12, 15, 19, 20, 22, 24, -1,
                                     0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, -1,
                                     0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30, 32, 34, 36, 38, 40, 42, 44, 46, 48, 50, 52, 54, 56, -1,
                                     1, 5, 9, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, -1,
                                     0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29,
                                     30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59,
                                     60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89,
                                     90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129,
                                     130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159,
                                     160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189,
                                     190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, -1, 1, -1};

   int32_t test_case_count = sizeof(encodingsTestCases) / sizeof(encodingsTestCases[0]);

   USet* excluded_sets[3];
   int32_t i;
   int32_t prev, testCaseIdx;
   int32_t excluded_set_id;
   int32_t curCase = 0;

   excluded_sets[0] = uset_open(1,0);
   for(i = 1 ; i < 3 ; i++)
     excluded_sets[i] = uset_open(i*30, i*30+500);

  for(excluded_set_id = 0 ; excluded_set_id < 3 ; excluded_set_id++)
   for(testCaseIdx = 0, prev=0, curCase=0 ; testCaseIdx < test_case_count ; testCaseIdx++)
   {
     UErrorCode status;
     UEnumeration* res1;
     int32_t i;
     USet* partial_set;
     UConverterSelector* sel;
     char** encodings;
     int32_t num_rndm_encodings;
     int32_t totalStrLen;
     char* names;
     FILE* f1;
     int32_t counter;
     char c;
     char* text;
     int32_t curTestCase;

     if(encodingsTestCases[testCaseIdx] != -1) continue;
     curCase++;

     if(QUICK && curCase > 2)
       break;

     status = U_ZERO_ERROR;
     partial_set = NULL;
     encodings = (char**) uprv_malloc((testCaseIdx - prev) * sizeof(char*));
     num_rndm_encodings = testCaseIdx - prev;
     totalStrLen = 0;
     for(i = prev ; i < testCaseIdx ; i++) {
       totalStrLen += uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }
     names = (char*)uprv_malloc(totalStrLen);
     uprv_memset(names, 0, totalStrLen);

     for(i = prev ; i < testCaseIdx ; i++) {
       uprv_memcpy(names, ucnv_getAvailableName(encodingsTestCases[i]), uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i])));
       encodings[i-prev] = names;
       names+=uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }

     status = U_ZERO_ERROR;
     sel = ucnvsel_open((const char**)encodings, testCaseIdx-prev, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_SET, &status);
     /* count how many bytes (Is there a portable function that is more efficient than this?) */
     f1 = fopenOrError("ConverterSelectorTestUTF8.txt");
     if(!f1) {
         return;
     }
     counter = 0;
     while(fread(&c, sizeof(c), 1, f1) > 0)
         counter++;
     fclose(f1);
     text = (char*)uprv_malloc((counter+1));
     f1 = fopenOrError("ConverterSelectorTestUTF8.txt");
     if(!f1) {
         return;
     }
     fread(text,1, counter,f1);
     fclose(f1);


     for (i = 0 ; i < counter ; i++) {
       if(text[i] == '#')
         text[i] = 0;
     }
     text[counter] = 0;

     curTestCase=0;
     for (i = 0 ; i < counter ; i++) {
       if(i==0 || text[i-1] == 0) {
         curTestCase++;
         if(curTestCase > 2 && QUICK)
           break;
         /* test, both with length, and NULL terminated */
         res1 = ucnvsel_selectForUTF8(sel, text+i, -1, &status);
         /* make sure result is correct! */
         verifyResultUTF8(text+i, (const char**) encodings, num_rndm_encodings, res1, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_SET);
         uenum_close(res1);

         res1 = ucnvsel_selectForUTF8(sel, text+i, uprv_strlen(text+i), &status);
         /* make sure result is correct! */
         verifyResultUTF8(text+i, (const char**)encodings, num_rndm_encodings, res1, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_SET);
         uenum_close(res1);
       }
     }
     uprv_free(text);
     uprv_free(encodings[0]);
     uprv_free(encodings);
     ucnvsel_close(sel);
     prev = testCaseIdx + 1;
   }

 /* ////////////////////////////////////////////////////////////////////////// */

  /* try fallback mapping! */
  curCase = 0;
  for(excluded_set_id = 0 ; excluded_set_id < 3 ; excluded_set_id++)
   for(testCaseIdx = 0, prev=0, curCase=0 ; testCaseIdx < test_case_count ; testCaseIdx++)
   {
     UErrorCode status;
     UEnumeration* res1;
     int32_t i;
     USet* partial_set;
     UConverterSelector* sel;
     char** encodings;
     int32_t num_rndm_encodings;
     int32_t totalStrLen;
     char* names;
     FILE* f1;
     int32_t counter;
     char c;
     char* text;
     int32_t curTestCase;

     if(encodingsTestCases[testCaseIdx] != -1) continue;

     curCase++;

     if(QUICK && curCase > 2)
       break;

     status = U_ZERO_ERROR;
     partial_set = NULL;
     encodings = (char**)uprv_malloc((testCaseIdx - prev) * sizeof(char*));
     num_rndm_encodings = testCaseIdx - prev;
     totalStrLen = 0;
     for(i = prev ; i < testCaseIdx ; i++) {
       totalStrLen += uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }
     names = (char*)uprv_malloc(totalStrLen);
     uprv_memset(names, 0, totalStrLen);

     for(i = prev ; i < testCaseIdx ; i++) {
       uprv_memcpy(names, ucnv_getAvailableName(encodingsTestCases[i]), uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i])));
       encodings[i-prev] = names;
       names+=uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }


     status = U_ZERO_ERROR;
     sel = ucnvsel_open((const char**)encodings, testCaseIdx-prev, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_AND_FALLBACK_SET, &status);
     /* count how many bytes (Is there a portable function that is more efficient than this?) */
     f1 = fopenOrError("ConverterSelectorTestUTF8.txt");
     if(!f1) {
         return;
     }
     counter = 0;
     while(fread(&c, sizeof(c), 1, f1) > 0) counter++;
     fclose(f1);
     text = (char*)uprv_malloc(counter+1);
     f1 = fopenOrError("ConverterSelectorTestUTF8.txt");
     if(!f1) {
         return;
     }
     fread(text,1, counter,f1);
     fclose(f1);


     for (i = 0 ; i < counter ; i++) {
       if(text[i] == '#')
         text[i] = 0;
     }
     text[counter] = 0;

     curTestCase=0;
     for (i = 0 ; i < counter ; i++) {
       if(i==0 || text[i-1] == 0) {
         curTestCase++;
         if(curTestCase > 2 && QUICK)
           break;
         /* test, both with length, and NULL terminated */
         res1 = ucnvsel_selectForUTF8(sel, text+i, -1, &status);
         /* make sure result is correct! */
         verifyResultUTF8(text+i, (const char**)encodings, num_rndm_encodings, res1,excluded_sets[excluded_set_id],  UCNV_ROUNDTRIP_AND_FALLBACK_SET);
         uenum_close(res1);

         res1 = ucnvsel_selectForUTF8(sel, text+i, uprv_strlen(text+i), &status);
         /* make sure result is correct! */
         verifyResultUTF8(text+i, (const char**)encodings, num_rndm_encodings, res1,excluded_sets[excluded_set_id],  UCNV_ROUNDTRIP_AND_FALLBACK_SET);
         uenum_close(res1);
       }
     }
     uprv_free(encodings[0]);
     uprv_free(encodings);
     uprv_free(text);
     ucnvsel_close(sel);
     prev = testCaseIdx + 1;
   }


   for(i = 0 ; i < 3 ; i++)
     uset_close(excluded_sets[i]);

 }

 void verifyResultUTF16(const UChar* const s, const char** encodings, int32_t num_encodings, UEnumeration* res, const USet* excludedEncodings, const UConverterUnicodeSet   whichSet) {
   UBool* resultsFromSystem;
   UBool* resultsManually;
   int32_t i;
   resultsFromSystem = (UBool*) uprv_malloc(ucnv_countAvailable() * sizeof(UBool));
   resultsManually = (UBool*) uprv_malloc(ucnv_countAvailable() * sizeof(UBool));
   for(i = 0 ; i < ucnv_countAvailable() ; i++)
     resultsFromSystem[i] = resultsManually[i] = FALSE;


   for(i = 0 ; i < num_encodings ; i++) {
     UErrorCode status = U_ZERO_ERROR;

     /* get unicode set for that converter */
     USet* unicode_point_set;
     UConverter* test_converter;
     int32_t offset;
     int32_t length;
     UChar32 next;

     resultsManually[findIndex(encodings[i])] = TRUE;

     unicode_point_set = uset_open(1, 0);
     test_converter = ucnv_open(encodings[i], &status);
     ucnv_getUnicodeSet(test_converter, unicode_point_set,
                        whichSet, &status);

     offset = 0;
     length = u_strlen(s);

     resultsManually[findIndex(encodings[i])] = TRUE;
     next = 0;

     while(offset<length) {
     /* loop over string */
       U16_NEXT(s, offset, length, next)
       if (uset_contains(excludedEncodings, next)==FALSE && uset_contains(unicode_point_set, next)==FALSE) {
         resultsManually[findIndex(encodings[i])] = FALSE;
         break;
       }
     }
     uset_close(unicode_point_set);

     ucnv_close(test_converter);
   }

   /* fill the bool for the selector results! */
   fillBool(res, resultsFromSystem, ucnv_countAvailable());
   for(i = 0 ; i < ucnv_countAvailable() ; i++) {
     if(resultsManually[i] != resultsFromSystem[i]) {
       log_err("failure in converter selector converter %s had conflicting results manual: %d, system %d\n",ucnv_getAvailableName(i), resultsManually[i], resultsFromSystem[i]);
     }
   }

   uprv_free(resultsFromSystem);
   uprv_free(resultsManually);
 }

 /* does selectForUTF16() work well? */
 static void TestConversionUTF16()
 {
   /*
    * test cases are separated by a -1
    * each line is one test case including encodings to check for
    * I'd like to generate this array randomly but not sure if this is an allowed practice in ICU
    */
   int32_t encodingsTestCases[] = {  90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, -1,
                                     1, 3, 7, 9, 11, 13, 12, 15, 19, 20, 22, 24, -1,
                                     0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, -1,
                                     0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30, 32, 34, 36, 38, 40, 42, 44, 46, 48, 50, 52, 54, 56, -1,
                                     1, 5, 9, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, -1,
                                     0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29,
                                     30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59,
                                     60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89,
                                     90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129,
                                     130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159,
                                     160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189,
                                     190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, -1, 1, -1};

   int32_t test_case_count = sizeof(encodingsTestCases) / sizeof(encodingsTestCases[0]);

   USet* excluded_sets[3];
   int32_t i;
   int32_t prev, testCaseIdx;
   /* try roundtrip mapping */
   int32_t excluded_set_id;
   int32_t curCase = 0;

   excluded_sets[0] = uset_open(1,0);
   for(i = 1 ; i < 3 ; i++)
     excluded_sets[i] = uset_open(i*30, i*30+500);


  curCase = 0;
  for(excluded_set_id = 0 ; excluded_set_id < 3 ; excluded_set_id++)
   for(testCaseIdx = 0, prev=0, curCase=0 ; testCaseIdx < test_case_count ; testCaseIdx++)
   {
     UErrorCode status;
     UEnumeration* res1;
     int32_t i;
     USet* partial_set;
     UConverterSelector* sel;
     char** encodings;
     int32_t num_rndm_encodings;
     int32_t totalStrLen;
     char* names;
     FILE* f1;
     int32_t counter;
     UChar c;
     UChar* text;
     int32_t curTestCase;

     if(encodingsTestCases[testCaseIdx] != -1) continue;
     curCase++;

     if(QUICK && curCase > 2)
       break;

     status = U_ZERO_ERROR;
     partial_set = NULL;
     encodings = (char**) uprv_malloc((testCaseIdx - prev) * sizeof(char*));
     num_rndm_encodings = testCaseIdx - prev;
     totalStrLen = 0;
     for(i = prev ; i < testCaseIdx ; i++) {
       totalStrLen += uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }
     names = (char*)uprv_malloc(totalStrLen);
     uprv_memset(names, 0, totalStrLen);

     for(i = prev ; i < testCaseIdx ; i++) {
       uprv_memcpy(names, ucnv_getAvailableName(encodingsTestCases[i]), uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i])));
       encodings[i-prev] = names;
       names+=uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }

     status = U_ZERO_ERROR;
     sel = ucnvsel_open((const char**)encodings, testCaseIdx-prev, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_SET, &status);
     /* count how many bytes (Is there a portable function that is more efficient than this?) */
     f1 = fopenOrError("ConverterSelectorTestUTF16.txt");
     if(!f1) {
         return; /* error was already printed */
     }
     counter = 0;
     while(fread(&c, sizeof(c), 1, f1) > 0) counter++;
     fclose(f1);
     text = (UChar*)uprv_malloc((counter+1)*sizeof(UChar));
     f1 = fopenOrError("ConverterSelectorTestUTF16.txt");
     if(!f1) {
         return; /* error was already printed */
     }
     fread(text,sizeof(UChar), counter,f1);
     fclose(f1);


     for (i = 0 ; i < counter ; i++) {
       if(text[i] == (UChar)'#')
         text[i] = 0;
     }
     text[counter] = 0;

     curTestCase=0;
     for (i = 0 ; i < counter ; i++) {
       if(i==0 || text[i-1] == 0) {
         curTestCase++;
         if(curTestCase > 2 && QUICK)
           break;
         /* test, both with length, and NULL terminated */
         res1 = ucnvsel_selectForString(sel, text+i, -1, &status);
         /* make sure result is correct! */
         verifyResultUTF16(text+i, (const char**) encodings, num_rndm_encodings, res1, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_SET);
         uenum_close(res1);

         res1 = ucnvsel_selectForString(sel, text+i, u_strlen(text+i), &status);
         /* make sure result is correct! */
         verifyResultUTF16(text+i, (const char**)encodings, num_rndm_encodings, res1, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_SET);
         uenum_close(res1);
       }
     }
     uprv_free(text);
     uprv_free(encodings[0]);
     uprv_free(encodings);
     ucnvsel_close(sel);
     prev = testCaseIdx + 1;
   }

 /* ////////////////////////////////////////////////////////////////////////// */

  /* try fallback mapping! */

  for(excluded_set_id = 0 ; excluded_set_id < 3 ; excluded_set_id++)
   for(testCaseIdx = 0, prev=0, curCase=0 ; testCaseIdx < test_case_count ; testCaseIdx++)
   {
     UErrorCode status;
     UEnumeration* res1;
     int32_t i;
     USet* partial_set;
     UConverterSelector* sel;
     char** encodings;
     int32_t num_rndm_encodings;
     int32_t totalStrLen;
     char* names;
     FILE* f1;
     int32_t counter;
     UChar c;
     UChar* text;
     int32_t curTestCase;

     if(encodingsTestCases[testCaseIdx] != -1) continue;

     curCase++;

     if(QUICK && curCase > 2)
       break;

     status = U_ZERO_ERROR;
     partial_set = NULL;
     encodings = (char**)uprv_malloc((testCaseIdx - prev) * sizeof(char*));
     num_rndm_encodings = testCaseIdx - prev;
     totalStrLen = 0;
     for(i = prev ; i < testCaseIdx ; i++) {
       totalStrLen += uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }
     names = (char*)uprv_malloc(totalStrLen);
     uprv_memset(names, 0, totalStrLen);

     for(i = prev ; i < testCaseIdx ; i++) {
       uprv_memcpy(names, ucnv_getAvailableName(encodingsTestCases[i]), uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i])));
       encodings[i-prev] = names;
       names+=uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }


     /* first time */
     status = U_ZERO_ERROR;
     sel = ucnvsel_open((const char**)encodings, testCaseIdx-prev, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_AND_FALLBACK_SET, &status);
     /* count how many bytes (Is there a portable function that is more efficient than this?) */
     f1 = fopenOrError("ConverterSelectorTestUTF16.txt");
     if(!f1) {
         return; /* error was already printed */
     }
       counter = 0;
       while(fread(&c, sizeof(c), 1, f1) > 0) counter++;
     fclose(f1);
     text = (UChar*)uprv_malloc((counter+1)*sizeof(UChar));
     f1 = fopenOrError("ConverterSelectorTestUTF16.txt");
     if(!f1) {
         return; /* error was already printed */
     }
       fread(text,sizeof(UChar), counter,f1);
     fclose(f1);


     for (i = 0 ; i < counter ; i++) {
       if(text[i] == (UChar)'#')
         text[i] = 0;
     }
     text[counter] = 0;

     curTestCase=0;
     for (i = 0 ; i < counter ; i++) {
       if(i==0 || text[i-1] == 0) {
         curTestCase++;
         if(curTestCase > 2 && QUICK)
           break;
         /* test, both with length, and NULL terminated */
         res1 = ucnvsel_selectForString(sel, text+i, -1, &status);
         /* make sure result is correct! */
         verifyResultUTF16(text+i, (const char**)encodings, num_rndm_encodings, res1,excluded_sets[excluded_set_id],  UCNV_ROUNDTRIP_AND_FALLBACK_SET);
         uenum_close(res1);

         res1 = ucnvsel_selectForString(sel, text+i, u_strlen(text+i), &status);
         /* make sure result is correct! */
         verifyResultUTF16(text+i, (const char**)encodings, num_rndm_encodings, res1,excluded_sets[excluded_set_id],  UCNV_ROUNDTRIP_AND_FALLBACK_SET);
         uenum_close(res1);
       }
     }
     uprv_free(encodings[0]);
     uprv_free(encodings);
     uprv_free(text);
     ucnvsel_close(sel);
     prev = testCaseIdx + 1;
   }
   for(i = 0 ; i < 3 ; i++)
     uset_close(excluded_sets[i]);
 }


 /* does selectForUTF16() work well? */
 static void TestSerializationAndUnserialization()
 {
   /*
    * test cases are separated by a -1
    * each line is one test case including encodings to check for
    * I'd like to generate this array randomly but not sure if this is an allowed practice in ICU
    */
   int32_t encodingsTestCases[] = {  90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, -1,
                                     1, 3, 7, 9, 11, 13, 12, 15, 19, 20, 22, 24, -1,
                                     0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, -1,
                                     0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30, 32, 34, 36, 38, 40, 42, 44, 46, 48, 50, 52, 54, 56, -1,
                                     1, 5, 9, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, -1,
                                     0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29,
                                     30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59,
                                     60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89,
                                     90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129,
                                     130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159,
                                     160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189,
                                     190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, -1, 1, -1};

   int32_t test_case_count = sizeof(encodingsTestCases) / sizeof(encodingsTestCases[0]);


   USet* excluded_sets[3];
   int32_t i;
   int32_t prev, testCaseIdx;
   /* try roundtrip mapping */
   int32_t excluded_set_id;
   int32_t curCase;

  excluded_sets[0] = uset_open(1,0);
   for(i = 1 ; i < 3 ; i++)
     excluded_sets[i] = uset_open(i*30, i*30+500);


  curCase = 0;
  for(excluded_set_id = 0 ; excluded_set_id < 3 ; excluded_set_id++)
   for(testCaseIdx = 0, prev=0, curCase =0 ; testCaseIdx < test_case_count ; testCaseIdx++)
   {
     UErrorCode status;
     UEnumeration* res1;
     int32_t i;
     USet* partial_set;
     UConverterSelector* sel;
     char** encodings;
     int32_t num_rndm_encodings;
     int32_t totalStrLen;
     char* names;
     char *buffer;
     uint32_t ser_len;
     FILE* f1;
     int32_t counter;
     UChar c;
     UChar* text;
     int32_t curTestCase;

     if(encodingsTestCases[testCaseIdx] != -1) continue;

     curCase++;

     if(QUICK && curCase > 2)
       break;

     status = U_ZERO_ERROR;
     partial_set = NULL;
     encodings = (char**) uprv_malloc((testCaseIdx - prev) * sizeof(char*));
     num_rndm_encodings = testCaseIdx - prev;
     totalStrLen = 0;
     for(i = prev ; i < testCaseIdx ; i++) {
       totalStrLen += uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }
     names = (char*)uprv_malloc(totalStrLen);
     uprv_memset(names, 0, totalStrLen);

     for(i = prev ; i < testCaseIdx ; i++) {
       uprv_memcpy(names, ucnv_getAvailableName(encodingsTestCases[i]), uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i])));
       encodings[i-prev] = names;
       names+=uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }

     /* first time */
     status = U_ZERO_ERROR;
     sel = ucnvsel_open((const char**)encodings, testCaseIdx-prev, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_SET, &status);
     if (U_FAILURE(status)) {
       log_err("ucnvsel_open(test case %d) failed: %s\n", curCase, u_errorName(status));
       uprv_free(encodings);
       uprv_free(names);
       return;
     }

     buffer = NULL;
     ser_len = ucnvsel_serialize(sel, NULL, 0, &status);
     if (status != U_BUFFER_OVERFLOW_ERROR) {
       log_err("ucnvsel_serialize(test case %d preflighting) failed: %s\n", curCase, u_errorName(status));
       ucnvsel_close(sel);
       uprv_free(encodings);
       uprv_free(names);
       return;
     }
     buffer = uprv_malloc(ser_len);
     status = U_ZERO_ERROR;
     ucnvsel_serialize(sel, buffer, ser_len, &status);
     ucnvsel_close(sel);
     if (U_FAILURE(status)) {
       log_err("ucnvsel_serialize(test case %d) failed: %s\n", curCase, u_errorName(status));
       uprv_free(encodings);
       uprv_free(names);
       uprv_free(buffer);
       return;
     }
     sel = ucnvsel_openFromSerialized( buffer,  ser_len,&status);
     if (U_FAILURE(status)) {
       log_err("ucnvsel_openFromSerialized(test case %d) failed: %s\n", curCase, u_errorName(status));
       uprv_free(encodings);
       uprv_free(names);
       uprv_free(buffer);
       return;
     }

     /* count how many bytes (Is there a portable function that is more efficient than this?) */
     f1 = fopenOrError("ConverterSelectorTestUTF16.txt");
     if(!f1) {
         return; /* error was already printed */
     }
       counter = 0;
       while(fread(&c, sizeof(c), 1, f1) > 0) counter++;
     fclose(f1);
     text = (UChar*)uprv_malloc((counter+1)*sizeof(UChar));
     f1 = fopenOrError("ConverterSelectorTestUTF16.txt");
     if(!f1) {
         return; /* error was already printed */
     }
       fread(text,sizeof(text[0]), counter,f1);
     fclose(f1);

     for (i = 0 ; i < counter ; i++) {
       if(text[i] == (UChar)'#')
         text[i] = 0;
     }
     text[counter] = 0;

     curTestCase=0;
     for (i = 0 ; i < counter ; i++) {
       if(i==0 || text[i-1] == 0) {
         curTestCase++;
         if(curTestCase > 2 && QUICK)
           break;
         /* test, both with length, and NULL terminated */
         res1 = ucnvsel_selectForString(sel, text+i, -1, &status);
         if (U_FAILURE(status)) {
           log_err("ucnvsel_selectForString(test case %d, string %d with NUL) failed: %s\n",
                   curCase, curTestCase, u_errorName(status));
           continue;
         }
         /* make sure result is correct! */
         verifyResultUTF16(text+i, (const char**) encodings, num_rndm_encodings, res1, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_SET);
         uenum_close(res1);

         res1 = ucnvsel_selectForString(sel, text+i, u_strlen(text+i), &status);
         if (U_FAILURE(status)) {
           log_err("ucnvsel_selectForString(test case %d, string %d with length) failed: %s\n",
                   curCase, curTestCase, u_errorName(status));
           continue;
         }
         /* make sure result is correct! */
         verifyResultUTF16(text+i, (const char**)encodings, num_rndm_encodings, res1, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_SET);
         uenum_close(res1);
       }
     }
     uprv_free(text);
     uprv_free(encodings[0]);
     uprv_free(encodings);
     ucnvsel_close(sel);
     prev = testCaseIdx + 1;
     uprv_free(buffer);
   }

 /* ////////////////////////////////////////////////////////////////////////// */

  /* try fallback mapping! */
  for(excluded_set_id = 0 ; excluded_set_id < 3 ; excluded_set_id++)
   for(testCaseIdx = 0, prev=0, curCase=0 ; testCaseIdx < test_case_count ; testCaseIdx++)
   {
     UErrorCode status;
     UEnumeration* res1;
     int32_t i;
     USet* partial_set;
     UConverterSelector* sel;
     char** encodings;
     int32_t num_rndm_encodings;
     int32_t totalStrLen;
     char* names;
     char *buffer;
     uint32_t ser_len;
     FILE* f1;
     int32_t counter;
     UChar c;
     UChar* text;
     int32_t curTestCase;

     if(encodingsTestCases[testCaseIdx] != -1) continue;

     curCase++;

     if(QUICK && curCase > 2)
       break;

     status = U_ZERO_ERROR;
     partial_set = NULL;
     encodings = (char**)uprv_malloc((testCaseIdx - prev) * sizeof(char*));
     num_rndm_encodings = testCaseIdx - prev;
     totalStrLen = 0;
     for(i = prev ; i < testCaseIdx ; i++) {
       totalStrLen += uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }
     names = (char*)uprv_malloc(totalStrLen);
     uprv_memset(names, 0, totalStrLen);

     for(i = prev ; i < testCaseIdx ; i++) {
       uprv_memcpy(names, ucnv_getAvailableName(encodingsTestCases[i]), uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i])));
       encodings[i-prev] = names;
       names+=uprv_strlen(ucnv_getAvailableName(encodingsTestCases[i]))+1;
     }

     /* first time */
     status = U_ZERO_ERROR;
     sel = ucnvsel_open((const char**)encodings, testCaseIdx-prev, excluded_sets[excluded_set_id], UCNV_ROUNDTRIP_AND_FALLBACK_SET, &status);

     buffer = NULL;
     ser_len = ucnvsel_serialize(sel, NULL, 0, &status);
     buffer = uprv_malloc(ser_len);
     status = U_ZERO_ERROR;
     ucnvsel_serialize(sel, buffer, ser_len, &status);

     ucnvsel_close(sel);
     sel = ucnvsel_openFromSerialized( buffer,  ser_len,&status);

     /* count how many bytes (Is there a portable function that is more efficient than this?) */
     f1 = fopenOrError("ConverterSelectorTestUTF16.txt");
     if(!f1) {
         return; /* error was already printed */
     }
       counter = 0;
       while(fread(&c, sizeof(c), 1, f1) > 0) counter++;
     fclose(f1);
     text = (UChar*)uprv_malloc((counter+1)*sizeof(UChar));
     f1 = fopenOrError("ConverterSelectorTestUTF16.txt");
     if(!f1) {
         return; /* error was already printed */
     }
       fread(text,sizeof(text[0]), counter,f1);
     fclose(f1);

     for (i = 0 ; i < counter ; i++) {
       if(text[i] == (UChar)'#')
         text[i] = 0;
     }
     text[counter] = 0;

     curTestCase=0;
     for (i = 0 ; i < counter ; i++) {
       if(i==0 || text[i-1] == 0) {
         curTestCase++;
         if(curTestCase > 2 && QUICK)
           break;
         /* test, both with length, and NULL terminated */
         res1 = ucnvsel_selectForString(sel, text+i, -1, &status);
         /* make sure result is correct! */
         verifyResultUTF16(text+i, (const char**)encodings, num_rndm_encodings, res1,excluded_sets[excluded_set_id],  UCNV_ROUNDTRIP_AND_FALLBACK_SET);
         uenum_close(res1);

         res1 = ucnvsel_selectForString(sel, text+i, u_strlen(text+i), &status);
         /* make sure result is correct! */
         verifyResultUTF16(text+i, (const char**)encodings, num_rndm_encodings, res1,excluded_sets[excluded_set_id],  UCNV_ROUNDTRIP_AND_FALLBACK_SET);
         uenum_close(res1);
       }
     }
     uprv_free(encodings[0]);
     uprv_free(encodings);
     uprv_free(text);
     ucnvsel_close(sel);
     prev = testCaseIdx + 1;
     uprv_free(buffer);
   }

   for(i = 0 ; i < 3 ; i++)
     uset_close(excluded_sets[i]);
 }