| /* |
| ******************************************************************************** |
| * |
| * Copyright (C) 1998-1999, International Business Machines |
| * Corporation and others. All Rights Reserved. |
| * |
| ******************************************************************************** |
| * |
| * |
| * makeconv.c: |
| * tool creating a binary (compressed) representation of the conversion mapping |
| * table (IBM NLTC ucmap format). |
| * |
| * 05/04/2000 helena Added fallback mapping into the picture... |
| * 06/29/2000 helena Major rewrite of the callback APIs. |
| */ |
| |
| #include <stdio.h> |
| #include "ucmp16.h" |
| #include "ucmp8.h" |
| #include "ucnv_io.h" |
| #include "unicode/ucnv_err.h" |
| #include "ucnv_bld.h" |
| #include "ucnv_imp.h" |
| #include "ucnv_cnv.h" |
| #include "cstring.h" |
| #include "cmemory.h" |
| #include "filestrm.h" |
| #include "toolutil.h" |
| #include "uoptions.h" |
| #include "unicode/udata.h" |
| #include "unewdata.h" |
| #include "ucmpwrit.h" |
| #include "makeconv.h" |
| #include "genmbcs.h" |
| |
| #ifdef XP_MAC_CONSOLE |
| # include <console.h> |
| #endif |
| |
| #define DEBUG 0 |
| |
| /* |
| * from ucnvstat.c - static prototypes of data-based converters |
| */ |
| extern const UConverterStaticData * ucnv_converterStaticData[UCNV_NUMBER_OF_SUPPORTED_CONVERTER_TYPES]; |
| |
| /* |
| * Global - verbosity |
| */ |
| UBool VERBOSE = FALSE; |
| |
| /*Reads the header of the table file and fills in basic knowledge about the converter |
| *in "converter" |
| */ |
| static void readHeaderFromFile(UConverterSharedData* myConverter, FileStream* convFile, const char* converterName, UErrorCode* err); |
| |
| /*Reads the rest of the file, and fills up the shared objects if necessary |
| Returns the UConverterTable. */ |
| static void loadTableFromFile(FileStream* convFile, UConverterSharedData* sharedData, UErrorCode* err); |
| |
| /* creates a UConverterSharedData from a mapping file. |
| * Fills in: *staticData, *table. Converter is NOT otherwise useful. |
| */ |
| static UConverterSharedData* createConverterFromTableFile(const char* realName, UErrorCode* err); |
| |
| /* |
| * Set up the UNewData and write the converter.. |
| */ |
| void writeConverterData(UConverterSharedData *mySharedData, const char *cnvName, const char *cnvDir, UErrorCode *status); |
| |
| /* |
| * Utility functions |
| */ |
| static UConverterPlatform getPlatformFromName(char* name); |
| static int32_t getCodepageNumberFromName(char* name); |
| |
/*
 * Separator sets used by the tokenizer. Each one is a NUL-terminated list of
 * characters; a token ends at the first character that is a member of the set.
 */
static const char NLTC_SEPARATORS[]              = "\r\n\t <>\"U";
static const char FALLBACK_SEPARATOR             = '|';
static const char PLAIN_SEPARATORS[]             = "\r\n\t <>\"";
static const char STATE_SEPARATORS[]             = "\r\n\t<>\"";    /* do not break on space */
static const char CODEPOINT_SEPARATORS[]         = "\r>\\x\n \t";
static const char UNICODE_CODEPOINT_SEPARATORS[] = "<>U \t";
| |
/*
 * Removes a '#' comment from "line", in place, and returns "line".
 *
 * - No '#' in the line: the line is left untouched.
 * - The first '|' (fallback separator) comes after the '#': the characters
 *   from the '#' up to, but not including, the '|' are overwritten with
 *   spaces so that the fallback indicator stays readable.
 * - Otherwise (no '|', or the '|' precedes the '#'): the line is cut off
 *   at the '#'.
 */
char *
removeComments (char *line)
{
    char *pound = uprv_strchr(line, '#');
    char *fallback = uprv_strchr(line, '|');

    if (pound == NULL)
    {
        return line;
    }

    if (fallback != NULL && fallback > pound)
    {
        uprv_memset(pound, ' ', fallback - pound);
    }
    else
    {
        /*
         * A '|' in front of the '#' must not be used as the end of the
         * comment: the distance would be negative and turn into a huge
         * unsigned length for the fill.
         */
        *pound = '\0';
    }
    return line;
}
| |
/*
 * Uppercases the NUL-terminated string "name" in place, one character at
 * a time through uprv_toupper(), and returns "name".
 */
char *
strtoupper (char *name)
{
    char *cursor = name;

    for (;;)
    {
        /* the terminator is passed through uprv_toupper() as well */
        *cursor = (char)uprv_toupper(*cursor);
        if (*cursor == '\0')
        {
            break;
        }
        ++cursor;
    }

    return name;
}
| |
| /* Returns true in c is a in set 'setOfChars', false otherwise |
| */ |
| UBool |
| isInSet (char c, const char *setOfChars) |
| { |
| uint8_t i = 0; |
| |
| while (setOfChars[i] != '\0') |
| { |
| if (c == setOfChars[i++]) |
| return TRUE; |
| } |
| |
| return FALSE; |
| } |
| |
/*
 * Returns the offset, counted from the start of "line", of the first
 * character that is not in "separators". If only separators remain, the
 * offset of the terminating NUL is returned.
 */
int32_t
nextTokenOffset (const char *line, const char *separators)
{
    int32_t offset;

    for (offset = 0; line[offset] != '\0'; ++offset)
    {
        if (!isInSet(line[offset], separators))
        {
            break;
        }
    }

    return offset;
}
| |
/*
 * Copies the next token of "line" into "token" and NUL-terminates it.
 *
 * Leading separator characters are skipped; the token then runs up to the
 * next separator or the end of the line. The result is an empty string if
 * no token is left.
 *
 * "token" must be large enough for the token plus the terminator - this
 * function has no way to check the capacity. A buffer as large as the line
 * buffer is always sufficient.
 *
 * Returns a pointer to the first character of "line" after the token.
 */
char *
getToken (char *token, char *line, const char *separators)
{
    int32_t i = nextTokenOffset (line, separators);
    /* 32-bit index: an 8-bit one turns negative for tokens longer than 127 characters */
    int32_t j = 0;

    while (line[i] && (!isInSet(line[i], separators)))
    {
        token[j++] = line[i++];
    }
    token[j] = '\0';

    return line + i;
}
| |
| UBool haveCopyright=TRUE; |
| |
| static UDataInfo dataInfo={ |
| sizeof(UDataInfo), |
| 0, |
| |
| U_IS_BIG_ENDIAN, |
| U_CHARSET_FAMILY, |
| sizeof(UChar), |
| 0, |
| |
| 0x63, 0x6e, 0x76, 0x74, /* dataFormat="cnvt" */ |
| 6, 0, 0, 0, /* formatVersion */ |
| 0, 0, 0, 0 /* dataVersion (calculated at runtime) */ |
| }; |
| |
| void writeConverterData(UConverterSharedData *mySharedData, |
| const char *cnvName, |
| const char *cnvDir, |
| UErrorCode *status) |
| { |
| UNewDataMemory *mem = NULL; |
| uint32_t sz2; |
| uint32_t size = 0; |
| |
| if(U_FAILURE(*status)) |
| { |
| return; |
| } |
| |
| mem = udata_create(cnvDir, "cnv", cnvName, &dataInfo, haveCopyright ? U_COPYRIGHT_STRING : NULL, status); |
| |
| if(U_FAILURE(*status)) |
| { |
| fprintf(stderr, "Couldn't create the udata %s.%s: %s\n", |
| cnvName, |
| "cnv", |
| u_errorName(*status)); |
| return; |
| } |
| |
| if(VERBOSE) |
| { |
| fprintf(stderr, "- Opened udata %s.%s\n", cnvName, "cnv"); |
| } |
| |
| /* all read only, clean, platform independent data. Mmmm. :) */ |
| udata_writeBlock(mem, mySharedData->staticData, sizeof(UConverterStaticData)); |
| size += sizeof(UConverterStaticData); /* Is 4-aligned - by size */ |
| /* Now, write the table */ |
| size += ((NewConverter *)mySharedData->table)->write((NewConverter *)mySharedData->table, mySharedData->staticData, mem); |
| |
| sz2 = udata_finish(mem, status); |
| if(size != sz2) |
| { |
| fprintf(stderr, "error: wrote %ld bytes to the .cnv file but counted %ld bytes\n", sz2, size); |
| *status=U_INTERNAL_PROGRAM_ERROR; |
| } |
| if(VERBOSE) |
| { |
| fprintf(stderr, "- Wrote %d bytes to the udata.\n", sz2); |
| } |
| } |
| |
| static UOption options[]={ |
| UOPTION_HELP_H, /* 0 Numbers for those who*/ |
| UOPTION_HELP_QUESTION_MARK, /* 1 can't count. */ |
| UOPTION_COPYRIGHT, /* 2 */ |
| UOPTION_VERSION, /* 3 */ |
| UOPTION_DESTDIR, /* 4 */ |
| UOPTION_VERBOSE /* 5 */ |
| }; |
| |
| int main(int argc, char* argv[]) |
| { |
| UConverterSharedData* mySharedData = NULL; |
| UErrorCode err = U_ZERO_ERROR; |
| char outFileName[UCNV_MAX_FULL_FILE_NAME_LENGTH]; |
| const char* destdir, *arg; |
| size_t destdirlen; |
| char* dot = NULL, *outBasename; |
| char cnvName[UCNV_MAX_FULL_FILE_NAME_LENGTH]; |
| UVersionInfo icuVersion; |
| |
| #ifdef XP_MAC_CONSOLE |
| argc = ccommand((char***)&argv); |
| #endif |
| |
| /* Set up the ICU version number */ |
| u_getVersion(icuVersion); |
| uprv_memcpy(&dataInfo.dataVersion, &icuVersion, sizeof(UVersionInfo)); |
| |
| /* preset then read command line options */ |
| options[4].value=u_getDataDirectory(); |
| argc=u_parseArgs(argc, argv, sizeof(options)/sizeof(options[0]), options); |
| |
| /* error handling, printing usage message */ |
| if(argc<0) { |
| fprintf(stderr, |
| "error in command line argument \"%s\"\n", |
| argv[-argc]); |
| } else if(argc<2) { |
| argc=-1; |
| } |
| if(argc<0 || options[0].doesOccur || options[1].doesOccur) { |
| fprintf(stderr, |
| "usage: %s [-options] files...\n" |
| "\tread .ucm codepage mapping files and write .cnv files\n" |
| "\toptions:\n" |
| "\t\t-h or -? or --help this usage text\n" |
| "\t\t-V or --version show a version message\n" |
| "\t\t-c or --copyright include a copyright notice\n" |
| "\t\t-d or --destdir destination directory, followed by the path\n" |
| "\t\t-v or --verbose Turn on verbose output\n", |
| argv[0]); |
| return argc<0 ? U_ILLEGAL_ARGUMENT_ERROR : U_ZERO_ERROR; |
| } |
| |
| if(options[3].doesOccur) { |
| fprintf(stderr,"makeconv version %hu.%hu, ICU tool to read .ucm codepage mapping files and write .cnv files\n", |
| dataInfo.formatVersion[0], dataInfo.formatVersion[1]); |
| fprintf(stderr, "Copyright (C) 1998-2000, International Business Machines\n"); |
| fprintf(stderr,"Corporation and others. All Rights Reserved.\n"); |
| exit(0); |
| } |
| |
| /* get the options values */ |
| haveCopyright = options[2].doesOccur; |
| destdir = options[4].value; |
| VERBOSE = options[5].doesOccur; |
| |
| if (destdir != NULL && *destdir != 0) { |
| uprv_strcpy(outFileName, destdir); |
| destdirlen = uprv_strlen(destdir); |
| outBasename = outFileName + destdirlen; |
| if (*(outBasename - 1) != U_FILE_SEP_CHAR) { |
| *outBasename++ = U_FILE_SEP_CHAR; |
| ++destdirlen; |
| } |
| } else { |
| destdirlen = 0; |
| outBasename = outFileName; |
| } |
| |
| #if DEBUG |
| { |
| int i; |
| printf("makeconv: processing %d files...\n", argc - 1); |
| for(i=1; i<argc; ++i) { |
| printf("%s ", argv[i]); |
| } |
| printf("\n"); |
| fflush(stdout); |
| } |
| #endif |
| |
| for (++argv; --argc; ++argv) |
| { |
| err = U_ZERO_ERROR; |
| arg = getLongPathname(*argv); |
| |
| /*produces the right destination path for display*/ |
| if (destdirlen != 0) |
| { |
| const char *basename; |
| |
| /* find the last file sepator */ |
| basename = uprv_strrchr(arg, U_FILE_SEP_CHAR); |
| if (basename == NULL) { |
| basename = arg; |
| } else { |
| ++basename; |
| } |
| |
| uprv_strcpy(outBasename, basename); |
| } |
| else |
| { |
| uprv_strcpy(outFileName, arg); |
| } |
| |
| /*removes the extension if any is found*/ |
| dot = uprv_strrchr(outBasename, '.'); |
| if (dot) |
| { |
| *dot = '\0'; |
| } |
| |
| /* the basename without extension is the converter name */ |
| uprv_strcpy(cnvName, outBasename); |
| |
| /*Adds the target extension*/ |
| uprv_strcat(outBasename, CONVERTER_FILE_EXTENSION); |
| |
| #if DEBUG |
| printf("makeconv: processing %s ...\n", arg); |
| fflush(stdout); |
| #endif |
| mySharedData = createConverterFromTableFile(arg, &err); |
| |
| if (U_FAILURE(err) || (mySharedData == NULL)) |
| { |
| /* if an error is found, print out an error msg and keep going */ |
| fprintf(stderr, "Error creating \"%s\" file for \"%s\" (error code %d - %s)\n", outFileName, arg, err, |
| u_errorName(err)); |
| err = U_ZERO_ERROR; |
| } |
| else |
| { |
| /* Make the static data name equal to the file name */ |
| if( /*VERBOSE && */ uprv_stricmp(cnvName,mySharedData->staticData->name)) |
| { |
| fprintf(stderr, "Warning: %s%s claims to be '%s'\n", |
| cnvName, |
| CONVERTER_FILE_EXTENSION, |
| mySharedData->staticData->name); |
| } |
| |
| uprv_strcpy((char*)mySharedData->staticData->name, cnvName); |
| |
| writeConverterData(mySharedData, cnvName, destdir, &err); |
| ((NewConverter *)mySharedData->table)->close((NewConverter *)mySharedData->table); |
| uprv_free((UConverterStaticData *)mySharedData->staticData); |
| uprv_free(mySharedData); |
| |
| if(U_FAILURE(err)) |
| { |
| /* if an error is found, print out an error msg and keep going*/ |
| fprintf(stderr, "Error writing \"%s\" file for \"%s\" (error code %d - %s)\n", outFileName, arg, err, |
| u_errorName(err)); |
| } |
| else |
| { |
| puts(outFileName); |
| } |
| } |
| |
| } |
| |
| return err; |
| } |
| |
| UConverterPlatform getPlatformFromName(char* name) |
| { |
| char myPlatform[10]; |
| char mySeparators[2] = { '-', '\0' }; |
| |
| getToken(myPlatform, name, mySeparators); |
| strtoupper(myPlatform); |
| |
| if (uprv_strcmp(myPlatform, "IBM") == 0) |
| return UCNV_IBM; |
| else |
| return UCNV_UNKNOWN; |
| } |
| |
/*
 * Extracts the codepage number from a converter name of the form
 * "platform-number": the second '-'-delimited token is converted with
 * T_CString_stringToInteger() in base 10 and the result is returned.
 * An empty string is converted if the name has no second token.
 *
 * The first token is skipped without being copied, and at most
 * sizeof(myNumber)-1 characters of the second token are used, so over-long
 * names cannot overflow the local buffer.
 */
int32_t getCodepageNumberFromName(char* name)
{
    char myNumber[10];
    const char *p = name;
    size_t length = 0;

    /* skip leading separators and the first token */
    while (*p == '-')
    {
        ++p;
    }
    while (*p != '\0' && *p != '-')
    {
        ++p;
    }

    /* skip the separators in front of the second token */
    while (*p == '-')
    {
        ++p;
    }

    /* copy the second token, bounded by the buffer size */
    while (*p != '\0' && *p != '-' && length < sizeof(myNumber) - 1)
    {
        myNumber[length++] = *p++;
    }
    myNumber[length] = '\0';

    return T_CString_stringToInteger(myNumber, 10);
}
| |
| /*Reads the header of the table file and fills in basic knowledge about the converter in "converter"*/ |
| void readHeaderFromFile(UConverterSharedData* mySharedData, |
| FileStream* convFile, |
| const char* converterName, |
| UErrorCode* err) |
| { |
| char storeLine[200]; |
| char key[16]; |
| char value[200]; |
| char* line = storeLine; |
| UBool endOfHeader = FALSE; |
| UBool hasConvClass = FALSE; |
| UBool hasSubChar = FALSE; |
| char codepointByte[3]; |
| |
| UConverterStaticData *myConverter = (UConverterStaticData *)mySharedData->staticData; |
| |
| if (U_FAILURE(*err)) return; |
| while (T_FileStream_readLine(convFile, line, sizeof(storeLine))) |
| { |
| removeComments(line); |
| |
| /*skip blank lines*/ |
| if (*(line + nextTokenOffset(line, NLTC_SEPARATORS)) != '\0') |
| { |
| /*gets the key that will qualify adjacent information*/ |
| /*gets the adjacent value*/ |
| line = getToken(key, line, NLTC_SEPARATORS); |
| if (uprv_strcmp(key, "uconv_class") == 0) |
| line = getToken(value, line, PLAIN_SEPARATORS); |
| else if (uprv_strcmp(key, "icu:state") == 0) |
| line = getToken(value, line, STATE_SEPARATORS); |
| else |
| line = getToken(value, line, NLTC_SEPARATORS); |
| |
| |
| /* |
| Figure out what key was found and fills in myConverter with the appropriate values |
| a switch statement for strings... |
| */ |
| |
| /*Checks for end of header marker*/ |
| if (uprv_strcmp(key, "CHARMAP") == 0) |
| { |
| endOfHeader = TRUE; |
| break; |
| } |
| |
| /*get name tag*/ |
| else if (uprv_strcmp(key, "code_set_name") == 0) |
| { |
| if (uprv_strlen(value) != 0) |
| { |
| uprv_strcpy((char*)myConverter->name, value); |
| myConverter->platform = (int8_t)getPlatformFromName(value); |
| myConverter->codepage = getCodepageNumberFromName(value); |
| } else { |
| uprv_strcpy((char*)myConverter->name, converterName); |
| myConverter->platform = UCNV_IBM; |
| } |
| |
| } |
| |
| /*get conversion type*/ |
| else if (uprv_strcmp(key, "uconv_class") == 0) |
| { |
| |
| hasConvClass = TRUE; |
| #if DEBUG |
| printf(" %s\n", value); |
| fflush(stdout); |
| #endif |
| if (uprv_strcmp(value, "DBCS") == 0) |
| { |
| myConverter->conversionType = UCNV_DBCS; |
| } |
| else if (uprv_strcmp(value, "SBCS") == 0) |
| { |
| myConverter->conversionType = UCNV_SBCS; |
| } |
| else if (uprv_strcmp(value, "MBCS") == 0) |
| { |
| myConverter->conversionType = UCNV_MBCS; |
| } |
| else if (uprv_strcmp(value, "EBCDIC_STATEFUL") == 0) |
| { |
| myConverter->conversionType = UCNV_EBCDIC_STATEFUL; |
| } |
| else |
| { |
| fprintf(stderr, "error: unknown <uconv_class> %s\n", key); |
| *err = U_INVALID_TABLE_FORMAT; |
| return; |
| } |
| |
| /* Now that we know the type, copy any 'default' values |
| from the table. */ |
| { |
| const UConverterStaticData *prototype = ucnv_converterStaticData[myConverter->conversionType]; |
| if ( prototype != NULL ) |
| { |
| if ( myConverter->name[0] == 0 ) |
| { |
| uprv_strcpy((char*)myConverter->name, prototype->name); |
| } |
| |
| if ( myConverter->codepage == 0 ) |
| { |
| myConverter->codepage = prototype->codepage; |
| } |
| |
| if ( myConverter->platform == 0 ) |
| { |
| myConverter->platform = prototype->platform; |
| } |
| |
| if ( myConverter->minBytesPerChar == 0 ) |
| { |
| myConverter->minBytesPerChar = prototype->minBytesPerChar; |
| } |
| |
| if ( myConverter->maxBytesPerChar == 0 ) |
| { |
| myConverter->maxBytesPerChar = prototype->maxBytesPerChar; |
| } |
| |
| if ( myConverter->subCharLen == 0 ) |
| { |
| myConverter->subCharLen = prototype->subCharLen; |
| uprv_memcpy(myConverter->subChar, prototype->subChar, |
| prototype->subCharLen); |
| } |
| } |
| } |
| |
| } |
| |
| /*get mb_cur_max amount*/ |
| else if (uprv_strcmp(key, "mb_cur_max") == 0) |
| myConverter->maxBytesPerChar = (int8_t)T_CString_stringToInteger(value, 10); |
| |
| /*get mb_cur_max amount*/ |
| else if (uprv_strcmp(key, "mb_cur_min") == 0) |
| myConverter->minBytesPerChar = (int8_t)T_CString_stringToInteger(value, 10); |
| |
| |
| else if (uprv_strcmp(key, "subchar") == 0) |
| { |
| hasSubChar = TRUE; |
| myConverter->subCharLen = 0; |
| |
| /*readies value for tokenizing, we want to break each byte of the codepoint into single tokens*/ |
| line = value; |
| while (*line) |
| { |
| line = getToken(codepointByte, line, CODEPOINT_SEPARATORS); |
| myConverter->subChar[(myConverter->subCharLen++)] = |
| (unsigned char)T_CString_stringToInteger(codepointByte, 16); |
| } |
| |
| /*Initializes data from the mutable area to that found in the immutable area*/ |
| |
| } |
| else if (uprv_strcmp(key, "icu:state") == 0) |
| { |
| if (myConverter->conversionType != UCNV_MBCS) |
| { |
| fprintf(stderr, "error: <icu:state> entry for non-MBCS table or before the <uconv_class> line\n"); |
| *err = U_INVALID_TABLE_FORMAT; |
| break; |
| } |
| if (myConverter->maxBytesPerChar == 0) |
| { |
| fprintf(stderr, "error: <icu:state> before the <mb_cur_max> line\n"); |
| *err = U_INVALID_TABLE_FORMAT; |
| break; |
| } |
| if (mySharedData->table == NULL) |
| { |
| mySharedData->table = (UConverterTable *)MBCSOpen(myConverter->maxBytesPerChar); |
| if (mySharedData->table == NULL) |
| { |
| *err = U_MEMORY_ALLOCATION_ERROR; |
| break; |
| } |
| } |
| if (!MBCSAddState((NewConverter *)mySharedData->table, value)) |
| { |
| *err = U_INVALID_TABLE_FORMAT; |
| } |
| } |
| } |
| /*make line point to the beginning of the storage buffer again*/ |
| line = storeLine; |
| } |
| |
| if (!endOfHeader || !hasConvClass) |
| { |
| *err = U_INVALID_TABLE_FORMAT; |
| } |
| else if (myConverter->conversionType == UCNV_MBCS && mySharedData->table == NULL) |
| { |
| fprintf(stderr, "error: missing state table information (<icu:state>) for MBCS\n"); |
| *err = U_INVALID_TABLE_FORMAT; |
| } |
| return; |
| } |
| |
| void loadTableFromFile(FileStream* convFile, UConverterSharedData* sharedData, UErrorCode* err) |
| { |
| char storageLine[200]; |
| char* line = NULL; |
| UConverterStaticData *staticData=(UConverterStaticData *)sharedData->staticData; |
| NewConverter *cnvData = (NewConverter *)sharedData->table; |
| UChar32 unicodeValue, codepageValue; |
| uint8_t mbcsBytes[8]; |
| int32_t mbcsLength; |
| char codepointBytes[20]; |
| UBool isOK = TRUE; |
| uint8_t precisionMask = 0; |
| char endOfLine; |
| |
| if(cnvData->startMappings!=NULL) |
| { |
| cnvData->startMappings(cnvData); |
| } |
| |
| staticData->hasFromUnicodeFallback = staticData->hasToUnicodeFallback = FALSE; |
| |
| while (T_FileStream_readLine(convFile, storageLine, sizeof(storageLine))) |
| { |
| removeComments(storageLine); |
| line = storageLine; |
| if (line[nextTokenOffset(line, NLTC_SEPARATORS)] != '\0') |
| { |
| /* get the Unicode code point */ |
| line = getToken(codepointBytes, line, UNICODE_CODEPOINT_SEPARATORS); |
| if (uprv_strcmp(codepointBytes, "END") == 0) |
| { |
| break; |
| } |
| unicodeValue = (UChar32)T_CString_stringToInteger(codepointBytes, 16); |
| |
| /* get the codepage bytes */ |
| codepageValue = 0; |
| mbcsLength = 0; |
| do |
| { |
| line = getToken(codepointBytes, line, CODEPOINT_SEPARATORS); |
| mbcsBytes[mbcsLength] = (uint8_t)T_CString_stringToInteger(codepointBytes, 16); |
| codepageValue = codepageValue << 8 | mbcsBytes[mbcsLength++]; |
| |
| /* End of line could be \0 or | (if fallback) */ |
| endOfLine= line[nextTokenOffset(line, CODEPOINT_SEPARATORS)]; |
| } while((endOfLine != '\0') && (endOfLine != FALLBACK_SEPARATOR)); |
| if((uint32_t)unicodeValue > 0x10ffff) |
| { |
| fprintf(stderr, "error: Unicode code point > U+10ffff in '%s'\n", storageLine); |
| isOK = FALSE; |
| } |
| else if(endOfLine == FALLBACK_SEPARATOR) |
| { |
| /* we know that there is a fallback separator */ |
| precisionMask |= 1; |
| line = uprv_strchr(line, FALLBACK_SEPARATOR) + 1; |
| switch(*line) |
| { |
| case '0': |
| /* set roundtrip mappings */ |
| isOK &= cnvData->addToUnicode(cnvData, mbcsBytes, mbcsLength, unicodeValue, codepageValue, 0) && |
| cnvData->addFromUnicode(cnvData, mbcsBytes, mbcsLength, unicodeValue, codepageValue, 0); |
| break; |
| case '1': |
| /* set only a fallback mapping from Unicode to codepage */ |
| staticData->hasFromUnicodeFallback = TRUE; |
| isOK &= cnvData->addFromUnicode(cnvData, mbcsBytes, mbcsLength, unicodeValue, codepageValue, 1); |
| break; |
| case '2': |
| /* skip subchar mappings */ |
| break; |
| case '3': |
| /* set only a fallback mapping from codepage to Unicode */ |
| staticData->hasToUnicodeFallback = TRUE; |
| isOK &= cnvData->addToUnicode(cnvData, mbcsBytes, mbcsLength, unicodeValue, codepageValue, 1); |
| break; |
| default: |
| fprintf(stderr, "error: illegal fallback indicator '%s' in '%s'\n", line - 1, storageLine); |
| *err = U_INVALID_TABLE_FORMAT; |
| break; |
| } |
| } |
| else |
| { |
| precisionMask |= 2; |
| /* set the mappings */ |
| isOK &= cnvData->addToUnicode(cnvData, mbcsBytes, mbcsLength, unicodeValue, codepageValue, -1) && |
| cnvData->addFromUnicode(cnvData, mbcsBytes, mbcsLength, unicodeValue, codepageValue, -1); |
| } |
| } |
| } |
| |
| if(cnvData->finishMappings!=NULL) |
| { |
| cnvData->finishMappings(cnvData, staticData); |
| } |
| |
| if(!isOK) |
| { |
| *err = U_INVALID_TABLE_FORMAT; |
| } |
| else if(precisionMask == 3) |
| { |
| fprintf(stderr, "error: some entries have the mapping precision (with '|'), some do not\n"); |
| *err = U_INVALID_TABLE_FORMAT; |
| } |
| } |
| |
| /*creates a UConverterStaticData, fills in necessary links to it the appropriate function pointers*/ |
| UConverterSharedData* createConverterFromTableFile(const char* converterName, UErrorCode* err) |
| { |
| FileStream* convFile = NULL; |
| UConverterSharedData* mySharedData = NULL; |
| UConverterStaticData* myStaticData = NULL; |
| |
| if (U_FAILURE(*err)) return NULL; |
| |
| convFile = T_FileStream_open(converterName, "r"); |
| if (convFile == NULL) |
| { |
| *err = U_FILE_ACCESS_ERROR; |
| return NULL; |
| } |
| |
| |
| mySharedData = (UConverterSharedData*) uprv_malloc(sizeof(UConverterSharedData)); |
| if (mySharedData == NULL) |
| { |
| *err = U_MEMORY_ALLOCATION_ERROR; |
| T_FileStream_close(convFile); |
| return NULL; |
| } |
| |
| uprv_memset(mySharedData, 0, sizeof(UConverterSharedData)); |
| |
| mySharedData->structSize = sizeof(UConverterSharedData); |
| |
| myStaticData = (UConverterStaticData*) uprv_malloc(sizeof(UConverterStaticData)); |
| if (myStaticData == NULL) |
| { |
| *err = U_MEMORY_ALLOCATION_ERROR; |
| T_FileStream_close(convFile); |
| return NULL; |
| } |
| uprv_memset(myStaticData, 0, sizeof(UConverterStaticData)); |
| mySharedData->staticData = myStaticData; |
| myStaticData->structSize = sizeof(UConverterStaticData); |
| mySharedData->staticDataOwned = TRUE; |
| |
| uprv_strcpy(myStaticData->name, converterName); |
| |
| mySharedData->dataMemory = NULL; /* for init */ |
| |
| readHeaderFromFile(mySharedData, convFile, converterName, err); |
| |
| if (U_FAILURE(*err)) return NULL; |
| |
| switch (myStaticData->conversionType) |
| { |
| case UCNV_SBCS: |
| { |
| mySharedData->table = (UConverterTable *)SBCSOpen(); |
| break; |
| } |
| case UCNV_MBCS: |
| { |
| /* MBCSOpen() was called by */ |
| break; |
| } |
| case UCNV_EBCDIC_STATEFUL: |
| { |
| mySharedData->table = (UConverterTable *)EBCDICStatefulOpen(); |
| break; |
| } |
| case UCNV_DBCS: |
| { |
| mySharedData->table = (UConverterTable *)DBCSOpen(); |
| break; |
| } |
| |
| default : |
| fprintf(stderr, "error: <uconv_class> omitted\n"); |
| *err = U_INVALID_TABLE_FORMAT; |
| mySharedData->table = NULL; |
| break; |
| }; |
| |
| if(mySharedData->table != NULL) |
| { |
| loadTableFromFile(convFile, mySharedData, err); |
| } |
| |
| T_FileStream_close(convFile); |
| |
| return mySharedData; |
| } |
| |
| /* |
| * Hey, Emacs, please set the following: |
| * |
| * Local Variables: |
| * indent-tabs-mode: nil |
| * End: |
| * |
| */ |