blob: a0f5e277e00e978313ba1495a0ef805490e53281 [file] [log] [blame]
/*
*******************************************************************************
*
* Copyright (C) 2004-2008, International Business Machines
* Corporation and others. All Rights Reserved.
*
*******************************************************************************
* file name: gencase.h
* encoding: US-ASCII
* tab size: 8 (not used)
* indentation:4
*
* created on: 2004aug28
* created by: Markus W. Scherer
*/
#ifndef __GENCASE_H__
#define __GENCASE_H__
#include "unicode/utypes.h"
#include "utrie.h"
#include "ucase.h"
U_CDECL_BEGIN
/* Unicode versions --------------------------------------------------------- */
enum {
UNI_1_0,
UNI_1_1,
UNI_2_0,
UNI_3_0,
UNI_3_1,
UNI_3_2,
UNI_4_0,
UNI_4_0_1,
UNI_4_1,
UNI_VER_COUNT
};
extern int32_t ucdVersion;
/* gencase ------------------------------------------------------------------ */
#define UGENCASE_EXC_SHIFT 16
#define UGENCASE_EXC_MASK 0xffff0000
/*
* Values for the ucase.icu unfold[] data array, see store.c.
* The values are stored in ucase.icu so that the runtime code will work with
* changing values, but they are hardcoded for gencase for simplicity.
* They are optimized, that is, provide for minimal table column widths,
* for the actual Unicode data, so that the table size is minimized.
* Future versions of Unicode may require increases of some of these values.
*/
enum {
UGENCASE_UNFOLD_STRING_WIDTH=3,
UGENCASE_UNFOLD_CP_WIDTH=2,
UGENCASE_UNFOLD_WIDTH=UGENCASE_UNFOLD_STRING_WIDTH+UGENCASE_UNFOLD_CP_WIDTH,
UGENCASE_UNFOLD_MAX_ROWS=250
};
/* Values for additional data stored in pv column 1 */
enum {
UGENCASE_IS_MID_LETTER_SHIFT /* bit 0 WB=MidLetter or WB=MidNumLet */
};
/* special casing data */
typedef struct {
UChar32 code;
UBool isComplex;
UChar lowerCase[32], upperCase[32], titleCase[32];
} SpecialCasing;
/* case folding data */
typedef struct {
UChar32 code, simple;
char status;
UChar full[32];
} CaseFolding;
/* case mapping properties */
typedef struct {
UChar32 code, lowerCase, upperCase, titleCase;
UChar32 closure[8];
SpecialCasing *specialCasing;
CaseFolding *caseFolding;
uint8_t gc, cc;
} Props;
/* global flags */
extern UBool beVerbose, haveCopyright;
/* properties vectors in gencase.c */
extern uint32_t *pv;
/* prototypes */
U_CFUNC void
writeUCDFilename(char *basename, const char *filename, const char *suffix);
U_CFUNC UBool
isToken(const char *token, const char *s);
extern void
setUnicodeVersion(const char *v);
extern void
setProps(Props *p);
U_CFUNC uint32_t U_EXPORT2
getFoldedPropsValue(UNewTrie *trie, UChar32 start, int32_t offset);
extern void
addCaseSensitive(UChar32 first, UChar32 last);
extern void
makeCaseClosure(void);
extern void
makeExceptions(void);
extern void
generateData(const char *dataDir, UBool csource);
U_CDECL_END
#endif