| // © 2016 and later: Unicode, Inc. and others. |
| // License & terms of use: http://www.unicode.org/copyright.html |
| /* |
| ************************************************************************ |
| * Copyright (c) 1997-2003, International Business Machines |
| * Corporation and others. All Rights Reserved. |
| ************************************************************************ |
| */ |
| |
| #ifndef _NORMCONF |
| #define _NORMCONF |
| |
| #include "unicode/utypes.h" |
| |
| #if !UCONFIG_NO_NORMALIZATION |
| |
| #include "unicode/normalizer2.h" |
| #include "unicode/normlzr.h" |
| #include "intltest.h" |
| |
| typedef struct _FileStream FileStream; |
| |
| class NormalizerConformanceTest : public IntlTest { |
| Normalizer normalizer; |
| const Normalizer2 *nfc, *nfd, *nfkc, *nfkd; |
| |
| public: |
| NormalizerConformanceTest(); |
| virtual ~NormalizerConformanceTest(); |
| |
| void runIndexedTest(int32_t index, UBool exec, const char* &name, char* par=NULL); |
| |
| /** |
| * Test the conformance of Normalizer to |
| * http://www.unicode.org/Public/UNIDATA/NormalizationTest.txt |
| */ |
| void TestConformance(); |
| void TestConformance32(); |
| void TestConformance(FileStream *input, int32_t options); |
| |
| // Specific tests for debugging. These are generally failures taken from |
| // the conformance file, but culled out to make debugging easier. |
| void TestCase6(void); |
| |
| private: |
| FileStream *openNormalizationTestFile(const char *filename); |
| |
| /** |
| * Verify the conformance of the given line of the Unicode |
| * normalization (UTR 15) test suite file. For each line, |
| * there are five columns, corresponding to field[0]..field[4]. |
| * |
| * The following invariants must be true for all conformant implementations |
| * c2 == NFC(c1) == NFC(c2) == NFC(c3) |
| * c3 == NFD(c1) == NFD(c2) == NFD(c3) |
| * c4 == NFKC(c1) == NFKC(c2) == NFKC(c3) == NFKC(c4) == NFKC(c5) |
| * c5 == NFKD(c1) == NFKD(c2) == NFKD(c3) == NFKD(c4) == NFKD(c5) |
| * |
| * @param field the 5 columns |
| * @param line the source line from the test suite file |
| * @return true if the test passes |
| */ |
| UBool checkConformance(const UnicodeString* field, |
| const char *line, |
| int32_t options, |
| UErrorCode &status); |
| |
| UBool checkNorm(UNormalizationMode mode, int32_t options, |
| const Normalizer2 *norm2, |
| const UnicodeString &s, const UnicodeString &exp, |
| int32_t field); |
| |
| void iterativeNorm(const UnicodeString& str, |
| UNormalizationMode mode, int32_t options, |
| UnicodeString& result, |
| int8_t dir); |
| |
| /** |
| * @param op name of normalization form, e.g., "KC" |
| * @param op2 name of test case variant, e.g., "(-1)" |
| * @param s string being normalized |
| * @param got value received |
| * @param exp expected value |
| * @param msg description of this test |
| * @param return true if got == exp |
| */ |
| UBool assertEqual(const char *op, const char *op2, |
| const UnicodeString& s, |
| const UnicodeString& got, |
| const UnicodeString& exp, |
| const char *msg); |
| |
| /** |
| * Split a string into pieces based on the given delimiter |
| * character. Then, parse the resultant fields from hex into |
| * characters. That is, "0040 0400;0C00;0899" -> new String[] { |
| * "\u0040\u0400", "\u0C00", "\u0899" }. The output is assumed to |
| * be of the proper length already, and exactly output.length |
| * fields are parsed. If there are too few an exception is |
| * thrown. If there are too many the extras are ignored. |
| * |
| * @param buf scratch buffer |
| * @return FALSE upon failure |
| */ |
| UBool hexsplit(const char *s, char delimiter, |
| UnicodeString output[], int32_t outputLength); |
| |
| void _testOneLine(const char *line); |
| void compare(const UnicodeString& s1,const UnicodeString& s2); |
| }; |
| |
| #endif /* #if !UCONFIG_NO_NORMALIZATION */ |
| |
| #endif |