blob: 52a955fa38c0fe548fdd0d87b4a99ab377c405b6 [file] [log] [blame]
/*
*******************************************************************************
* Copyright (C) 1996-2012, International Business Machines Corporation and *
* others. All Rights Reserved. *
*******************************************************************************
*/
package com.ibm.icu.dev.test.rbbi;
import java.text.StringCharacterIterator;
import java.util.ArrayList;
import java.util.List;
import java.util.Locale;
import com.ibm.icu.dev.test.TestFmwk;
import com.ibm.icu.text.BreakIterator;
public class BreakIteratorTest extends TestFmwk
{
private BreakIterator characterBreak;
private BreakIterator wordBreak;
private BreakIterator lineBreak;
private BreakIterator sentenceBreak;
private BreakIterator titleBreak;
public static void main(String[] args) throws Exception {
new BreakIteratorTest().run(args);
}
public BreakIteratorTest()
{
}
protected void init(){
characterBreak = BreakIterator.getCharacterInstance();
wordBreak = BreakIterator.getWordInstance();
lineBreak = BreakIterator.getLineInstance();
//logln("Creating sentence iterator...");
sentenceBreak = BreakIterator.getSentenceInstance();
//logln("Finished creating sentence iterator...");
titleBreak = BreakIterator.getTitleInstance();
}
//=========================================================================
// general test subroutines
//=========================================================================
private void generalIteratorTest(BreakIterator bi, List<String> expectedResult) {
StringBuffer buffer = new StringBuffer();
String text;
for (int i = 0; i < expectedResult.size(); i++) {
text = expectedResult.get(i);
buffer.append(text);
}
text = buffer.toString();
bi.setText(text);
List<String> nextResults = _testFirstAndNext(bi, text);
List<String> previousResults = _testLastAndPrevious(bi, text);
logln("comparing forward and backward...");
int errs = getErrorCount();
compareFragmentLists("forward iteration", "backward iteration", nextResults,
previousResults);
if (getErrorCount() == errs) {
logln("comparing expected and actual...");
compareFragmentLists("expected result", "actual result", expectedResult,
nextResults);
}
int[] boundaries = new int[expectedResult.size() + 3];
boundaries[0] = BreakIterator.DONE;
boundaries[1] = 0;
for (int i = 0; i < expectedResult.size(); i++)
boundaries[i + 2] = boundaries[i + 1] + (expectedResult.get(i)).
length();
boundaries[boundaries.length - 1] = BreakIterator.DONE;
_testFollowing(bi, text, boundaries);
_testPreceding(bi, text, boundaries);
_testIsBoundary(bi, text, boundaries);
doMultipleSelectionTest(bi, text);
}
private List<String> _testFirstAndNext(BreakIterator bi, String text) {
int p = bi.first();
int lastP = p;
List<String> result = new ArrayList<String>();
if (p != 0)
errln("first() returned " + p + " instead of 0");
while (p != BreakIterator.DONE) {
p = bi.next();
if (p != BreakIterator.DONE) {
if (p <= lastP)
errln("next() failed to move forward: next() on position "
+ lastP + " yielded " + p);
result.add(text.substring(lastP, p));
}
else {
if (lastP != text.length())
errln("next() returned DONE prematurely: offset was "
+ lastP + " instead of " + text.length());
}
lastP = p;
}
return result;
}
private List<String> _testLastAndPrevious(BreakIterator bi, String text) {
int p = bi.last();
int lastP = p;
List<String> result = new ArrayList<String>();
if (p != text.length())
errln("last() returned " + p + " instead of " + text.length());
while (p != BreakIterator.DONE) {
p = bi.previous();
if (p != BreakIterator.DONE) {
if (p >= lastP)
errln("previous() failed to move backward: previous() on position "
+ lastP + " yielded " + p);
result.add(0, text.substring(p, lastP));
}
else {
if (lastP != 0)
errln("previous() returned DONE prematurely: offset was "
+ lastP + " instead of 0");
}
lastP = p;
}
return result;
}
private void compareFragmentLists(String f1Name, String f2Name, List<String> f1, List<String> f2) {
int p1 = 0;
int p2 = 0;
String s1;
String s2;
int t1 = 0;
int t2 = 0;
while (p1 < f1.size() && p2 < f2.size()) {
s1 = f1.get(p1);
s2 = f2.get(p2);
t1 += s1.length();
t2 += s2.length();
if (s1.equals(s2)) {
debugLogln(" >" + s1 + "<");
++p1;
++p2;
}
else {
int tempT1 = t1;
int tempT2 = t2;
int tempP1 = p1;
int tempP2 = p2;
while (tempT1 != tempT2 && tempP1 < f1.size() && tempP2 < f2.size()) {
while (tempT1 < tempT2 && tempP1 < f1.size()) {
tempT1 += (f1.get(tempP1)).length();
++tempP1;
}
while (tempT2 < tempT1 && tempP2 < f2.size()) {
tempT2 += (f2.get(tempP2)).length();
++tempP2;
}
}
logln("*** " + f1Name + " has:");
while (p1 <= tempP1 && p1 < f1.size()) {
s1 = f1.get(p1);
t1 += s1.length();
debugLogln(" *** >" + s1 + "<");
++p1;
}
logln("***** " + f2Name + " has:");
while (p2 <= tempP2 && p2 < f2.size()) {
s2 = f2.get(p2);
t2 += s2.length();
debugLogln(" ***** >" + s2 + "<");
++p2;
}
errln("Discrepancy between " + f1Name + " and " + f2Name);
}
}
}
private void _testFollowing(BreakIterator bi, String text, int[] boundaries) {
logln("testFollowing():");
int p = 2;
for (int i = 0; i <= text.length(); i++) {
if (i == boundaries[p])
++p;
int b = bi.following(i);
logln("bi.following(" + i + ") -> " + b);
if (b != boundaries[p])
errln("Wrong result from following() for " + i + ": expected " + boundaries[p]
+ ", got " + b);
}
}
private void _testPreceding(BreakIterator bi, String text, int[] boundaries) {
logln("testPreceding():");
int p = 0;
for (int i = 0; i <= text.length(); i++) {
int b = bi.preceding(i);
logln("bi.preceding(" + i + ") -> " + b);
if (b != boundaries[p])
errln("Wrong result from preceding() for " + i + ": expected " + boundaries[p]
+ ", got " + b);
if (i == boundaries[p + 1])
++p;
}
}
private void _testIsBoundary(BreakIterator bi, String text, int[] boundaries) {
logln("testIsBoundary():");
int p = 1;
boolean isB;
for (int i = 0; i <= text.length(); i++) {
isB = bi.isBoundary(i);
logln("bi.isBoundary(" + i + ") -> " + isB);
if (i == boundaries[p]) {
if (!isB)
errln("Wrong result from isBoundary() for " + i + ": expected true, got false");
++p;
}
else {
if (isB)
errln("Wrong result from isBoundary() for " + i + ": expected false, got true");
}
}
}
private void doMultipleSelectionTest(BreakIterator iterator, String testText)
{
logln("Multiple selection test...");
BreakIterator testIterator = (BreakIterator)iterator.clone();
int offset = iterator.first();
int testOffset;
int count = 0;
do {
testOffset = testIterator.first();
testOffset = testIterator.next(count);
logln("next(" + count + ") -> " + testOffset);
if (offset != testOffset)
errln("next(n) and next() not returning consistent results: for step " + count + ", next(n) returned " + testOffset + " and next() had " + offset);
if (offset != BreakIterator.DONE) {
count++;
offset = iterator.next();
}
} while (offset != BreakIterator.DONE);
// now do it backwards...
offset = iterator.last();
count = 0;
do {
testOffset = testIterator.last();
testOffset = testIterator.next(count);
logln("next(" + count + ") -> " + testOffset);
if (offset != testOffset)
errln("next(n) and next() not returning consistent results: for step " + count + ", next(n) returned " + testOffset + " and next() had " + offset);
if (offset != BreakIterator.DONE) {
count--;
offset = iterator.previous();
}
} while (offset != BreakIterator.DONE);
}
private void doOtherInvariantTest(BreakIterator tb, String testChars)
{
StringBuffer work = new StringBuffer("a\r\na");
int errorCount = 0;
// a break should never occur between CR and LF
for (int i = 0; i < testChars.length(); i++) {
work.setCharAt(0, testChars.charAt(i));
for (int j = 0; j < testChars.length(); j++) {
work.setCharAt(3, testChars.charAt(j));
tb.setText(work.toString());
for (int k = tb.first(); k != BreakIterator.DONE; k = tb.next())
if (k == 2) {
errln("Break between CR and LF in string U+" + Integer.toHexString(
(int)(work.charAt(0))) + ", U+d U+a U+" + Integer.toHexString(
(int)(work.charAt(3))));
errorCount++;
if (errorCount >= 75)
return;
}
}
}
// a break should never occur before a non-spacing mark, unless it's preceded
// by a line terminator
work.setLength(0);
work.append("aaaa");
for (int i = 0; i < testChars.length(); i++) {
char c = testChars.charAt(i);
if (c == '\n' || c == '\r' || c == '\u2029' || c == '\u2028' || c == '\u0003')
continue;
work.setCharAt(1, c);
for (int j = 0; j < testChars.length(); j++) {
c = testChars.charAt(j);
if (Character.getType(c) != Character.NON_SPACING_MARK && Character.getType(c)
!= Character.ENCLOSING_MARK)
continue;
work.setCharAt(2, c);
tb.setText(work.toString());
for (int k = tb.first(); k != BreakIterator.DONE; k = tb.next())
if (k == 2) {
errln("Break between U+" + Integer.toHexString((int)(work.charAt(1)))
+ " and U+" + Integer.toHexString((int)(work.charAt(2))));
errorCount++;
if (errorCount >= 75)
return;
}
}
}
}
public void debugLogln(String s) {
final String zeros = "0000";
String temp;
StringBuffer out = new StringBuffer();
for (int i = 0; i < s.length(); i++) {
char c = s.charAt(i);
if (c >= ' ' && c < '\u007f')
out.append(c);
else {
out.append("\\u");
temp = Integer.toHexString((int)c);
out.append(zeros.substring(0, 4 - temp.length()));
out.append(temp);
}
}
logln(out.toString());
}
//=========================================================================
// tests
//=========================================================================
/**
* @bug 4097779
*/
public void TestBug4097779() {
List<String> wordSelectionData = new ArrayList<String>(2);
wordSelectionData.add("aa\u0300a");
wordSelectionData.add(" ");
generalIteratorTest(wordBreak, wordSelectionData);
}
/**
* @bug 4098467
*/
public void TestBug4098467Words() {
List<String> wordSelectionData = new ArrayList<String>();
// What follows is a string of Korean characters (I found it in the Yellow Pages
// ad for the Korean Presbyterian Church of San Francisco, and I hope I transcribed
// it correctly), first as precomposed syllables, and then as conjoining jamo.
// Both sequences should be semantically identical and break the same way.
// precomposed syllables...
wordSelectionData.add("\uc0c1\ud56d");
wordSelectionData.add(" ");
wordSelectionData.add("\ud55c\uc778");
wordSelectionData.add(" ");
wordSelectionData.add("\uc5f0\ud569");
wordSelectionData.add(" ");
wordSelectionData.add("\uc7a5\ub85c\uad50\ud68c");
wordSelectionData.add(" ");
// conjoining jamo...
wordSelectionData.add("\u1109\u1161\u11bc\u1112\u1161\u11bc");
wordSelectionData.add(" ");
wordSelectionData.add("\u1112\u1161\u11ab\u110b\u1175\u11ab");
wordSelectionData.add(" ");
wordSelectionData.add("\u110b\u1167\u11ab\u1112\u1161\u11b8");
wordSelectionData.add(" ");
wordSelectionData.add("\u110c\u1161\u11bc\u1105\u1169\u1100\u116d\u1112\u116c");
wordSelectionData.add(" ");
generalIteratorTest(wordBreak, wordSelectionData);
}
/**
* @bug 4111338
*/
public void TestBug4111338() {
List<String> sentenceSelectionData = new ArrayList<String>();
// test for bug #4111338: Don't break sentences at the boundary between CJK
// and other letters
sentenceSelectionData.add("\u5487\u67ff\ue591\u5017\u61b3\u60a1\u9510\u8165:\"JAVA\u821c"
+ "\u8165\u7fc8\u51ce\u306d,\u2494\u56d8\u4ec0\u60b1\u8560\u51ba"
+ "\u611d\u57b6\u2510\u5d46\".\u2029");
sentenceSelectionData.add("\u5487\u67ff\ue591\u5017\u61b3\u60a1\u9510\u8165\u9de8"
+ "\u97e4JAVA\u821c\u8165\u7fc8\u51ce\u306d\ue30b\u2494\u56d8\u4ec0"
+ "\u60b1\u8560\u51ba\u611d\u57b6\u2510\u5d46\u97e5\u7751\u2029");
sentenceSelectionData.add("\u5487\u67ff\ue591\u5017\u61b3\u60a1\u9510\u8165\u9de8\u97e4"
+ "\u6470\u8790JAVA\u821c\u8165\u7fc8\u51ce\u306d\ue30b\u2494\u56d8"
+ "\u4ec0\u60b1\u8560\u51ba\u611d\u57b6\u2510\u5d46\u97e5\u7751\u2029");
sentenceSelectionData.add("He said, \"I can go there.\"\u2029");
generalIteratorTest(sentenceBreak, sentenceSelectionData);
}
/**
* @bug 4143071
*/
public void TestBug4143071() {
List<String> sentenceSelectionData = new ArrayList<String>(3);
// Make sure sentences that end with digits work right
sentenceSelectionData.add("Today is the 27th of May, 1998. ");
sentenceSelectionData.add("Tomorrow will be 28 May 1998. ");
sentenceSelectionData.add("The day after will be the 30th.\u2029");
generalIteratorTest(sentenceBreak, sentenceSelectionData);
}
/**
* @bug 4152416
*/
public void TestBug4152416() {
List<String> sentenceSelectionData = new ArrayList<String>(2);
// Make sure sentences ending with a capital letter are treated correctly
sentenceSelectionData.add("The type of all primitive "
+ "<code>boolean</code> values accessed in the target VM. ");
sentenceSelectionData.add("Calls to xxx will return an "
+ "implementor of this interface.\u2029");
generalIteratorTest(sentenceBreak, sentenceSelectionData);
}
/**
* @bug 4152117
*/
public void TestBug4152117() {
List<String> sentenceSelectionData = new ArrayList<String>(3);
// Make sure sentence breaking is handling punctuation correctly
// [COULD NOT REPRODUCE THIS BUG, BUT TEST IS HERE TO MAKE SURE
// IT DOESN'T CROP UP]
sentenceSelectionData.add("Constructs a randomly generated "
+ "BigInteger, uniformly distributed over the range <tt>0</tt> "
+ "to <tt>(2<sup>numBits</sup> - 1)</tt>, inclusive. ");
sentenceSelectionData.add("The uniformity of the distribution "
+ "assumes that a fair source of random bits is provided in "
+ "<tt>rnd</tt>. ");
sentenceSelectionData.add("Note that this constructor always "
+ "constructs a non-negative BigInteger.\u2029");
generalIteratorTest(sentenceBreak, sentenceSelectionData);
}
public void TestLineBreak() {
List<String> lineSelectionData = new ArrayList<String>();
lineSelectionData.add("Multi-");
lineSelectionData.add("Level ");
lineSelectionData.add("example ");
lineSelectionData.add("of ");
lineSelectionData.add("a ");
lineSelectionData.add("semi-");
lineSelectionData.add("idiotic ");
lineSelectionData.add("non-");
lineSelectionData.add("sensical ");
lineSelectionData.add("(non-");
lineSelectionData.add("important) ");
lineSelectionData.add("sentence. ");
lineSelectionData.add("Hi ");
lineSelectionData.add("Hello ");
lineSelectionData.add("How\n");
lineSelectionData.add("are\r");
lineSelectionData.add("you\u2028");
lineSelectionData.add("fine.\t");
lineSelectionData.add("good. ");
lineSelectionData.add("Now\r");
lineSelectionData.add("is\n");
lineSelectionData.add("the\r\n");
lineSelectionData.add("time\n");
lineSelectionData.add("\r");
lineSelectionData.add("for\r");
lineSelectionData.add("\r");
lineSelectionData.add("all");
generalIteratorTest(lineBreak, lineSelectionData);
}
/**
* @bug 4068133
*/
public void TestBug4068133() {
List<String> lineSelectionData = new ArrayList<String>(9);
lineSelectionData.add("\u96f6");
lineSelectionData.add("\u4e00\u3002");
lineSelectionData.add("\u4e8c\u3001");
lineSelectionData.add("\u4e09\u3002\u3001");
lineSelectionData.add("\u56db\u3001\u3002\u3001");
lineSelectionData.add("\u4e94,");
lineSelectionData.add("\u516d.");
lineSelectionData.add("\u4e03.\u3001,\u3002");
lineSelectionData.add("\u516b");
generalIteratorTest(lineBreak, lineSelectionData);
}
/**
* @bug 4086052
*/
public void TestBug4086052() {
List<String> lineSelectionData = new ArrayList<String>(1);
lineSelectionData.add("foo\u00a0bar ");
// lineSelectionData.addElement("foo\ufeffbar");
generalIteratorTest(lineBreak, lineSelectionData);
}
/**
* @bug 4097920
*/
public void TestBug4097920() {
List<String> lineSelectionData = new ArrayList<String>(3);
lineSelectionData.add("dog,cat,mouse ");
lineSelectionData.add("(one)");
lineSelectionData.add("(two)\n");
generalIteratorTest(lineBreak, lineSelectionData);
}
/**
* @bug 4117554
*/
public void TestBug4117554Lines() {
List<String> lineSelectionData = new ArrayList<String>(3);
// Fullwidth .!? should be treated as postJwrd
lineSelectionData.add("\u4e01\uff0e");
lineSelectionData.add("\u4e02\uff01");
lineSelectionData.add("\u4e03\uff1f");
generalIteratorTest(lineBreak, lineSelectionData);
}
public void TestLettersAndDigits() {
// a character sequence such as "X11" or "30F3" or "native2ascii" should
// be kept together as a single word
List<String> lineSelectionData = new ArrayList<String>(3);
lineSelectionData.add("X11 ");
lineSelectionData.add("30F3 ");
lineSelectionData.add("native2ascii");
generalIteratorTest(lineBreak, lineSelectionData);
}
private static final String graveS = "S\u0300";
private static final String acuteBelowI = "i\u0317";
private static final String acuteE = "e\u0301";
private static final String circumflexA = "a\u0302";
private static final String tildeE = "e\u0303";
public void TestCharacterBreak() {
List<String> characterSelectionData = new ArrayList<String>();
characterSelectionData.add(graveS);
characterSelectionData.add(acuteBelowI);
characterSelectionData.add("m");
characterSelectionData.add("p");
characterSelectionData.add("l");
characterSelectionData.add(acuteE);
characterSelectionData.add(" ");
characterSelectionData.add("s");
characterSelectionData.add(circumflexA);
characterSelectionData.add("m");
characterSelectionData.add("p");
characterSelectionData.add("l");
characterSelectionData.add(tildeE);
characterSelectionData.add(".");
characterSelectionData.add("w");
characterSelectionData.add(circumflexA);
characterSelectionData.add("w");
characterSelectionData.add("a");
characterSelectionData.add("f");
characterSelectionData.add("q");
characterSelectionData.add("\n");
characterSelectionData.add("\r");
characterSelectionData.add("\r\n");
characterSelectionData.add("\n");
generalIteratorTest(characterBreak, characterSelectionData);
}
/**
* @bug 4098467
*/
public void TestBug4098467Characters() {
List<String> characterSelectionData = new ArrayList<String>();
// What follows is a string of Korean characters (I found it in the Yellow Pages
// ad for the Korean Presbyterian Church of San Francisco, and I hope I transcribed
// it correctly), first as precomposed syllables, and then as conjoining jamo.
// Both sequences should be semantically identical and break the same way.
// precomposed syllables...
characterSelectionData.add("\uc0c1");
characterSelectionData.add("\ud56d");
characterSelectionData.add(" ");
characterSelectionData.add("\ud55c");
characterSelectionData.add("\uc778");
characterSelectionData.add(" ");
characterSelectionData.add("\uc5f0");
characterSelectionData.add("\ud569");
characterSelectionData.add(" ");
characterSelectionData.add("\uc7a5");
characterSelectionData.add("\ub85c");
characterSelectionData.add("\uad50");
characterSelectionData.add("\ud68c");
characterSelectionData.add(" ");
// conjoining jamo...
characterSelectionData.add("\u1109\u1161\u11bc");
characterSelectionData.add("\u1112\u1161\u11bc");
characterSelectionData.add(" ");
characterSelectionData.add("\u1112\u1161\u11ab");
characterSelectionData.add("\u110b\u1175\u11ab");
characterSelectionData.add(" ");
characterSelectionData.add("\u110b\u1167\u11ab");
characterSelectionData.add("\u1112\u1161\u11b8");
characterSelectionData.add(" ");
characterSelectionData.add("\u110c\u1161\u11bc");
characterSelectionData.add("\u1105\u1169");
characterSelectionData.add("\u1100\u116d");
characterSelectionData.add("\u1112\u116c");
generalIteratorTest(characterBreak, characterSelectionData);
}
public void TestTitleBreak()
{
List<String> titleData = new ArrayList<String>();
titleData.add(" ");
titleData.add("This ");
titleData.add("is ");
titleData.add("a ");
titleData.add("simple ");
titleData.add("sample ");
titleData.add("sentence. ");
titleData.add("This ");
generalIteratorTest(titleBreak, titleData);
}
/*
* @bug 4153072
*/
public void TestBug4153072() {
BreakIterator iter = BreakIterator.getWordInstance();
String str = "...Hello, World!...";
int begin = 3;
int end = str.length() - 3;
// not used boolean gotException = false;
iter.setText(new StringCharacterIterator(str, begin, end, begin));
for (int index = -1; index < begin + 1; ++index) {
try {
iter.isBoundary(index);
if (index < begin)
errln("Didn't get exception with offset = " + index +
" and begin index = " + begin);
}
catch (IllegalArgumentException e) {
if (index >= begin)
errln("Got exception with offset = " + index +
" and begin index = " + begin);
}
}
}
public void TestBug4146175Lines() {
List<String> lineSelectionData = new ArrayList<String>(2);
// the fullwidth comma should stick to the preceding Japanese character
lineSelectionData.add("\u7d42\uff0c");
lineSelectionData.add("\u308f");
generalIteratorTest(lineBreak, lineSelectionData);
}
private static final String cannedTestChars
= "\u0000\u0001\u0002\u0003\u0004 !\"#$%&()+-01234<=>ABCDE[]^_`abcde{}|\u00a0\u00a2"
+ "\u00a3\u00a4\u00a5\u00a6\u00a7\u00a8\u00a9\u00ab\u00ad\u00ae\u00af\u00b0\u00b2\u00b3"
+ "\u00b4\u00b9\u00bb\u00bc\u00bd\u02b0\u02b1\u02b2\u02b3\u02b4\u0300\u0301\u0302\u0303"
+ "\u0304\u05d0\u05d1\u05d2\u05d3\u05d4\u0903\u093e\u093f\u0940\u0949\u0f3a\u0f3b\u2000"
+ "\u2001\u2002\u200c\u200d\u200e\u200f\u2010\u2011\u2012\u2028\u2029\u202a\u203e\u203f"
+ "\u2040\u20dd\u20de\u20df\u20e0\u2160\u2161\u2162\u2163\u2164";
public void TestSentenceInvariants()
{
BreakIterator e = BreakIterator.getSentenceInstance();
doOtherInvariantTest(e, cannedTestChars + ".,\u3001\u3002\u3041\u3042\u3043\ufeff");
}
public void TestEmptyString()
{
String text = "";
List<String> x = new ArrayList<String>(1);
x.add(text);
generalIteratorTest(lineBreak, x);
}
public void TestGetAvailableLocales()
{
Locale[] locList = BreakIterator.getAvailableLocales();
if (locList.length == 0)
errln("getAvailableLocales() returned an empty list!");
// I have no idea how to test this function...
com.ibm.icu.util.ULocale[] ulocList = BreakIterator.getAvailableULocales();
if (ulocList.length == 0) {
errln("getAvailableULocales() returned an empty list!");
} else {
logln("getAvailableULocales() returned " + ulocList.length + " locales");
}
}
/**
* @bug 4068137
*/
public void TestEndBehavior()
{
String testString = "boo.";
BreakIterator wb = BreakIterator.getWordInstance();
wb.setText(testString);
if (wb.first() != 0)
errln("Didn't get break at beginning of string.");
if (wb.next() != 3)
errln("Didn't get break before period in \"boo.\"");
if (wb.current() != 4 && wb.next() != 4)
errln("Didn't get break at end of string.");
}
// The Following two tests are ported from ICU4C 1.8.1 [Richard/GCL]
/**
* Port From: ICU4C v1.8.1 : textbounds : IntlTestTextBoundary
* Source File: $ICU4CRoot/source/test/intltest/ittxtbd.cpp
**/
/**
* test methods preceding, following and isBoundary
**/
public void TestPreceding() {
String words3 = "aaa bbb ccc";
BreakIterator e = BreakIterator.getWordInstance(Locale.getDefault());
e.setText( words3 );
e.first();
int p1 = e.next();
int p2 = e.next();
int p3 = e.next();
int p4 = e.next();
int f = e.following(p2+1);
int p = e.preceding(p2+1);
if (f!=p3)
errln("IntlTestTextBoundary::TestPreceding: f!=p3");
if (p!=p2)
errln("IntlTestTextBoundary::TestPreceding: p!=p2");
if (p1+1!=p2)
errln("IntlTestTextBoundary::TestPreceding: p1+1!=p2");
if (p3+1!=p4)
errln("IntlTestTextBoundary::TestPreceding: p3+1!=p4");
if (!e.isBoundary(p2) || e.isBoundary(p2+1) || !e.isBoundary(p3))
{
errln("IntlTestTextBoundary::TestPreceding: isBoundary err");
}
}
/**
* Bug 4450804
*/
public void TestLineBreakContractions() {
List<String> expected = new ArrayList<String>(7);
expected.add("These ");
expected.add("are ");
expected.add("'foobles'. ");
expected.add("Don't ");
expected.add("you ");
expected.add("like ");
expected.add("them?");
generalIteratorTest(lineBreak, expected);
}
/**
* Ticket#5615
*/
public void TestT5615() {
com.ibm.icu.util.ULocale[] ulocales = BreakIterator.getAvailableULocales();
int type = 0;
com.ibm.icu.util.ULocale loc = null;
try {
for (int i = 0; i < ulocales.length; i++) {
loc = ulocales[i];
for (type = 0; type < 5 /* 5 = BreakIterator.KIND_COUNT */; ++type) {
BreakIterator brk = BreakIterator.getBreakInstance(loc, type);
if (brk == null) {
errln("ERR: Failed to create an instance type: " + type + " / locale: " + loc);
}
}
}
} catch (Exception e) {
errln("ERR: Failed to create an instance type: " + type + " / locale: " + loc + " / exception: " + e.getMessage());
}
}
}