You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
1190 lines
39 KiB
1190 lines
39 KiB
// © 2016 and later: Unicode, Inc. and others.
|
|
// License & terms of use: http://www.unicode.org/copyright.html
|
|
/****************************************************************************************
|
|
* COPYRIGHT:
|
|
* Copyright (c) 1997-2014, International Business Machines Corporation and
|
|
* others. All Rights Reserved.
|
|
* Modification History:
|
|
*
|
|
* Date Name Description
|
|
* 05/22/2000 Madhu Added tests for testing new API for utf16 support and more
|
|
****************************************************************************************/
|
|
|
|
#include <string.h>
|
|
#include "utypeinfo.h" // for 'typeid' to work
|
|
|
|
#include "unicode/chariter.h"
|
|
#include "unicode/ustring.h"
|
|
#include "unicode/unistr.h"
|
|
#include "unicode/schriter.h"
|
|
#include "unicode/uchriter.h"
|
|
#include "unicode/uiter.h"
|
|
#include "unicode/putil.h"
|
|
#include "unicode/utf16.h"
|
|
#include "citrtest.h"
|
|
#include "cmemory.h"
|
|
|
|
|
|
class SCharacterIterator : public CharacterIterator {
|
|
public:
|
|
SCharacterIterator(const UnicodeString& textStr){
|
|
text = textStr;
|
|
pos=0;
|
|
textLength = textStr.length();
|
|
begin = 0;
|
|
end=textLength;
|
|
|
|
}
|
|
|
|
virtual ~SCharacterIterator(){}
|
|
|
|
|
|
void setText(const UnicodeString& newText){
|
|
text = newText;
|
|
}
|
|
|
|
virtual void getText(UnicodeString& result) {
|
|
text.extract(0,text.length(),result);
|
|
}
|
|
static UClassID getStaticClassID(void){
|
|
return (UClassID)(&fgClassID);
|
|
}
|
|
virtual UClassID getDynamicClassID(void) const{
|
|
return getStaticClassID();
|
|
}
|
|
|
|
virtual UBool operator==(const ForwardCharacterIterator& /*that*/) const{
|
|
return TRUE;
|
|
}
|
|
|
|
virtual SCharacterIterator* clone(void) const {
|
|
return NULL;
|
|
}
|
|
virtual int32_t hashCode(void) const{
|
|
return DONE;
|
|
}
|
|
virtual UChar nextPostInc(void){ return text.charAt(pos++);}
|
|
virtual UChar32 next32PostInc(void){return text.char32At(pos++);}
|
|
virtual UBool hasNext() { return TRUE;}
|
|
virtual UChar first(){return DONE;}
|
|
virtual UChar32 first32(){return DONE;}
|
|
virtual UChar last(){return DONE;}
|
|
virtual UChar32 last32(){return DONE;}
|
|
virtual UChar setIndex(int32_t /*pos*/){return DONE;}
|
|
virtual UChar32 setIndex32(int32_t /*pos*/){return DONE;}
|
|
virtual UChar current() const{return DONE;}
|
|
virtual UChar32 current32() const{return DONE;}
|
|
virtual UChar next(){return DONE;}
|
|
virtual UChar32 next32(){return DONE;}
|
|
virtual UChar previous(){return DONE;}
|
|
virtual UChar32 previous32(){return DONE;}
|
|
virtual int32_t move(int32_t delta,CharacterIterator::EOrigin origin){
|
|
switch(origin) {
|
|
case kStart:
|
|
pos = begin + delta;
|
|
break;
|
|
case kCurrent:
|
|
pos += delta;
|
|
break;
|
|
case kEnd:
|
|
pos = end + delta;
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
if(pos < begin) {
|
|
pos = begin;
|
|
} else if(pos > end) {
|
|
pos = end;
|
|
}
|
|
|
|
return pos;
|
|
}
|
|
virtual int32_t move32(int32_t delta, CharacterIterator::EOrigin origin){
|
|
switch(origin) {
|
|
case kStart:
|
|
pos = begin;
|
|
if(delta > 0) {
|
|
U16_FWD_N(text, pos, end, delta);
|
|
}
|
|
break;
|
|
case kCurrent:
|
|
if(delta > 0) {
|
|
U16_FWD_N(text, pos, end, delta);
|
|
} else {
|
|
U16_BACK_N(text, begin, pos, -delta);
|
|
}
|
|
break;
|
|
case kEnd:
|
|
pos = end;
|
|
if(delta < 0) {
|
|
U16_BACK_N(text, begin, pos, -delta);
|
|
}
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
return pos;
|
|
}
|
|
virtual UBool hasPrevious() {return TRUE;}
|
|
|
|
SCharacterIterator& operator=(const SCharacterIterator& that){
|
|
text = that.text;
|
|
return *this;
|
|
}
|
|
|
|
|
|
private:
|
|
UnicodeString text;
|
|
static const char fgClassID;
|
|
};
|
|
const char SCharacterIterator::fgClassID=0;
|
|
|
|
CharIterTest::CharIterTest()
|
|
{
|
|
}
|
|
void CharIterTest::runIndexedTest( int32_t index, UBool exec, const char* &name, char* /*par*/ )
|
|
{
|
|
if (exec) logln("TestSuite CharIterTest: ");
|
|
switch (index) {
|
|
case 0: name = "TestConstructionAndEquality"; if (exec) TestConstructionAndEquality(); break;
|
|
case 1: name = "TestConstructionAndEqualityUChariter"; if (exec) TestConstructionAndEqualityUChariter(); break;
|
|
case 2: name = "TestIteration"; if (exec) TestIteration(); break;
|
|
case 3: name = "TestIterationUChar32"; if (exec) TestIterationUChar32(); break;
|
|
case 4: name = "TestUCharIterator"; if (exec) TestUCharIterator(); break;
|
|
case 5: name = "TestCoverage"; if(exec) TestCoverage(); break;
|
|
case 6: name = "TestCharIteratorSubClasses"; if (exec) TestCharIteratorSubClasses(); break;
|
|
default: name = ""; break; //needed to end loop
|
|
}
|
|
}
|
|
|
|
void CharIterTest::TestCoverage(){
|
|
UnicodeString testText("Now is the time for all good men to come to the aid of their country.");
|
|
UnicodeString testText2("\\ud800\\udc01deadbeef");
|
|
testText2 = testText2.unescape();
|
|
SCharacterIterator* test = new SCharacterIterator(testText);
|
|
if(test->firstPostInc()!= 0x004E){
|
|
errln("Failed: firstPostInc() failed");
|
|
}
|
|
if(test->getIndex()!=1){
|
|
errln("Failed: getIndex().");
|
|
}
|
|
if(test->getLength()!=testText.length()){
|
|
errln("Failed: getLength()");
|
|
}
|
|
test->setToStart();
|
|
if(test->getIndex()!=0){
|
|
errln("Failed: setToStart().");
|
|
}
|
|
test->setToEnd();
|
|
if(test->getIndex()!=testText.length()){
|
|
errln("Failed: setToEnd().");
|
|
}
|
|
if(test->startIndex() != 0){
|
|
errln("Failed: startIndex()");
|
|
}
|
|
test->setText(testText2);
|
|
if(test->first32PostInc()!= testText2.char32At(0)){
|
|
errln("Failed: first32PostInc() failed");
|
|
}
|
|
|
|
delete test;
|
|
|
|
}
|
|
void CharIterTest::TestConstructionAndEquality() {
|
|
UnicodeString testText("Now is the time for all good men to come to the aid of their country.");
|
|
UnicodeString testText2("Don't bother using this string.");
|
|
UnicodeString result1, result2, result3;
|
|
|
|
StringCharacterIterator* test1 = new StringCharacterIterator(testText);
|
|
CharacterIterator* test1b= new StringCharacterIterator(testText, -1);
|
|
CharacterIterator* test1c= new StringCharacterIterator(testText, 100);
|
|
CharacterIterator* test1d= new StringCharacterIterator(testText, -2, 100, 5);
|
|
CharacterIterator* test1e= new StringCharacterIterator(testText, 100, 20, 5);
|
|
CharacterIterator* test2 = new StringCharacterIterator(testText, 5);
|
|
CharacterIterator* test3 = new StringCharacterIterator(testText, 2, 20, 5);
|
|
CharacterIterator* test4 = new StringCharacterIterator(testText2);
|
|
CharacterIterator* test5 = test1->clone();
|
|
|
|
if (test1d->startIndex() < 0)
|
|
errln("Construction failed: startIndex is negative");
|
|
if (test1d->endIndex() > testText.length())
|
|
errln("Construction failed: endIndex is greater than the text length");
|
|
if (test1d->getIndex() < test1d->startIndex() || test1d->endIndex() < test1d->getIndex())
|
|
errln("Construction failed: index is invalid");
|
|
|
|
if (*test1 == *test2 || *test1 == *test3 || *test1 == *test4)
|
|
errln("Construction or operator== failed: Unequal objects compared equal");
|
|
if (*test1 != *test5)
|
|
errln("clone() or equals() failed: Two clones tested unequal");
|
|
|
|
if (test1->hashCode() == test2->hashCode() || test1->hashCode() == test3->hashCode()
|
|
|| test1->hashCode() == test4->hashCode())
|
|
errln("hashCode() failed: different objects have same hash code");
|
|
|
|
if (test1->hashCode() != test5->hashCode())
|
|
errln("hashCode() failed: identical objects have different hash codes");
|
|
|
|
if(test1->getLength() != testText.length()){
|
|
errln("getLength of CharacterIterator failed");
|
|
}
|
|
test1->getText(result1);
|
|
test1b->getText(result2);
|
|
test1c->getText(result3);
|
|
if(result1 != result2 || result1 != result3)
|
|
errln("construction failed or getText() failed");
|
|
|
|
|
|
test1->setIndex(5);
|
|
if (*test1 != *test2 || *test1 == *test5)
|
|
errln("setIndex() failed");
|
|
|
|
*((StringCharacterIterator*)test1) = *((StringCharacterIterator*)test3);
|
|
if (*test1 != *test3 || *test1 == *test5)
|
|
errln("operator= failed");
|
|
|
|
delete test2;
|
|
delete test3;
|
|
delete test4;
|
|
delete test5;
|
|
delete test1b;
|
|
delete test1c;
|
|
delete test1d;
|
|
delete test1e;
|
|
|
|
|
|
StringCharacterIterator* testChar1=new StringCharacterIterator(testText);
|
|
StringCharacterIterator* testChar2=new StringCharacterIterator(testText2);
|
|
StringCharacterIterator* testChar3=test1->clone();
|
|
|
|
testChar1->getText(result1);
|
|
testChar2->getText(result2);
|
|
testChar3->getText(result3);
|
|
if(result1 != result3 || result1 == result2)
|
|
errln("getText() failed");
|
|
testChar3->setText(testText2);
|
|
testChar3->getText(result3);
|
|
if(result1 == result3 || result2 != result3)
|
|
errln("setText() or getText() failed");
|
|
testChar3->setText(testText);
|
|
testChar3->getText(result3);
|
|
if(result1 != result3 || result1 == result2)
|
|
errln("setText() or getText() round-trip failed");
|
|
|
|
delete testChar1;
|
|
delete testChar2;
|
|
delete testChar3;
|
|
delete test1;
|
|
|
|
}
|
|
void CharIterTest::TestConstructionAndEqualityUChariter() {
|
|
U_STRING_DECL(testText, "Now is the time for all good men to come to the aid of their country.", 69);
|
|
U_STRING_DECL(testText2, "Don't bother using this string.", 31);
|
|
|
|
U_STRING_INIT(testText, "Now is the time for all good men to come to the aid of their country.", 69);
|
|
U_STRING_INIT(testText2, "Don't bother using this string.", 31);
|
|
|
|
UnicodeString result, result4, result5;
|
|
|
|
UCharCharacterIterator* test1 = new UCharCharacterIterator(testText, u_strlen(testText));
|
|
UCharCharacterIterator* test2 = new UCharCharacterIterator(testText, u_strlen(testText), 5);
|
|
UCharCharacterIterator* test3 = new UCharCharacterIterator(testText, u_strlen(testText), 2, 20, 5);
|
|
UCharCharacterIterator* test4 = new UCharCharacterIterator(testText2, u_strlen(testText2));
|
|
UCharCharacterIterator* test5 = test1->clone();
|
|
UCharCharacterIterator* test6 = new UCharCharacterIterator(*test1);
|
|
|
|
// j785: length=-1 will use u_strlen()
|
|
UCharCharacterIterator* test7a = new UCharCharacterIterator(testText, -1);
|
|
UCharCharacterIterator* test7b = new UCharCharacterIterator(testText, -1);
|
|
UCharCharacterIterator* test7c = new UCharCharacterIterator(testText, -1, 2, 20, 5);
|
|
|
|
// Bad parameters.
|
|
UCharCharacterIterator* test8a = new UCharCharacterIterator(testText, -1, -1, 20, 5);
|
|
UCharCharacterIterator* test8b = new UCharCharacterIterator(testText, -1, 2, 100, 5);
|
|
UCharCharacterIterator* test8c = new UCharCharacterIterator(testText, -1, 2, 20, 100);
|
|
|
|
if (test8a->startIndex() < 0)
|
|
errln("Construction failed: startIndex is negative");
|
|
if (test8b->endIndex() != u_strlen(testText))
|
|
errln("Construction failed: endIndex is different from the text length");
|
|
if (test8c->getIndex() < test8c->startIndex() || test8c->endIndex() < test8c->getIndex())
|
|
errln("Construction failed: index is invalid");
|
|
|
|
if (*test1 == *test2 || *test1 == *test3 || *test1 == *test4 )
|
|
errln("Construction or operator== failed: Unequal objects compared equal");
|
|
if (*test1 != *test5 )
|
|
errln("clone() or equals() failed: Two clones tested unequal");
|
|
|
|
if (*test6 != *test1 )
|
|
errln("copy construction or equals() failed: Two copies tested unequal");
|
|
|
|
if (test1->hashCode() == test2->hashCode() || test1->hashCode() == test3->hashCode()
|
|
|| test1->hashCode() == test4->hashCode())
|
|
errln("hashCode() failed: different objects have same hash code");
|
|
|
|
if (test1->hashCode() != test5->hashCode())
|
|
errln("hashCode() failed: identical objects have different hash codes");
|
|
|
|
test7a->getText(result);
|
|
test7b->getText(result4);
|
|
test7c->getText(result5);
|
|
|
|
if(result != UnicodeString(testText) || result4 != result || result5 != result)
|
|
errln("error in construction");
|
|
|
|
test1->getText(result);
|
|
test4->getText(result4);
|
|
test5->getText(result5);
|
|
if(result != result5 || result == result4)
|
|
errln("getText() failed");
|
|
test5->setText(testText2, u_strlen(testText2));
|
|
test5->getText(result5);
|
|
if(result == result5 || result4 != result5)
|
|
errln("setText() or getText() failed");
|
|
test5->setText(testText, u_strlen(testText));
|
|
test5->getText(result5);
|
|
if(result != result5 || result == result4)
|
|
errln("setText() or getText() round-trip failed");
|
|
|
|
|
|
test1->setIndex(5);
|
|
if (*test1 != *test2 || *test1 == *test5)
|
|
errln("setIndex() failed");
|
|
test8b->setIndex32(5);
|
|
if (test8b->getIndex()!=5)
|
|
errln("setIndex32() failed");
|
|
|
|
*test1 = *test3;
|
|
if (*test1 != *test3 || *test1 == *test5)
|
|
errln("operator= failed");
|
|
|
|
delete test1;
|
|
delete test2;
|
|
delete test3;
|
|
delete test4;
|
|
delete test5;
|
|
delete test6;
|
|
delete test7a;
|
|
delete test7b;
|
|
delete test7c;
|
|
delete test8a;
|
|
delete test8b;
|
|
delete test8c;
|
|
}
|
|
|
|
|
|
void CharIterTest::TestIteration() {
|
|
UnicodeString text("Now is the time for all good men to come to the aid of their country.");
|
|
|
|
UChar c;
|
|
int32_t i;
|
|
{
|
|
StringCharacterIterator iter(text, 5);
|
|
|
|
UnicodeString iterText;
|
|
iter.getText(iterText);
|
|
if (iterText != text)
|
|
errln("iter.getText() failed");
|
|
|
|
if (iter.current() != text[(int32_t)5])
|
|
errln("Iterator didn't start out in the right place.");
|
|
|
|
c = iter.first();
|
|
i = 0;
|
|
|
|
if (iter.startIndex() != 0 || iter.endIndex() != text.length())
|
|
errln("startIndex() or endIndex() failed");
|
|
|
|
logln("Testing forward iteration...");
|
|
do {
|
|
if (c == CharacterIterator::DONE && i != text.length())
|
|
errln("Iterator reached end prematurely");
|
|
else if (c != text[i])
|
|
errln((UnicodeString)"Character mismatch at position " + i +
|
|
", iterator has " + UCharToUnicodeString(c) +
|
|
", string has " + UCharToUnicodeString(text[i]));
|
|
|
|
if (iter.current() != c)
|
|
errln("current() isn't working right");
|
|
if (iter.getIndex() != i)
|
|
errln("getIndex() isn't working right");
|
|
|
|
if (c != CharacterIterator::DONE) {
|
|
c = iter.next();
|
|
i++;
|
|
}
|
|
} while (c != CharacterIterator::DONE);
|
|
c=iter.next();
|
|
if(c!= CharacterIterator::DONE)
|
|
errln("next() didn't return DONE at the end");
|
|
c=iter.setIndex(text.length()+1);
|
|
if(c!= CharacterIterator::DONE)
|
|
errln("setIndex(len+1) didn't return DONE");
|
|
|
|
c = iter.last();
|
|
i = text.length() - 1;
|
|
|
|
logln("Testing backward iteration...");
|
|
do {
|
|
if (c == CharacterIterator::DONE && i >= 0)
|
|
errln("Iterator reached end prematurely");
|
|
else if (c != text[i])
|
|
errln((UnicodeString)"Character mismatch at position " + i +
|
|
", iterator has " + UCharToUnicodeString(c) +
|
|
", string has " + UCharToUnicodeString(text[i]));
|
|
|
|
if (iter.current() != c)
|
|
errln("current() isn't working right");
|
|
if (iter.getIndex() != i)
|
|
errln("getIndex() isn't working right");
|
|
if(iter.setIndex(i) != c)
|
|
errln("setIndex() isn't working right");
|
|
|
|
if (c != CharacterIterator::DONE) {
|
|
c = iter.previous();
|
|
i--;
|
|
}
|
|
} while (c != CharacterIterator::DONE);
|
|
|
|
c=iter.previous();
|
|
if(c!= CharacterIterator::DONE)
|
|
errln("previous didn't return DONE at the beginning");
|
|
|
|
|
|
//testing firstPostInc, nextPostInc, setTostart
|
|
i = 0;
|
|
c=iter.firstPostInc();
|
|
if(c != text[i])
|
|
errln((UnicodeString)"firstPostInc failed. Expected->" +
|
|
UCharToUnicodeString(text[i]) + " Got->" + UCharToUnicodeString(c));
|
|
if(iter.getIndex() != i+1)
|
|
errln((UnicodeString)"getIndex() after firstPostInc() failed");
|
|
|
|
iter.setToStart();
|
|
i=0;
|
|
if (iter.startIndex() != 0)
|
|
errln("setToStart failed");
|
|
|
|
logln("Testing forward iteration...");
|
|
do {
|
|
if (c != CharacterIterator::DONE)
|
|
c = iter.nextPostInc();
|
|
|
|
if(c != text[i])
|
|
errln((UnicodeString)"Character mismatch at position " + i +
|
|
(UnicodeString)", iterator has " + UCharToUnicodeString(c) +
|
|
(UnicodeString)", string has " + UCharToUnicodeString(text[i]));
|
|
|
|
i++;
|
|
if(iter.getIndex() != i)
|
|
errln("getIndex() aftr nextPostInc() isn't working right");
|
|
if(iter.current() != text[i])
|
|
errln("current() after nextPostInc() isn't working right");
|
|
} while (iter.hasNext());
|
|
c=iter.nextPostInc();
|
|
if(c!= CharacterIterator::DONE)
|
|
errln("nextPostInc() didn't return DONE at the beginning");
|
|
}
|
|
|
|
{
|
|
StringCharacterIterator iter(text, 5, 15, 10);
|
|
if (iter.startIndex() != 5 || iter.endIndex() != 15)
|
|
errln("creation of a restricted-range iterator failed");
|
|
|
|
if (iter.getIndex() != 10 || iter.current() != text[(int32_t)10])
|
|
errln("starting the iterator in the middle didn't work");
|
|
|
|
c = iter.first();
|
|
i = 5;
|
|
|
|
logln("Testing forward iteration over a range...");
|
|
do {
|
|
if (c == CharacterIterator::DONE && i != 15)
|
|
errln("Iterator reached end prematurely");
|
|
else if (c != text[i])
|
|
errln((UnicodeString)"Character mismatch at position " + i +
|
|
", iterator has " + UCharToUnicodeString(c) +
|
|
", string has " + UCharToUnicodeString(text[i]));
|
|
|
|
if (iter.current() != c)
|
|
errln("current() isn't working right");
|
|
if (iter.getIndex() != i)
|
|
errln("getIndex() isn't working right");
|
|
if(iter.setIndex(i) != c)
|
|
errln("setIndex() isn't working right");
|
|
|
|
if (c != CharacterIterator::DONE) {
|
|
c = iter.next();
|
|
i++;
|
|
}
|
|
} while (c != CharacterIterator::DONE);
|
|
|
|
c = iter.last();
|
|
i = 14;
|
|
|
|
logln("Testing backward iteration over a range...");
|
|
do {
|
|
if (c == CharacterIterator::DONE && i >= 5)
|
|
errln("Iterator reached end prematurely");
|
|
else if (c != text[i])
|
|
errln((UnicodeString)"Character mismatch at position " + i +
|
|
", iterator has " + UCharToUnicodeString(c) +
|
|
", string has " + UCharToUnicodeString(text[i]));
|
|
|
|
if (iter.current() != c)
|
|
errln("current() isn't working right");
|
|
if (iter.getIndex() != i)
|
|
errln("getIndex() isn't working right");
|
|
|
|
if (c != CharacterIterator::DONE) {
|
|
c = iter.previous();
|
|
i--;
|
|
}
|
|
} while (c != CharacterIterator::DONE);
|
|
|
|
|
|
}
|
|
}
|
|
|
|
//Tests for new API for utf-16 support
|
|
void CharIterTest::TestIterationUChar32() {
|
|
UChar textChars[]={ 0x0061, 0x0062, 0xd841, 0xdc02, 0x20ac, 0xd7ff, 0xd842, 0xdc06, 0xd801, 0xdc00, 0x0061, 0x0000};
|
|
UnicodeString text(textChars);
|
|
UChar32 c;
|
|
int32_t i;
|
|
{
|
|
StringCharacterIterator iter(text, 1);
|
|
|
|
UnicodeString iterText;
|
|
iter.getText(iterText);
|
|
if (iterText != text)
|
|
errln("iter.getText() failed");
|
|
|
|
if (iter.current32() != text[(int32_t)1])
|
|
errln("Iterator didn't start out in the right place.");
|
|
|
|
c=iter.setToStart();
|
|
i=0;
|
|
i=iter.move32(1, CharacterIterator::kStart);
|
|
c=iter.current32();
|
|
if(c != text.char32At(1) || i!=1)
|
|
errln("move32(1, kStart) didn't work correctly expected %X got %X", c, text.char32At(1) );
|
|
|
|
i=iter.move32(2, CharacterIterator::kCurrent);
|
|
c=iter.current32();
|
|
if(c != text.char32At(4) || i!=4)
|
|
errln("move32(2, kCurrent) didn't work correctly expected %X got %X i=%ld", c, text.char32At(4), i);
|
|
|
|
i=iter.move32(-2, CharacterIterator::kCurrent);
|
|
c=iter.current32();
|
|
if(c != text.char32At(1) || i!=1)
|
|
errln("move32(-2, kCurrent) didn't work correctly expected %X got %X i=%d", c, text.char32At(1), i);
|
|
|
|
|
|
i=iter.move32(-2, CharacterIterator::kEnd);
|
|
c=iter.current32();
|
|
if(c != text.char32At((text.length()-3)) || i!=(text.length()-3))
|
|
errln("move32(-2, kEnd) didn't work correctly expected %X got %X i=%d", c, text.char32At((text.length()-3)), i);
|
|
|
|
|
|
c = iter.first32();
|
|
i = 0;
|
|
|
|
if (iter.startIndex() != 0 || iter.endIndex() != text.length())
|
|
errln("startIndex() or endIndex() failed");
|
|
|
|
logln("Testing forward iteration...");
|
|
do {
|
|
/* logln("c=%d i=%d char32At=%d", c, i, text.char32At(i)); */
|
|
if (c == CharacterIterator::DONE && i != text.length())
|
|
errln("Iterator reached end prematurely");
|
|
else if(iter.hasNext() == FALSE && i != text.length())
|
|
errln("Iterator reached end prematurely. Failed at hasNext");
|
|
else if (c != text.char32At(i))
|
|
errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
|
|
|
|
if (iter.current32() != c)
|
|
errln("current32() isn't working right");
|
|
if(iter.setIndex32(i) != c)
|
|
errln("setIndex32() isn't working right");
|
|
if (c != CharacterIterator::DONE) {
|
|
c = iter.next32();
|
|
i += U16_LENGTH(c);
|
|
}
|
|
} while (c != CharacterIterator::DONE);
|
|
if(iter.hasNext() == TRUE)
|
|
errln("hasNext() returned true at the end of the string");
|
|
|
|
|
|
|
|
c=iter.setToEnd();
|
|
if(iter.getIndex() != text.length() || iter.hasNext() != FALSE)
|
|
errln("setToEnd failed");
|
|
|
|
c=iter.next32();
|
|
if(c!= CharacterIterator::DONE)
|
|
errln("next32 didn't return DONE at the end");
|
|
c=iter.setIndex32(text.length()+1);
|
|
if(c!= CharacterIterator::DONE)
|
|
errln("setIndex32(len+1) didn't return DONE");
|
|
|
|
|
|
c = iter.last32();
|
|
i = text.length()-1;
|
|
logln("Testing backward iteration...");
|
|
do {
|
|
if (c == CharacterIterator::DONE && i >= 0)
|
|
errln((UnicodeString)"Iterator reached start prematurely for i=" + i);
|
|
else if(iter.hasPrevious() == FALSE && i>0)
|
|
errln((UnicodeString)"Iterator reached start prematurely for i=" + i);
|
|
else if (c != text.char32At(i))
|
|
errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
|
|
|
|
if (iter.current32() != c)
|
|
errln("current32() isn't working right");
|
|
if(iter.setIndex32(i) != c)
|
|
errln("setIndex32() isn't working right");
|
|
if (iter.getIndex() != i)
|
|
errln("getIndex() isn't working right");
|
|
if (c != CharacterIterator::DONE) {
|
|
c = iter.previous32();
|
|
i -= U16_LENGTH(c);
|
|
}
|
|
} while (c != CharacterIterator::DONE);
|
|
if(iter.hasPrevious() == TRUE)
|
|
errln("hasPrevious returned true after reaching the start");
|
|
|
|
c=iter.previous32();
|
|
if(c!= CharacterIterator::DONE)
|
|
errln("previous32 didn't return DONE at the beginning");
|
|
|
|
|
|
|
|
|
|
//testing first32PostInc, next32PostInc, setTostart
|
|
i = 0;
|
|
c=iter.first32PostInc();
|
|
if(c != text.char32At(i))
|
|
errln("first32PostInc failed. Expected->%X Got->%X", text.char32At(i), c);
|
|
if(iter.getIndex() != U16_LENGTH(c) + i)
|
|
errln((UnicodeString)"getIndex() after first32PostInc() failed");
|
|
|
|
iter.setToStart();
|
|
i=0;
|
|
if (iter.startIndex() != 0)
|
|
errln("setToStart failed");
|
|
|
|
logln("Testing forward iteration...");
|
|
do {
|
|
if (c != CharacterIterator::DONE)
|
|
c = iter.next32PostInc();
|
|
|
|
if(c != text.char32At(i))
|
|
errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
|
|
|
|
i += U16_LENGTH(c);
|
|
if(iter.getIndex() != i)
|
|
errln("getIndex() aftr next32PostInc() isn't working right");
|
|
if(iter.current32() != text.char32At(i))
|
|
errln("current() after next32PostInc() isn't working right");
|
|
} while (iter.hasNext());
|
|
c=iter.next32PostInc();
|
|
if(c!= CharacterIterator::DONE)
|
|
errln("next32PostInc() didn't return DONE at the beginning");
|
|
|
|
|
|
}
|
|
|
|
{
|
|
StringCharacterIterator iter(text, 1, 11, 10);
|
|
if (iter.startIndex() != 1 || iter.endIndex() != 11)
|
|
errln("creation of a restricted-range iterator failed");
|
|
|
|
if (iter.getIndex() != 10 || iter.current32() != text.char32At(10))
|
|
errln("starting the iterator in the middle didn't work");
|
|
|
|
c = iter.first32();
|
|
|
|
i = 1;
|
|
|
|
logln("Testing forward iteration over a range...");
|
|
do {
|
|
if (c == CharacterIterator::DONE && i != 11)
|
|
errln("Iterator reached end prematurely");
|
|
else if(iter.hasNext() == FALSE)
|
|
errln("Iterator reached end prematurely");
|
|
else if (c != text.char32At(i))
|
|
errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
|
|
|
|
if (iter.current32() != c)
|
|
errln("current32() isn't working right");
|
|
if(iter.setIndex32(i) != c)
|
|
errln("setIndex32() isn't working right");
|
|
|
|
if (c != CharacterIterator::DONE) {
|
|
c = iter.next32();
|
|
i += U16_LENGTH(c);
|
|
}
|
|
} while (c != CharacterIterator::DONE);
|
|
c=iter.next32();
|
|
if(c != CharacterIterator::DONE)
|
|
errln("error in next32()");
|
|
|
|
|
|
|
|
c=iter.last32();
|
|
i = 10;
|
|
logln("Testing backward iteration over a range...");
|
|
do {
|
|
if (c == CharacterIterator::DONE && i >= 5)
|
|
errln("Iterator reached start prematurely");
|
|
else if(iter.hasPrevious() == FALSE && i > 5)
|
|
errln("Iterator reached start prematurely");
|
|
else if (c != text.char32At(i))
|
|
errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
|
|
if (iter.current32() != c)
|
|
errln("current32() isn't working right");
|
|
if (iter.getIndex() != i)
|
|
errln("getIndex() isn't working right");
|
|
if(iter.setIndex32(i) != c)
|
|
errln("setIndex32() isn't working right");
|
|
|
|
if (c != CharacterIterator::DONE) {
|
|
c = iter.previous32();
|
|
i -= U16_LENGTH(c);
|
|
}
|
|
|
|
} while (c != CharacterIterator::DONE);
|
|
c=iter.previous32();
|
|
if(c!= CharacterIterator::DONE)
|
|
errln("error on previous32");
|
|
|
|
|
|
}
|
|
}
|
|
|
|
void CharIterTest::TestUCharIterator(UCharIterator *iter, CharacterIterator &ci,
|
|
const char *moves, const char *which) {
|
|
int32_t m;
|
|
UChar32 c, c2;
|
|
UBool h, h2;
|
|
|
|
for(m=0;; ++m) {
|
|
// move both iter and s[index]
|
|
switch(moves[m]) {
|
|
case '0':
|
|
h=iter->hasNext(iter);
|
|
h2=ci.hasNext();
|
|
c=iter->current(iter);
|
|
c2=ci.current();
|
|
break;
|
|
case '|':
|
|
h=iter->hasNext(iter);
|
|
h2=ci.hasNext();
|
|
c=uiter_current32(iter);
|
|
c2=ci.current32();
|
|
break;
|
|
|
|
case '+':
|
|
h=iter->hasNext(iter);
|
|
h2=ci.hasNext();
|
|
c=iter->next(iter);
|
|
c2=ci.nextPostInc();
|
|
break;
|
|
case '>':
|
|
h=iter->hasNext(iter);
|
|
h2=ci.hasNext();
|
|
c=uiter_next32(iter);
|
|
c2=ci.next32PostInc();
|
|
break;
|
|
|
|
case '-':
|
|
h=iter->hasPrevious(iter);
|
|
h2=ci.hasPrevious();
|
|
c=iter->previous(iter);
|
|
c2=ci.previous();
|
|
break;
|
|
case '<':
|
|
h=iter->hasPrevious(iter);
|
|
h2=ci.hasPrevious();
|
|
c=uiter_previous32(iter);
|
|
c2=ci.previous32();
|
|
break;
|
|
|
|
case '2':
|
|
h=h2=FALSE;
|
|
c=(UChar32)iter->move(iter, 2, UITER_CURRENT);
|
|
c2=(UChar32)ci.move(2, CharacterIterator::kCurrent);
|
|
break;
|
|
|
|
case '8':
|
|
h=h2=FALSE;
|
|
c=(UChar32)iter->move(iter, -2, UITER_CURRENT);
|
|
c2=(UChar32)ci.move(-2, CharacterIterator::kCurrent);
|
|
break;
|
|
|
|
case 0:
|
|
return;
|
|
default:
|
|
errln("error: unexpected move character '%c' in \"%s\"", moves[m], moves);
|
|
return;
|
|
}
|
|
|
|
// compare results
|
|
if(c2==0xffff) {
|
|
c2=(UChar32)-1;
|
|
}
|
|
if(c!=c2 || h!=h2 || ci.getIndex()!=iter->getIndex(iter, UITER_CURRENT)) {
|
|
errln("error: UCharIterator(%s) misbehaving at \"%s\"[%d]='%c'", which, moves, m, moves[m]);
|
|
}
|
|
}
|
|
}
|
|
|
|
void CharIterTest::TestUCharIterator() {
|
|
// test string of length 8
|
|
UnicodeString s=UnicodeString("a \\U00010001b\\U0010fffdz", "").unescape();
|
|
const char *const moves=
|
|
"0+++++++++" // 10 moves per line
|
|
"----0-----"
|
|
">>|>>>>>>>"
|
|
"<<|<<<<<<<"
|
|
"22+>8>-8+2";
|
|
|
|
StringCharacterIterator sci(s), compareCI(s);
|
|
|
|
UCharIterator sIter, cIter, rIter;
|
|
|
|
uiter_setString(&sIter, s.getBuffer(), s.length());
|
|
uiter_setCharacterIterator(&cIter, &sci);
|
|
uiter_setReplaceable(&rIter, &s);
|
|
|
|
TestUCharIterator(&sIter, compareCI, moves, "uiter_setString");
|
|
compareCI.setIndex(0);
|
|
TestUCharIterator(&cIter, compareCI, moves, "uiter_setCharacterIterator");
|
|
compareCI.setIndex(0);
|
|
TestUCharIterator(&rIter, compareCI, moves, "uiter_setReplaceable");
|
|
|
|
// test move & getIndex some more
|
|
sIter.start=2;
|
|
sIter.index=3;
|
|
sIter.limit=5;
|
|
if( sIter.getIndex(&sIter, UITER_ZERO)!=0 ||
|
|
sIter.getIndex(&sIter, UITER_START)!=2 ||
|
|
sIter.getIndex(&sIter, UITER_CURRENT)!=3 ||
|
|
sIter.getIndex(&sIter, UITER_LIMIT)!=5 ||
|
|
sIter.getIndex(&sIter, UITER_LENGTH)!=s.length()
|
|
) {
|
|
errln("error: UCharIterator(string).getIndex returns wrong index");
|
|
}
|
|
|
|
if( sIter.move(&sIter, 4, UITER_ZERO)!=4 ||
|
|
sIter.move(&sIter, 1, UITER_START)!=3 ||
|
|
sIter.move(&sIter, 3, UITER_CURRENT)!=5 ||
|
|
sIter.move(&sIter, -1, UITER_LIMIT)!=4 ||
|
|
sIter.move(&sIter, -5, UITER_LENGTH)!=3 ||
|
|
sIter.move(&sIter, 0, UITER_CURRENT)!=sIter.getIndex(&sIter, UITER_CURRENT) ||
|
|
sIter.getIndex(&sIter, UITER_CURRENT)!=3
|
|
) {
|
|
errln("error: UCharIterator(string).move sets/returns wrong index");
|
|
}
|
|
|
|
sci=StringCharacterIterator(s, 2, 5, 3);
|
|
uiter_setCharacterIterator(&cIter, &sci);
|
|
if( cIter.getIndex(&cIter, UITER_ZERO)!=0 ||
|
|
cIter.getIndex(&cIter, UITER_START)!=2 ||
|
|
cIter.getIndex(&cIter, UITER_CURRENT)!=3 ||
|
|
cIter.getIndex(&cIter, UITER_LIMIT)!=5 ||
|
|
cIter.getIndex(&cIter, UITER_LENGTH)!=s.length()
|
|
) {
|
|
errln("error: UCharIterator(character iterator).getIndex returns wrong index");
|
|
}
|
|
|
|
if( cIter.move(&cIter, 4, UITER_ZERO)!=4 ||
|
|
cIter.move(&cIter, 1, UITER_START)!=3 ||
|
|
cIter.move(&cIter, 3, UITER_CURRENT)!=5 ||
|
|
cIter.move(&cIter, -1, UITER_LIMIT)!=4 ||
|
|
cIter.move(&cIter, -5, UITER_LENGTH)!=3 ||
|
|
cIter.move(&cIter, 0, UITER_CURRENT)!=cIter.getIndex(&cIter, UITER_CURRENT) ||
|
|
cIter.getIndex(&cIter, UITER_CURRENT)!=3
|
|
) {
|
|
errln("error: UCharIterator(character iterator).move sets/returns wrong index");
|
|
}
|
|
|
|
|
|
if(cIter.getIndex(&cIter, (enum UCharIteratorOrigin)-1) != -1)
|
|
{
|
|
errln("error: UCharIterator(char iter).getIndex did not return error value");
|
|
}
|
|
|
|
if(cIter.move(&cIter, 0, (enum UCharIteratorOrigin)-1) != -1)
|
|
{
|
|
errln("error: UCharIterator(char iter).move did not return error value");
|
|
}
|
|
|
|
|
|
if(rIter.getIndex(&rIter, (enum UCharIteratorOrigin)-1) != -1)
|
|
{
|
|
errln("error: UCharIterator(repl iter).getIndex did not return error value");
|
|
}
|
|
|
|
if(rIter.move(&rIter, 0, (enum UCharIteratorOrigin)-1) != -1)
|
|
{
|
|
errln("error: UCharIterator(repl iter).move did not return error value");
|
|
}
|
|
|
|
|
|
if(sIter.getIndex(&sIter, (enum UCharIteratorOrigin)-1) != -1)
|
|
{
|
|
errln("error: UCharIterator(string iter).getIndex did not return error value");
|
|
}
|
|
|
|
if(sIter.move(&sIter, 0, (enum UCharIteratorOrigin)-1) != -1)
|
|
{
|
|
errln("error: UCharIterator(string iter).move did not return error value");
|
|
}
|
|
|
|
/* Testing function coverage on bad input */
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
uiter_setString(&sIter, NULL, 1);
|
|
uiter_setState(&sIter, 1, &status);
|
|
if (status != U_UNSUPPORTED_ERROR) {
|
|
errln("error: uiter_setState returned %s instead of U_UNSUPPORTED_ERROR", u_errorName(status));
|
|
}
|
|
status = U_ZERO_ERROR;
|
|
uiter_setState(NULL, 1, &status);
|
|
if (status != U_ILLEGAL_ARGUMENT_ERROR) {
|
|
errln("error: uiter_setState returned %s instead of U_ILLEGAL_ARGUMENT_ERROR", u_errorName(status));
|
|
}
|
|
if (uiter_getState(&sIter) != UITER_NO_STATE) {
|
|
errln("error: uiter_getState did not return UITER_NO_STATE on bad input");
|
|
}
|
|
}
|
|
|
|
// subclass test, and completing API coverage -------------------------------
|
|
|
|
class SubCharIter : public CharacterIterator {
|
|
public:
|
|
// public default constructor, to get coverage of CharacterIterator()
|
|
SubCharIter() : CharacterIterator() {
|
|
textLength=end=UPRV_LENGTHOF(s);
|
|
s[0]=0x61; // 'a'
|
|
s[1]=0xd900; // U+50400
|
|
s[2]=0xdd00;
|
|
s[3]=0x2029; // PS
|
|
}
|
|
|
|
// useful stuff, mostly dummy but testing coverage and subclassability
|
|
virtual UChar nextPostInc() {
|
|
if(pos<UPRV_LENGTHOF(s)) {
|
|
return s[pos++];
|
|
} else {
|
|
return DONE;
|
|
}
|
|
}
|
|
|
|
virtual UChar32 next32PostInc() {
|
|
if(pos<UPRV_LENGTHOF(s)) {
|
|
UChar32 c;
|
|
U16_NEXT(s, pos, UPRV_LENGTHOF(s), c);
|
|
return c;
|
|
} else {
|
|
return DONE;
|
|
}
|
|
}
|
|
|
|
virtual UBool hasNext() {
|
|
return pos<UPRV_LENGTHOF(s);
|
|
}
|
|
|
|
virtual UChar first() {
|
|
pos=0;
|
|
return s[0];
|
|
}
|
|
|
|
virtual UChar32 first32() {
|
|
UChar32 c;
|
|
pos=0;
|
|
U16_NEXT(s, pos, UPRV_LENGTHOF(s), c);
|
|
pos=0;
|
|
return c;
|
|
}
|
|
|
|
virtual UChar setIndex(int32_t position) {
|
|
if(0<=position && position<=UPRV_LENGTHOF(s)) {
|
|
pos=position;
|
|
if(pos<UPRV_LENGTHOF(s)) {
|
|
return s[pos];
|
|
}
|
|
}
|
|
return DONE;
|
|
}
|
|
|
|
virtual UChar32 setIndex32(int32_t position) {
|
|
if(0<=position && position<=UPRV_LENGTHOF(s)) {
|
|
pos=position;
|
|
if(pos<UPRV_LENGTHOF(s)) {
|
|
UChar32 c;
|
|
U16_GET(s, 0, pos, UPRV_LENGTHOF(s), c);
|
|
return c;
|
|
}
|
|
}
|
|
return DONE;
|
|
}
|
|
|
|
virtual UChar current() const {
|
|
if(pos<UPRV_LENGTHOF(s)) {
|
|
return s[pos];
|
|
} else {
|
|
return DONE;
|
|
}
|
|
}
|
|
|
|
virtual UChar32 current32() const {
|
|
if(pos<UPRV_LENGTHOF(s)) {
|
|
UChar32 c;
|
|
U16_GET(s, 0, pos, UPRV_LENGTHOF(s), c);
|
|
return c;
|
|
} else {
|
|
return DONE;
|
|
}
|
|
}
|
|
|
|
virtual UChar next() {
|
|
if(pos<UPRV_LENGTHOF(s) && ++pos<UPRV_LENGTHOF(s)) {
|
|
return s[pos];
|
|
} else {
|
|
return DONE;
|
|
}
|
|
}
|
|
|
|
virtual UChar32 next32() {
|
|
if(pos<UPRV_LENGTHOF(s)) {
|
|
U16_FWD_1(s, pos, UPRV_LENGTHOF(s));
|
|
}
|
|
if(pos<UPRV_LENGTHOF(s)) {
|
|
UChar32 c;
|
|
int32_t i=pos;
|
|
U16_NEXT(s, i, UPRV_LENGTHOF(s), c);
|
|
return c;
|
|
} else {
|
|
return DONE;
|
|
}
|
|
}
|
|
|
|
virtual UBool hasPrevious() {
|
|
return pos>0;
|
|
}
|
|
|
|
virtual void getText(UnicodeString &result) {
|
|
result.setTo(s, UPRV_LENGTHOF(s));
|
|
}
|
|
|
|
// dummy implementations of other pure virtual base class functions
|
|
virtual UBool operator==(const ForwardCharacterIterator &that) const {
|
|
return
|
|
this==&that ||
|
|
(typeid(*this)==typeid(that) && pos==((SubCharIter &)that).pos);
|
|
}
|
|
|
|
virtual int32_t hashCode() const {
|
|
return 2;
|
|
}
|
|
|
|
virtual CharacterIterator *clone() const {
|
|
return NULL;
|
|
}
|
|
|
|
virtual UChar last() {
|
|
return 0;
|
|
}
|
|
|
|
virtual UChar32 last32() {
|
|
return 0;
|
|
}
|
|
|
|
virtual UChar previous() {
|
|
return 0;
|
|
}
|
|
|
|
virtual UChar32 previous32() {
|
|
return 0;
|
|
}
|
|
|
|
virtual int32_t move(int32_t /*delta*/, EOrigin /*origin*/) {
|
|
return 0;
|
|
}
|
|
|
|
virtual int32_t move32(int32_t /*delta*/, EOrigin /*origin*/) {
|
|
return 0;
|
|
}
|
|
|
|
// RTTI
|
|
static UClassID getStaticClassID() {
|
|
return (UClassID)(&fgClassID);
|
|
}
|
|
|
|
virtual UClassID getDynamicClassID() const {
|
|
return getStaticClassID();
|
|
}
|
|
|
|
private:
|
|
// dummy string data
|
|
UChar s[4];
|
|
|
|
static const char fgClassID;
|
|
};
|
|
|
|
const char SubCharIter::fgClassID = 0;
|
|
|
|
class SubStringCharIter : public StringCharacterIterator {
|
|
public:
|
|
SubStringCharIter() {
|
|
setText(UNICODE_STRING("abc", 3));
|
|
}
|
|
};
|
|
|
|
class SubUCharCharIter : public UCharCharacterIterator {
|
|
public:
|
|
SubUCharCharIter() {
|
|
setText(u, 3);
|
|
}
|
|
|
|
private:
|
|
static const UChar u[3];
|
|
};
|
|
|
|
const UChar SubUCharCharIter::u[3]={ 0x61, 0x62, 0x63 };
|
|
|
|
void CharIterTest::TestCharIteratorSubClasses() {
|
|
SubCharIter *p;
|
|
|
|
// coverage - call functions that are not otherwise tested
|
|
// first[32]PostInc() are default implementations that are overridden
|
|
// in ICU's own CharacterIterator subclasses
|
|
p=new SubCharIter;
|
|
if(p->firstPostInc()!=0x61) {
|
|
errln("SubCharIter.firstPosInc() failed\n");
|
|
}
|
|
delete p;
|
|
|
|
p=new SubCharIter[2];
|
|
if(p[1].first32PostInc()!=0x61) {
|
|
errln("SubCharIter.first32PosInc() failed\n");
|
|
}
|
|
delete [] p;
|
|
|
|
// coverage: StringCharacterIterator default constructor
|
|
SubStringCharIter sci;
|
|
if(sci.firstPostInc()!=0x61) {
|
|
errln("SubStringCharIter.firstPostInc() failed\n");
|
|
}
|
|
|
|
// coverage: UCharCharacterIterator default constructor
|
|
SubUCharCharIter uci;
|
|
if(uci.firstPostInc()!=0x61) {
|
|
errln("SubUCharCharIter.firstPostInc() failed\n");
|
|
}
|
|
}
|