You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
265 lines
6.3 KiB
265 lines
6.3 KiB
// © 2016 and later: Unicode, Inc. and others.
|
|
// License & terms of use: http://www.unicode.org/copyright.html
|
|
/********************************************************************
|
|
* COPYRIGHT:
|
|
* Copyright (c) 1997-2014, International Business Machines Corporation and
|
|
* others. All Rights Reserved.
|
|
********************************************************************/
|
|
|
|
/**
|
|
* Collation regression tests.
|
|
* (So we'll have no regrets later)
|
|
*/
|
|
|
|
#ifndef _REGCOLL
|
|
#define _REGCOLL
|
|
|
|
#include "unicode/utypes.h"
|
|
|
|
#if !UCONFIG_NO_COLLATION
|
|
|
|
#include "unicode/coleitr.h"
|
|
#include "tscoll.h"
|
|
|
|
class CollationRegressionTest: public IntlTestCollator
|
|
{
|
|
public:
|
|
|
|
// If this is too small for the test data, just increase it.
|
|
// Just don't make it too large, otherwise the executable will get too big
|
|
enum EToken_Len { MAX_TOKEN_LEN = 32 };
|
|
|
|
CollationRegressionTest();
|
|
virtual ~CollationRegressionTest();
|
|
|
|
void runIndexedTest( int32_t index, UBool exec, const char* &name, char* par = NULL );
|
|
|
|
// @bug 4048446
|
|
//
|
|
// CollationElementIterator.reset() doesn't work
|
|
//
|
|
void Test4048446(/* char* par */);
|
|
|
|
// @bug 4051866
|
|
//
|
|
// Collator -> rules -> Collator round-trip broken for expanding characters
|
|
//
|
|
void Test4051866(/* char* par */);
|
|
|
|
// @bug 4053636
|
|
//
|
|
// Collator thinks "black-bird" == "black"
|
|
//
|
|
void Test4053636(/* char* par */);
|
|
|
|
|
|
// @bug 4054238
|
|
//
|
|
// CollationElementIterator will not work correctly if the associated
|
|
// Collator object's mode is changed
|
|
//
|
|
void Test4054238(/* char* par */);
|
|
|
|
// @bug 4054734
|
|
//
|
|
// Collator.IDENTICAL documented but not implemented
|
|
//
|
|
void Test4054734(/* char* par */);
|
|
|
|
// @bug 4054736
|
|
//
|
|
// Full Decomposition mode not implemented
|
|
//
|
|
void Test4054736(/* char* par */);
|
|
|
|
// @bug 4058613
|
|
//
|
|
// Collator.getInstance() causes an ArrayIndexOutofBoundsException for Korean
|
|
//
|
|
void Test4058613(/* char* par */);
|
|
|
|
// @bug 4059820
|
|
//
|
|
// RuleBasedCollator.getRules does not return the exact pattern as input
|
|
// for expanding character sequences
|
|
//
|
|
void Test4059820(/* char* par */);
|
|
|
|
// @bug 4060154
|
|
//
|
|
// MergeCollation::fixEntry broken for "& H < \u0131, \u0130, i, I"
|
|
//
|
|
void Test4060154(/* char* par */);
|
|
|
|
// @bug 4062418
|
|
//
|
|
// Secondary/Tertiary comparison incorrect in French Secondary
|
|
//
|
|
void Test4062418(/* char* par */);
|
|
|
|
// @bug 4065540
|
|
//
|
|
// Collator.compare() method broken if either string contains spaces
|
|
//
|
|
void Test4065540(/* char* par */);
|
|
|
|
// @bug 4066189
|
|
//
|
|
// Unicode characters need to be recursively decomposed to get the
|
|
// correct result. For example,
|
|
// u1EB1 -> \u0103 + \u0300 -> a + \u0306 + \u0300.
|
|
//
|
|
void Test4066189(/* char* par */);
|
|
|
|
// @bug 4066696
|
|
//
|
|
// French secondary collation checking at the end of compare iteration fails
|
|
//
|
|
void Test4066696(/* char* par */);
|
|
|
|
|
|
// @bug 4076676
|
|
//
|
|
// Bad canonicalization of same-class combining characters
|
|
//
|
|
void Test4076676(/* char* par */);
|
|
|
|
|
|
// @bug 4078588
|
|
//
|
|
// RuleBasedCollator breaks on "< a < bb" rule
|
|
//
|
|
void Test4078588(/* char* par */);
|
|
|
|
// @bug 4079231
|
|
//
|
|
// RuleBasedCollator.equals(null) throws NullPointerException
|
|
//
|
|
void Test4079231(/* char* par */);
|
|
|
|
// @bug 4081866
|
|
//
|
|
// Combining characters in different classes not reordered properly.
|
|
//
|
|
void Test4081866(/* char* par */);
|
|
|
|
// @bug 4087241
|
|
//
|
|
// string comparison errors in Scandinavian collators
|
|
//
|
|
void Test4087241(/* char* par */);
|
|
|
|
// @bug 4087243
|
|
//
|
|
// CollationKey takes ignorable strings into account when it shouldn't
|
|
//
|
|
void Test4087243(/* char* par */);
|
|
|
|
// @bug 4092260
|
|
//
|
|
// Mu/micro conflict
|
|
// Micro symbol and greek lowercase letter Mu should sort identically
|
|
//
|
|
void Test4092260(/* char* par */);
|
|
|
|
// @bug 4095316
|
|
//
|
|
void Test4095316(/* char* par */);
|
|
|
|
// @bug 4101940
|
|
//
|
|
void Test4101940(/* char* par */);
|
|
|
|
// @bug 4103436
|
|
//
|
|
// Collator.compare not handling spaces properly
|
|
//
|
|
void Test4103436(/* char* par */);
|
|
|
|
// @bug 4114076
|
|
//
|
|
// Collation not Unicode conformant with Hangul syllables
|
|
//
|
|
void Test4114076(/* char* par */);
|
|
|
|
|
|
// @bug 4114077
|
|
//
|
|
// Collation with decomposition off doesn't work for Europe
|
|
//
|
|
void Test4114077(/* char* par */);
|
|
|
|
// @bug 4124632
|
|
//
|
|
// Collator.getCollationKey was hanging on certain character sequences
|
|
//
|
|
void Test4124632(/* char* par */);
|
|
|
|
// @bug 4132736
|
|
//
|
|
// sort order of french words with multiple accents has errors
|
|
//
|
|
void Test4132736(/* char* par */);
|
|
|
|
// @bug 4133509
|
|
//
|
|
// The sorting using java.text.CollationKey is not in the exact order
|
|
//
|
|
void Test4133509(/* char* par */);
|
|
|
|
// @bug 4139572
|
|
//
|
|
// getCollationKey throws exception for spanish text
|
|
// Cannot reproduce this bug on 1.2, however it DOES fail on 1.1.6
|
|
//
|
|
void Test4139572(/* char* par */);
|
|
|
|
// @bug 4141640
|
|
//
|
|
// Support for Swedish gone in 1.1.6 (Can't create Swedish collator)
|
|
//
|
|
void Test4141640(/* char* par */);
|
|
|
|
// @bug 4146160
|
|
//
|
|
// RuleBasedCollator doesn't use getCollationElementIterator internally
|
|
//
|
|
void Test4146160(/* char* par */);
|
|
|
|
void Test4179216();
|
|
|
|
// Ticket 7189
|
|
//
|
|
// nextSortKeyPart incorrect for EO_S1 collation
|
|
//
|
|
void TestT7189();
|
|
|
|
// Ticket 8624
|
|
//
|
|
// Tertiary value compression problem with case first option enabled
|
|
//
|
|
void TestCaseFirstCompression();
|
|
|
|
void TestTrailingComment();
|
|
void TestBeforeWithTooStrongAfter();
|
|
|
|
private:
|
|
//------------------------------------------------------------------------
|
|
// Internal utilities
|
|
//
|
|
void compareArray(Collator &c,
|
|
const UChar tests[][CollationRegressionTest::MAX_TOKEN_LEN],
|
|
int32_t testCount);
|
|
|
|
void assertEqual(CollationElementIterator &i1, CollationElementIterator &i2);
|
|
|
|
|
|
RuleBasedCollator *en_us;
|
|
|
|
void caseFirstCompressionSub(Collator *col, UnicodeString opt);
|
|
};
|
|
|
|
#endif /* #if !UCONFIG_NO_COLLATION */
|
|
|
|
#endif
|