You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
199 lines
5.5 KiB
199 lines
5.5 KiB
// © 2018 and later: Unicode, Inc. and others.
|
|
// License & terms of use: http://www.unicode.org/copyright.html
|
|
|
|
#include "unicode/utypes.h"
|
|
|
|
#if !UCONFIG_NO_FORMATTING
|
|
|
|
// Allow implicit conversion from char16_t* to UnicodeString for this file:
|
|
// Helpful in toString methods and elsewhere.
|
|
#define UNISTR_FROM_STRING_EXPLICIT
|
|
|
|
#include "numparse_types.h"
|
|
#include "numparse_symbols.h"
|
|
#include "numparse_utils.h"
|
|
#include "string_segment.h"
|
|
|
|
using namespace icu;
|
|
using namespace icu::numparse;
|
|
using namespace icu::numparse::impl;
|
|
|
|
|
|
/**
 * Sets up a matcher from a symbol string and the key of a shared UnicodeSet.
 *
 * The set is looked up via unisets::get(key). If that set already contains
 * symbolString, fString is marked bogus; otherwise a copy of symbolString is
 * kept in fString.
 *
 * @param symbolString The symbol text to match literally.
 * @param key          Key passed to unisets::get() to obtain the set.
 */
SymbolMatcher::SymbolMatcher(const UnicodeString& symbolString, unisets::Key key) {
    fUniSet = unisets::get(key);

    const bool coveredBySet = fUniSet->contains(symbolString);
    if (!coveredBySet) {
        // The set does not contain the symbol, so keep the literal string.
        fString = symbolString;
        return;
    }

    // The set already contains the symbol; no separate string is kept.
    fString.setToBogus();
}
|
|
|
|
/**
 * Accessor for the UnicodeSet pointer stored by the constructor.
 *
 * @return The value of fUniSet (obtained from unisets::get()).
 */
const UnicodeSet* SymbolMatcher::getSet() const {
    return fUniSet;
}
|
|
|
|
/**
 * Tries to consume this matcher's symbol from the front of the segment.
 *
 * Steps, in order:
 *  1. If isDisabled(result) is true, nothing is consumed and false is returned.
 *  2. If fString is non-empty and its common prefix with the segment covers
 *     all of fString, the segment offset is advanced by fString.length(),
 *     accept() is called, and false is returned.
 *  3. Otherwise, if the segment's current code point is not -1 and is in
 *     fUniSet, the offset is advanced by that code point's UTF-16 length,
 *     accept() is called, and false is returned.
 *  4. Otherwise nothing is consumed, and the result is whether the common
 *     prefix length from step 2 (0 if step 2 was skipped) equals
 *     segment.length().
 *
 * NOTE(review): a true return presumably tells the caller that more input
 * could still complete a match -- confirm against the matcher interface.
 *
 * @param segment The input being parsed; its offset is advanced on a match.
 * @param result  Parse state, forwarded to isDisabled() and accept().
 * @return false after a match or when disabled; see step 4 otherwise.
 */
bool SymbolMatcher::match(StringSegment& segment, ParsedNumber& result, UErrorCode&) const {
    // Cheap check first: this matcher might be disabled for the current state.
    if (isDisabled(result)) {
        return false;
    }

    // Try the literal string before the set so trailing chars are consumed greedily.
    int sharedPrefix = 0;
    if (!fString.isEmpty()) {
        sharedPrefix = segment.getCommonPrefixLength(fString);
        const bool wholeStringSeen = (sharedPrefix == fString.length());
        if (wholeStringSeen) {
            segment.adjustOffset(fString.length());
            accept(segment, result);
            return false;
        }
    }

    // Fall back to testing the single leading code point against the set.
    const int leadCodePoint = segment.getCodePoint();
    const bool leadInSet = (leadCodePoint != -1) && fUniSet->contains(leadCodePoint);
    if (!leadInSet) {
        // Nothing consumed; report whether the shared prefix spans the whole segment.
        return sharedPrefix == segment.length();
    }

    segment.adjustOffset(U16_LENGTH(leadCodePoint));
    accept(segment, result);
    return false;
}
|
|
|
|
bool SymbolMatcher::smokeTest(const StringSegment& segment) const {
|
|
return segment.startsWith(*fUniSet) || segment.startsWith(fString);
|
|
}
|
|
|
|
/**
 * Produces a fixed label for this matcher.
 *
 * @return The string "<Symbol>".
 */
UnicodeString SymbolMatcher::toString() const {
    // TODO: Customize output for each symbol
    return UnicodeString(u"<Symbol>");
}
|
|
|
|
|
|
/**
 * Builds an ignorables matcher with an empty symbol string.
 *
 * The set key is unisets::STRICT_IGNORABLES when the
 * PARSE_FLAG_STRICT_IGNORABLES bit is set in parseFlags, and
 * unisets::DEFAULT_IGNORABLES otherwise.
 *
 * @param parseFlags Bit field of parse flags.
 */
IgnorablesMatcher::IgnorablesMatcher(parse_flags_t parseFlags)
        : SymbolMatcher(
                  UnicodeString(),
                  ((parseFlags & PARSE_FLAG_STRICT_IGNORABLES) != 0)
                          ? unisets::STRICT_IGNORABLES
                          : unisets::DEFAULT_IGNORABLES) {
}
|
|
|
|
/**
 * Reports this matcher as flexible.
 *
 * @return Always true.
 */
bool IgnorablesMatcher::isFlexible() const {
    return true;
}
|
|
|
|
/**
 * Produces a fixed label for this matcher.
 *
 * @return The string "<Ignorables>".
 */
UnicodeString IgnorablesMatcher::toString() const {
    return UnicodeString(u"<Ignorables>");
}
|
|
|
|
/**
 * This matcher is never disabled; the parse state is not inspected.
 *
 * @return Always false.
 */
bool IgnorablesMatcher::isDisabled(const ParsedNumber&) const {
    return false;
}
|
|
|
|
/**
 * Match hook for ignorable characters. Neither argument is touched, so the
 * parse result is left unchanged.
 */
void IgnorablesMatcher::accept(StringSegment&, ParsedNumber&) const {
    // Intentionally empty.
}
|
|
|
|
|
|
/**
 * Builds a matcher from the kInfinitySymbol string of the given symbols and
 * the unisets::INFINITY_SIGN set.
 *
 * @param dfs Source of the infinity symbol string.
 */
InfinityMatcher::InfinityMatcher(const DecimalFormatSymbols& dfs)
        : SymbolMatcher(
                  dfs.getConstSymbol(DecimalFormatSymbols::kInfinitySymbol),
                  unisets::INFINITY_SIGN) {
}
|
|
|
|
bool InfinityMatcher::isDisabled(const ParsedNumber& result) const {
|
|
return 0 != (result.flags & FLAG_INFINITY);
|
|
}
|
|
|
|
/**
 * Records a matched infinity symbol: sets FLAG_INFINITY on the result, then
 * calls result.setCharsConsumed(segment).
 *
 * @param segment The segment, passed on to setCharsConsumed().
 * @param result  Parse state to update.
 */
void InfinityMatcher::accept(StringSegment& segment, ParsedNumber& result) const {
    // Flag first, then update the consumed-characters bookkeeping.
    result.flags |= FLAG_INFINITY;
    result.setCharsConsumed(segment);
}
|
|
|
|
|
|
/**
 * Builds a matcher from the kMinusSignSymbol string of the given symbols and
 * the unisets::MINUS_SIGN set.
 *
 * @param dfs           Source of the minus sign symbol string.
 * @param allowTrailing Stored in fAllowTrailing; read by isDisabled().
 */
MinusSignMatcher::MinusSignMatcher(const DecimalFormatSymbols& dfs, bool allowTrailing)
        : SymbolMatcher(
                  dfs.getConstSymbol(DecimalFormatSymbols::kMinusSignSymbol),
                  unisets::MINUS_SIGN),
          fAllowTrailing(allowTrailing) {
}
|
|
|
|
bool MinusSignMatcher::isDisabled(const ParsedNumber& result) const {
|
|
return !fAllowTrailing && result.seenNumber();
|
|
}
|
|
|
|
/**
 * Records a matched minus sign: sets FLAG_NEGATIVE on the result, then calls
 * result.setCharsConsumed(segment).
 *
 * @param segment The segment, passed on to setCharsConsumed().
 * @param result  Parse state to update.
 */
void MinusSignMatcher::accept(StringSegment& segment, ParsedNumber& result) const {
    // Flag first, then update the consumed-characters bookkeeping.
    result.flags |= FLAG_NEGATIVE;
    result.setCharsConsumed(segment);
}
|
|
|
|
|
|
/**
 * Builds a matcher from the kNaNSymbol string of the given symbols, paired
 * with the unisets::EMPTY set key.
 *
 * @param dfs Source of the NaN symbol string.
 */
NanMatcher::NanMatcher(const DecimalFormatSymbols& dfs)
        : SymbolMatcher(
                  dfs.getConstSymbol(DecimalFormatSymbols::kNaNSymbol),
                  unisets::EMPTY) {
}
|
|
|
|
bool NanMatcher::isDisabled(const ParsedNumber& result) const {
|
|
return result.seenNumber();
|
|
}
|
|
|
|
/**
 * Records a matched NaN symbol: sets FLAG_NAN on the result, then calls
 * result.setCharsConsumed(segment).
 *
 * @param segment The segment, passed on to setCharsConsumed().
 * @param result  Parse state to update.
 */
void NanMatcher::accept(StringSegment& segment, ParsedNumber& result) const {
    // Flag first, then update the consumed-characters bookkeeping.
    result.flags |= FLAG_NAN;
    result.setCharsConsumed(segment);
}
|
|
|
|
|
|
/**
 * Builds a matcher for the given padding string, paired with the
 * unisets::EMPTY set key.
 *
 * @param padString The padding text to match.
 */
PaddingMatcher::PaddingMatcher(const UnicodeString& padString)
        : SymbolMatcher(padString, unisets::EMPTY) {
}
|
|
|
|
/**
 * Reports this matcher as flexible.
 *
 * @return Always true.
 */
bool PaddingMatcher::isFlexible() const {
    return true;
}
|
|
|
|
/**
 * This matcher is never disabled; the parse state is not inspected.
 *
 * @return Always false.
 */
bool PaddingMatcher::isDisabled(const ParsedNumber&) const {
    return false;
}
|
|
|
|
/**
 * Match hook for padding. Neither argument is touched, so the parse result
 * is left unchanged.
 */
void PaddingMatcher::accept(StringSegment&, ParsedNumber&) const {
    // Intentionally empty.
}
|
|
|
|
|
|
/**
 * Builds a matcher from the kPercentSymbol string of the given symbols and
 * the unisets::PERCENT_SIGN set.
 *
 * @param dfs Source of the percent symbol string.
 */
PercentMatcher::PercentMatcher(const DecimalFormatSymbols& dfs)
        : SymbolMatcher(
                  dfs.getConstSymbol(DecimalFormatSymbols::kPercentSymbol),
                  unisets::PERCENT_SIGN) {
}
|
|
|
|
bool PercentMatcher::isDisabled(const ParsedNumber& result) const {
|
|
return 0 != (result.flags & FLAG_PERCENT);
|
|
}
|
|
|
|
/**
 * Records a matched percent sign: sets FLAG_PERCENT on the result, then calls
 * result.setCharsConsumed(segment).
 *
 * @param segment The segment, passed on to setCharsConsumed().
 * @param result  Parse state to update.
 */
void PercentMatcher::accept(StringSegment& segment, ParsedNumber& result) const {
    // Flag first, then update the consumed-characters bookkeeping.
    result.flags |= FLAG_PERCENT;
    result.setCharsConsumed(segment);
}
|
|
|
|
|
|
/**
 * Builds a matcher from the kPerMillSymbol string of the given symbols and
 * the unisets::PERMILLE_SIGN set.
 *
 * @param dfs Source of the per-mille symbol string.
 */
PermilleMatcher::PermilleMatcher(const DecimalFormatSymbols& dfs)
        : SymbolMatcher(
                  dfs.getConstSymbol(DecimalFormatSymbols::kPerMillSymbol),
                  unisets::PERMILLE_SIGN) {
}
|
|
|
|
bool PermilleMatcher::isDisabled(const ParsedNumber& result) const {
|
|
return 0 != (result.flags & FLAG_PERMILLE);
|
|
}
|
|
|
|
/**
 * Records a matched per-mille sign: sets FLAG_PERMILLE on the result, then
 * calls result.setCharsConsumed(segment).
 *
 * @param segment The segment, passed on to setCharsConsumed().
 * @param result  Parse state to update.
 */
void PermilleMatcher::accept(StringSegment& segment, ParsedNumber& result) const {
    // Flag first, then update the consumed-characters bookkeeping.
    result.flags |= FLAG_PERMILLE;
    result.setCharsConsumed(segment);
}
|
|
|
|
|
|
/**
 * Builds a matcher from the kPlusSignSymbol string of the given symbols and
 * the unisets::PLUS_SIGN set.
 *
 * @param dfs           Source of the plus sign symbol string.
 * @param allowTrailing Stored in fAllowTrailing; read by isDisabled().
 */
PlusSignMatcher::PlusSignMatcher(const DecimalFormatSymbols& dfs, bool allowTrailing)
        : SymbolMatcher(
                  dfs.getConstSymbol(DecimalFormatSymbols::kPlusSignSymbol),
                  unisets::PLUS_SIGN),
          fAllowTrailing(allowTrailing) {
}
|
|
|
|
bool PlusSignMatcher::isDisabled(const ParsedNumber& result) const {
|
|
return !fAllowTrailing && result.seenNumber();
|
|
}
|
|
|
|
/**
 * Records a matched plus sign. No flag is set; only
 * result.setCharsConsumed(segment) is called.
 *
 * @param segment The segment, passed on to setCharsConsumed().
 * @param result  Parse state to update.
 */
void PlusSignMatcher::accept(StringSegment& segment, ParsedNumber& result) const {
    // A plus sign sets no flag; only the consumed-characters bookkeeping changes.
    result.setCharsConsumed(segment);
}
|
|
|
|
|
|
#endif /* #if !UCONFIG_NO_FORMATTING */
|