You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
109 lines
3.5 KiB
109 lines
3.5 KiB
// © 2018 and later: Unicode, Inc. and others.
|
|
// License & terms of use: http://www.unicode.org/copyright.html
|
|
|
|
#include "unicode/utypes.h"
|
|
|
|
#if !UCONFIG_NO_FORMATTING
|
|
|
|
// Allow implicit conversion from char16_t* to UnicodeString for this file:
|
|
// Helpful in toString methods and elsewhere.
|
|
#define UNISTR_FROM_STRING_EXPLICIT
|
|
|
|
#include "numparse_types.h"
|
|
#include "numparse_compositions.h"
|
|
#include "string_segment.h"
|
|
#include "unicode/uniset.h"
|
|
|
|
using namespace icu;
|
|
using namespace icu::numparse;
|
|
using namespace icu::numparse::impl;
|
|
|
|
|
|
bool SeriesMatcher::match(StringSegment& segment, ParsedNumber& result, UErrorCode& status) const {
|
|
ParsedNumber backup(result);
|
|
|
|
int32_t initialOffset = segment.getOffset();
|
|
bool maybeMore = true;
|
|
for (auto* it = begin(); it < end();) {
|
|
const NumberParseMatcher* matcher = *it;
|
|
int matcherOffset = segment.getOffset();
|
|
if (segment.length() != 0) {
|
|
maybeMore = matcher->match(segment, result, status);
|
|
} else {
|
|
// Nothing for this matcher to match; ask for more.
|
|
maybeMore = true;
|
|
}
|
|
|
|
bool success = (segment.getOffset() != matcherOffset);
|
|
bool isFlexible = matcher->isFlexible();
|
|
if (success && isFlexible) {
|
|
// Match succeeded, and this is a flexible matcher. Re-run it.
|
|
} else if (success) {
|
|
// Match succeeded, and this is NOT a flexible matcher. Proceed to the next matcher.
|
|
it++;
|
|
// Small hack: if there is another matcher coming, do not accept trailing weak chars.
|
|
// Needed for proper handling of currency spacing.
|
|
if (it < end() && segment.getOffset() != result.charEnd && result.charEnd > matcherOffset) {
|
|
segment.setOffset(result.charEnd);
|
|
}
|
|
} else if (isFlexible) {
|
|
// Match failed, and this is a flexible matcher. Try again with the next matcher.
|
|
it++;
|
|
} else {
|
|
// Match failed, and this is NOT a flexible matcher. Exit.
|
|
segment.setOffset(initialOffset);
|
|
result = backup;
|
|
return maybeMore;
|
|
}
|
|
}
|
|
|
|
// All matchers in the series succeeded.
|
|
return maybeMore;
|
|
}
|
|
|
|
bool SeriesMatcher::smokeTest(const StringSegment& segment) const {
|
|
// NOTE: The range-based for loop calls the virtual begin() and end() methods.
|
|
// NOTE: We only want the first element. Use the for loop for boundary checking.
|
|
for (auto& matcher : *this) {
|
|
// SeriesMatchers are never allowed to start with a Flexible matcher.
|
|
U_ASSERT(!matcher->isFlexible());
|
|
return matcher->smokeTest(segment);
|
|
}
|
|
return false;
|
|
}
|
|
|
|
void SeriesMatcher::postProcess(ParsedNumber& result) const {
|
|
// NOTE: The range-based for loop calls the virtual begin() and end() methods.
|
|
for (auto* matcher : *this) {
|
|
matcher->postProcess(result);
|
|
}
|
|
}
|
|
|
|
|
|
ArraySeriesMatcher::ArraySeriesMatcher()
|
|
: fMatchersLen(0) {
|
|
}
|
|
|
|
ArraySeriesMatcher::ArraySeriesMatcher(MatcherArray& matchers, int32_t matchersLen)
|
|
: fMatchers(std::move(matchers)), fMatchersLen(matchersLen) {
|
|
}
|
|
|
|
int32_t ArraySeriesMatcher::length() const {
|
|
return fMatchersLen;
|
|
}
|
|
|
|
const NumberParseMatcher* const* ArraySeriesMatcher::begin() const {
|
|
return fMatchers.getAlias();
|
|
}
|
|
|
|
const NumberParseMatcher* const* ArraySeriesMatcher::end() const {
|
|
return fMatchers.getAlias() + fMatchersLen;
|
|
}
|
|
|
|
UnicodeString ArraySeriesMatcher::toString() const {
|
|
return u"<ArraySeries>";
|
|
}
|
|
|
|
|
|
#endif /* #if !UCONFIG_NO_FORMATTING */
|