1 // © 2018 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 
4 #include "unicode/utypes.h"
5 
6 #if !UCONFIG_NO_FORMATTING
7 
8 // Allow implicit conversion from char16_t* to UnicodeString for this file:
9 // Helpful in toString methods and elsewhere.
10 #define UNISTR_FROM_STRING_EXPLICIT
11 
12 #include "numparse_types.h"
13 #include "numparse_compositions.h"
14 #include "string_segment.h"
15 #include "unicode/uniset.h"
16 
17 using namespace icu;
18 using namespace icu::numparse;
19 using namespace icu::numparse::impl;
20 
21 
match(StringSegment & segment,ParsedNumber & result,UErrorCode & status) const22 bool SeriesMatcher::match(StringSegment& segment, ParsedNumber& result, UErrorCode& status) const {
23     ParsedNumber backup(result);
24 
25     int32_t initialOffset = segment.getOffset();
26     bool maybeMore = true;
27     for (auto* it = begin(); it < end();) {
28         const NumberParseMatcher* matcher = *it;
29         int matcherOffset = segment.getOffset();
30         if (segment.length() != 0) {
31             maybeMore = matcher->match(segment, result, status);
32         } else {
33             // Nothing for this matcher to match; ask for more.
34             maybeMore = true;
35         }
36 
37         bool success = (segment.getOffset() != matcherOffset);
38         bool isFlexible = matcher->isFlexible();
39         if (success && isFlexible) {
40             // Match succeeded, and this is a flexible matcher. Re-run it.
41         } else if (success) {
42             // Match succeeded, and this is NOT a flexible matcher. Proceed to the next matcher.
43             it++;
44             // Small hack: if there is another matcher coming, do not accept trailing weak chars.
45             // Needed for proper handling of currency spacing.
46             if (it < end() && segment.getOffset() != result.charEnd && result.charEnd > matcherOffset) {
47                 segment.setOffset(result.charEnd);
48             }
49         } else if (isFlexible) {
50             // Match failed, and this is a flexible matcher. Try again with the next matcher.
51             it++;
52         } else {
53             // Match failed, and this is NOT a flexible matcher. Exit.
54             segment.setOffset(initialOffset);
55             result = backup;
56             return maybeMore;
57         }
58     }
59 
60     // All matchers in the series succeeded.
61     return maybeMore;
62 }
63 
smokeTest(const StringSegment & segment) const64 bool SeriesMatcher::smokeTest(const StringSegment& segment) const {
65     // NOTE: The range-based for loop calls the virtual begin() and end() methods.
66     // NOTE: We only want the first element. Use the for loop for boundary checking.
67     for (auto& matcher : *this) {
68         // SeriesMatchers are never allowed to start with a Flexible matcher.
69         U_ASSERT(!matcher->isFlexible());
70         return matcher->smokeTest(segment);
71     }
72     return false;
73 }
74 
postProcess(ParsedNumber & result) const75 void SeriesMatcher::postProcess(ParsedNumber& result) const {
76     // NOTE: The range-based for loop calls the virtual begin() and end() methods.
77     for (auto* matcher : *this) {
78         matcher->postProcess(result);
79     }
80 }
81 
82 
ArraySeriesMatcher()83 ArraySeriesMatcher::ArraySeriesMatcher()
84         : fMatchersLen(0) {
85 }
86 
ArraySeriesMatcher(MatcherArray & matchers,int32_t matchersLen)87 ArraySeriesMatcher::ArraySeriesMatcher(MatcherArray& matchers, int32_t matchersLen)
88         : fMatchers(std::move(matchers)), fMatchersLen(matchersLen) {
89 }
90 
length() const91 int32_t ArraySeriesMatcher::length() const {
92     return fMatchersLen;
93 }
94 
begin() const95 const NumberParseMatcher* const* ArraySeriesMatcher::begin() const {
96     return fMatchers.getAlias();
97 }
98 
end() const99 const NumberParseMatcher* const* ArraySeriesMatcher::end() const {
100     return fMatchers.getAlias() + fMatchersLen;
101 }
102 
toString() const103 UnicodeString ArraySeriesMatcher::toString() const {
104     return u"<ArraySeries>";
105 }
106 
107 
108 #endif /* #if !UCONFIG_NO_FORMATTING */
109