123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151 |
- // © 2016 and later: Unicode, Inc. and others.
- // License & terms of use: http://www.unicode.org/copyright.html
- /*
- **********************************************************************
- * Copyright (C) 2001-2012, International Business Machines
- * Corporation and others. All Rights Reserved.
- **********************************************************************
- * Date Name Description
- * 07/26/01 aliu Creation.
- **********************************************************************
- */
- #include "unicode/utypes.h"
- #if !UCONFIG_NO_TRANSLITERATION
- #include "quant.h"
- #include "unicode/unistr.h"
- #include "util.h"
- U_NAMESPACE_BEGIN
- UOBJECT_DEFINE_RTTI_IMPLEMENTATION(Quantifier)
- Quantifier::Quantifier(UnicodeFunctor *adoptedMatcher,
- uint32_t _minCount, uint32_t _maxCount) {
- // assert(adopted != 0);
- // assert(minCount <= maxCount);
- matcher = adoptedMatcher;
- this->minCount = _minCount;
- this->maxCount = _maxCount;
- }
- Quantifier::Quantifier(const Quantifier& o) :
- UnicodeFunctor(o),
- UnicodeMatcher(o),
- matcher(o.matcher->clone()),
- minCount(o.minCount),
- maxCount(o.maxCount)
- {
- }
- Quantifier::~Quantifier() {
- delete matcher;
- }
- /**
- * Implement UnicodeFunctor
- */
- Quantifier* Quantifier::clone() const {
- return new Quantifier(*this);
- }
- /**
- * UnicodeFunctor API. Cast 'this' to a UnicodeMatcher* pointer
- * and return the pointer.
- */
- UnicodeMatcher* Quantifier::toMatcher() const {
- Quantifier *nonconst_this = const_cast<Quantifier *>(this);
- UnicodeMatcher *nonconst_base = static_cast<UnicodeMatcher *>(nonconst_this);
-
- return nonconst_base;
- }
- UMatchDegree Quantifier::matches(const Replaceable& text,
- int32_t& offset,
- int32_t limit,
- UBool incremental) {
- int32_t start = offset;
- uint32_t count = 0;
- while (count < maxCount) {
- int32_t pos = offset;
- UMatchDegree m = matcher->toMatcher()->matches(text, offset, limit, incremental);
- if (m == U_MATCH) {
- ++count;
- if (pos == offset) {
- // If offset has not moved we have a zero-width match.
- // Don't keep matching it infinitely.
- break;
- }
- } else if (incremental && m == U_PARTIAL_MATCH) {
- return U_PARTIAL_MATCH;
- } else {
- break;
- }
- }
- if (incremental && offset == limit) {
- return U_PARTIAL_MATCH;
- }
- if (count >= minCount) {
- return U_MATCH;
- }
- offset = start;
- return U_MISMATCH;
- }
- /**
- * Implement UnicodeMatcher
- */
- UnicodeString& Quantifier::toPattern(UnicodeString& result,
- UBool escapeUnprintable) const {
- result.truncate(0);
- matcher->toMatcher()->toPattern(result, escapeUnprintable);
- if (minCount == 0) {
- if (maxCount == 1) {
- return result.append((char16_t)63); /*?*/
- } else if (maxCount == MAX) {
- return result.append((char16_t)42); /***/
- }
- // else fall through
- } else if (minCount == 1 && maxCount == MAX) {
- return result.append((char16_t)43); /*+*/
- }
- result.append((char16_t)123); /*{*/
- ICU_Utility::appendNumber(result, minCount);
- result.append((char16_t)44); /*,*/
- if (maxCount != MAX) {
- ICU_Utility::appendNumber(result, maxCount);
- }
- result.append((char16_t)125); /*}*/
- return result;
- }
- /**
- * Implement UnicodeMatcher
- */
- UBool Quantifier::matchesIndexValue(uint8_t v) const {
- return (minCount == 0) || matcher->toMatcher()->matchesIndexValue(v);
- }
- /**
- * Implement UnicodeMatcher
- */
- void Quantifier::addMatchSetTo(UnicodeSet& toUnionTo) const {
- if (maxCount > 0) {
- matcher->toMatcher()->addMatchSetTo(toUnionTo);
- }
- }
- /**
- * Implement UnicodeFunctor
- */
- void Quantifier::setData(const TransliterationRuleData* d) {
- matcher->setData(d);
- }
- U_NAMESPACE_END
- #endif /* #if !UCONFIG_NO_TRANSLITERATION */
- //eof
|