123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658 |
- #ifndef __NORMALIZER2_H__
- #define __NORMALIZER2_H__
- #include "unicode/utypes.h"
- #if !UCONFIG_NO_NORMALIZATION
- #include "unicode/uniset.h"
- #include "unicode/unistr.h"
- #include "unicode/unorm2.h"
- U_NAMESPACE_BEGIN
- class U_COMMON_API Normalizer2 : public UObject {
- public:
-
- ~Normalizer2();
-
- static const Normalizer2 *
- getNFCInstance(UErrorCode &errorCode);
-
- static const Normalizer2 *
- getNFDInstance(UErrorCode &errorCode);
-
- static const Normalizer2 *
- getNFKCInstance(UErrorCode &errorCode);
-
- static const Normalizer2 *
- getNFKDInstance(UErrorCode &errorCode);
-
- static const Normalizer2 *
- getNFKCCasefoldInstance(UErrorCode &errorCode);
-
- static const Normalizer2 *
- getInstance(const char *packageName,
- const char *name,
- UNormalization2Mode mode,
- UErrorCode &errorCode);
-
- UnicodeString
- normalize(const UnicodeString &src, UErrorCode &errorCode) const {
- UnicodeString result;
- normalize(src, result, errorCode);
- return result;
- }
-
- virtual UnicodeString &
- normalize(const UnicodeString &src,
- UnicodeString &dest,
- UErrorCode &errorCode) const = 0;
-
- virtual UnicodeString &
- normalizeSecondAndAppend(UnicodeString &first,
- const UnicodeString &second,
- UErrorCode &errorCode) const = 0;
-
- virtual UnicodeString &
- append(UnicodeString &first,
- const UnicodeString &second,
- UErrorCode &errorCode) const = 0;
-
- virtual UBool
- getDecomposition(UChar32 c, UnicodeString &decomposition) const = 0;
-
- virtual UBool
- getRawDecomposition(UChar32 c, UnicodeString &decomposition) const;
-
- virtual UChar32
- composePair(UChar32 a, UChar32 b) const;
-
- virtual uint8_t
- getCombiningClass(UChar32 c) const;
-
- virtual UBool
- isNormalized(const UnicodeString &s, UErrorCode &errorCode) const = 0;
-
- virtual UNormalizationCheckResult
- quickCheck(const UnicodeString &s, UErrorCode &errorCode) const = 0;
-
- virtual int32_t
- spanQuickCheckYes(const UnicodeString &s, UErrorCode &errorCode) const = 0;
-
- virtual UBool hasBoundaryBefore(UChar32 c) const = 0;
-
- virtual UBool hasBoundaryAfter(UChar32 c) const = 0;
-
- virtual UBool isInert(UChar32 c) const = 0;
- };
- class U_COMMON_API FilteredNormalizer2 : public Normalizer2 {
- public:
-
- FilteredNormalizer2(const Normalizer2 &n2, const UnicodeSet &filterSet) :
- norm2(n2), set(filterSet) {}
-
- ~FilteredNormalizer2();
-
- virtual UnicodeString &
- normalize(const UnicodeString &src,
- UnicodeString &dest,
- UErrorCode &errorCode) const;
-
- virtual UnicodeString &
- normalizeSecondAndAppend(UnicodeString &first,
- const UnicodeString &second,
- UErrorCode &errorCode) const;
-
- virtual UnicodeString &
- append(UnicodeString &first,
- const UnicodeString &second,
- UErrorCode &errorCode) const;
-
- virtual UBool
- getDecomposition(UChar32 c, UnicodeString &decomposition) const;
-
- virtual UBool
- getRawDecomposition(UChar32 c, UnicodeString &decomposition) const;
-
- virtual UChar32
- composePair(UChar32 a, UChar32 b) const;
-
- virtual uint8_t
- getCombiningClass(UChar32 c) const;
-
- virtual UBool
- isNormalized(const UnicodeString &s, UErrorCode &errorCode) const;
-
- virtual UNormalizationCheckResult
- quickCheck(const UnicodeString &s, UErrorCode &errorCode) const;
-
- virtual int32_t
- spanQuickCheckYes(const UnicodeString &s, UErrorCode &errorCode) const;
-
- virtual UBool hasBoundaryBefore(UChar32 c) const;
-
- virtual UBool hasBoundaryAfter(UChar32 c) const;
-
- virtual UBool isInert(UChar32 c) const;
- private:
- UnicodeString &
- normalize(const UnicodeString &src,
- UnicodeString &dest,
- USetSpanCondition spanCondition,
- UErrorCode &errorCode) const;
- UnicodeString &
- normalizeSecondAndAppend(UnicodeString &first,
- const UnicodeString &second,
- UBool doNormalize,
- UErrorCode &errorCode) const;
- const Normalizer2 &norm2;
- const UnicodeSet &set;
- };
- U_NAMESPACE_END
- #endif
- #endif
|