// © 2016 and later: Unicode, Inc. and others. // License & terms of use: http://www.unicode.org/copyright.html /* ***************************************************************************** * Copyright (C) 1996-2014, International Business Machines Corporation and others. * All Rights Reserved. ***************************************************************************** * * File sortkey.h * * Created by: Helena Shih * * Modification History: * * Date Name Description * * 6/20/97 helena Java class name change. * 8/18/97 helena Added internal API documentation. * 6/26/98 erm Changed to use byte arrays and memcmp. ***************************************************************************** */ #ifndef SORTKEY_H #define SORTKEY_H #include "unicode/utypes.h" #if U_SHOW_CPLUSPLUS_API /** * \file * \brief C++ API: Keys for comparing strings multiple times. */ #if !UCONFIG_NO_COLLATION #include "unicode/uobject.h" #include "unicode/unistr.h" #include "unicode/coll.h" U_NAMESPACE_BEGIN /* forward declaration */ class RuleBasedCollator; class CollationKeyByteSink; /** * * Collation keys are generated by the Collator class. Use the CollationKey objects * instead of Collator to compare strings multiple times. A CollationKey * preprocesses the comparison information from the Collator object to * make the comparison faster. If you are not going to comparing strings * multiple times, then using the Collator object is generally faster, * since it only processes as much of the string as needed to make a * comparison. * <p> For example (with strength == tertiary) * <p>When comparing "Abernathy" to "Baggins-Smythworthy", Collator * only needs to process a couple of characters, while a comparison * with CollationKeys will process all of the characters. On the other hand, * if you are doing a sort of a number of fields, it is much faster to use * CollationKeys, since you will be comparing strings multiple times. * <p>Typical use of CollationKeys are in databases, where you store a CollationKey * in a hidden field, and use it for sorting or indexing. * * <p>Example of use: * <pre> * \code * UErrorCode success = U_ZERO_ERROR; * Collator* myCollator = Collator::createInstance(success); * CollationKey* keys = new CollationKey [3]; * myCollator->getCollationKey("Tom", keys[0], success ); * myCollator->getCollationKey("Dick", keys[1], success ); * myCollator->getCollationKey("Harry", keys[2], success ); * * // Inside body of sort routine, compare keys this way: * CollationKey tmp; * if(keys[0].compareTo( keys[1] ) > 0 ) { * tmp = keys[0]; keys[0] = keys[1]; keys[1] = tmp; * } * //... * \endcode * </pre> * <p>Because Collator::compare()'s algorithm is complex, it is faster to sort * long lists of words by retrieving collation keys with Collator::getCollationKey(). * You can then cache the collation keys and compare them using CollationKey::compareTo(). * <p> * <strong>Note:</strong> <code>Collator</code>s with different Locale, * CollationStrength and DecompositionMode settings will return different * CollationKeys for the same set of strings. Locales have specific * collation rules, and the way in which secondary and tertiary differences * are taken into account, for example, will result in different CollationKeys * for same strings. * <p> * @see Collator * @see RuleBasedCollator * @version 1.3 12/18/96 * @author Helena Shih * @stable ICU 2.0 */ class U_I18N_API CollationKey : public UObject { public: /** * This creates an empty collation key based on the null string. An empty * collation key contains no sorting information. When comparing two empty * collation keys, the result is Collator::EQUAL. Comparing empty collation key * with non-empty collation key is always Collator::LESS. * @stable ICU 2.0 */ CollationKey(); /** * Creates a collation key based on the collation key values. * @param values the collation key values * @param count number of collation key values, including trailing nulls. * @stable ICU 2.0 */ CollationKey(const uint8_t* values, int32_t count); /** * Copy constructor. * @param other the object to be copied. * @stable ICU 2.0 */ CollationKey(const CollationKey& other); /** * Sort key destructor. * @stable ICU 2.0 */ virtual ~CollationKey(); /** * Assignment operator * @param other the object to be copied. * @stable ICU 2.0 */ const CollationKey& operator=(const CollationKey& other); /** * Compare if two collation keys are the same. * @param source the collation key to compare to. * @return Returns true if two collation keys are equal, false otherwise. * @stable ICU 2.0 */ UBool operator==(const CollationKey& source) const; /** * Compare if two collation keys are not the same. * @param source the collation key to compare to. * @return Returns TRUE if two collation keys are different, FALSE otherwise. * @stable ICU 2.0 */ UBool operator!=(const CollationKey& source) const; /** * Test to see if the key is in an invalid state. The key will be in an * invalid state if it couldn't allocate memory for some operation. * @return Returns TRUE if the key is in an invalid, FALSE otherwise. * @stable ICU 2.0 */ UBool isBogus(void) const; /** * Returns a pointer to the collation key values. The storage is owned * by the collation key and the pointer will become invalid if the key * is deleted. * @param count the output parameter of number of collation key values, * including any trailing nulls. * @return a pointer to the collation key values. * @stable ICU 2.0 */ const uint8_t* getByteArray(int32_t& count) const; #ifdef U_USE_COLLATION_KEY_DEPRECATES /** * Extracts the collation key values into a new array. The caller owns * this storage and should free it. * @param count the output parameter of number of collation key values, * including any trailing nulls. * @obsolete ICU 2.6. Use getByteArray instead since this API will be removed in that release. */ uint8_t* toByteArray(int32_t& count) const; #endif #ifndef U_HIDE_DEPRECATED_API /** * Convenience method which does a string(bit-wise) comparison of the * two collation keys. * @param target target collation key to be compared with * @return Returns Collator::LESS if sourceKey < targetKey, * Collator::GREATER if sourceKey > targetKey and Collator::EQUAL * otherwise. * @deprecated ICU 2.6 use the overload with error code */ Collator::EComparisonResult compareTo(const CollationKey& target) const; #endif /* U_HIDE_DEPRECATED_API */ /** * Convenience method which does a string(bit-wise) comparison of the * two collation keys. * @param target target collation key to be compared with * @param status error code * @return Returns UCOL_LESS if sourceKey < targetKey, * UCOL_GREATER if sourceKey > targetKey and UCOL_EQUAL * otherwise. * @stable ICU 2.6 */ UCollationResult compareTo(const CollationKey& target, UErrorCode &status) const; /** * Creates an integer that is unique to the collation key. NOTE: this * is not the same as String.hashCode. * <p>Example of use: * <pre> * . UErrorCode status = U_ZERO_ERROR; * . Collator *myCollation = Collator::createInstance(Locale::US, status); * . if (U_FAILURE(status)) return; * . CollationKey key1, key2; * . UErrorCode status1 = U_ZERO_ERROR, status2 = U_ZERO_ERROR; * . myCollation->getCollationKey("abc", key1, status1); * . if (U_FAILURE(status1)) { delete myCollation; return; } * . myCollation->getCollationKey("ABC", key2, status2); * . if (U_FAILURE(status2)) { delete myCollation; return; } * . // key1.hashCode() != key2.hashCode() * </pre> * @return the hash value based on the string's collation order. * @see UnicodeString#hashCode * @stable ICU 2.0 */ int32_t hashCode(void) const; /** * ICU "poor man's RTTI", returns a UClassID for the actual class. * @stable ICU 2.2 */ virtual UClassID getDynamicClassID() const; /** * ICU "poor man's RTTI", returns a UClassID for this class. * @stable ICU 2.2 */ static UClassID U_EXPORT2 getStaticClassID(); private: /** * Replaces the current bytes buffer with a new one of newCapacity * and copies length bytes from the old buffer to the new one. * @return the new buffer, or NULL if the allocation failed */ uint8_t *reallocate(int32_t newCapacity, int32_t length); /** * Set a new length for a new sort key in the existing fBytes. */ void setLength(int32_t newLength); uint8_t *getBytes() { return (fFlagAndLength >= 0) ? fUnion.fStackBuffer : fUnion.fFields.fBytes; } const uint8_t *getBytes() const { return (fFlagAndLength >= 0) ? fUnion.fStackBuffer : fUnion.fFields.fBytes; } int32_t getCapacity() const { return (fFlagAndLength >= 0) ? (int32_t)sizeof(fUnion) : fUnion.fFields.fCapacity; } int32_t getLength() const { return fFlagAndLength & 0x7fffffff; } /** * Set the CollationKey to a "bogus" or invalid state * @return this CollationKey */ CollationKey& setToBogus(void); /** * Resets this CollationKey to an empty state * @return this CollationKey */ CollationKey& reset(void); /** * Allow private access to RuleBasedCollator */ friend class RuleBasedCollator; friend class CollationKeyByteSink; // Class fields. sizeof(CollationKey) is intended to be 48 bytes // on a machine with 64-bit pointers. // We use a union to maximize the size of the internal buffer, // similar to UnicodeString but not as tight and complex. // (implicit) *vtable; /** * Sort key length and flag. * Bit 31 is set if the buffer is heap-allocated. * Bits 30..0 contain the sort key length. */ int32_t fFlagAndLength; /** * Unique hash value of this CollationKey. * Special value 2 if the key is bogus. */ mutable int32_t fHashCode; /** * fUnion provides 32 bytes for the internal buffer or for * pointer+capacity. */ union StackBufferOrFields { /** fStackBuffer is used iff fFlagAndLength>=0, else fFields is used */ uint8_t fStackBuffer[32]; struct { uint8_t *fBytes; int32_t fCapacity; } fFields; } fUnion; }; inline UBool CollationKey::operator!=(const CollationKey& other) const { return !(*this == other); } inline UBool CollationKey::isBogus() const { return fHashCode == 2; // kBogusHashCode } inline const uint8_t* CollationKey::getByteArray(int32_t &count) const { count = getLength(); return getBytes(); } U_NAMESPACE_END #endif /* #if !UCONFIG_NO_COLLATION */ #endif /* U_SHOW_CPLUSPLUS_API */ #endif
Name | Type | Size | Permission | Actions |
---|---|---|---|---|
alphaindex.h | File | 26.48 KB | 0644 |
|
appendable.h | File | 8.49 KB | 0644 |
|
basictz.h | File | 9.15 KB | 0644 |
|
brkiter.h | File | 27.8 KB | 0644 |
|
bytestream.h | File | 9.6 KB | 0644 |
|
bytestrie.h | File | 20.77 KB | 0644 |
|
bytestriebuilder.h | File | 7.08 KB | 0644 |
|
calendar.h | File | 105.74 KB | 0644 |
|
caniter.h | File | 7.43 KB | 0644 |
|
casemap.h | File | 25.33 KB | 0644 |
|
char16ptr.h | File | 7.22 KB | 0644 |
|
chariter.h | File | 24.05 KB | 0644 |
|
choicfmt.h | File | 23.91 KB | 0644 |
|
coleitr.h | File | 13.76 KB | 0644 |
|
coll.h | File | 56.23 KB | 0644 |
|
compactdecimalformat.h | File | 6.88 KB | 0644 |
|
curramt.h | File | 3.76 KB | 0644 |
|
currpinf.h | File | 7.3 KB | 0644 |
|
currunit.h | File | 4.05 KB | 0644 |
|
datefmt.h | File | 40.67 KB | 0644 |
|
dbbi.h | File | 1.19 KB | 0644 |
|
dcfmtsym.h | File | 20.13 KB | 0644 |
|
decimfmt.h | File | 87.38 KB | 0644 |
|
docmain.h | File | 6.97 KB | 0644 |
|
dtfmtsym.h | File | 37.7 KB | 0644 |
|
dtintrv.h | File | 3.84 KB | 0644 |
|
dtitvfmt.h | File | 46.63 KB | 0644 |
|
dtitvinf.h | File | 18.51 KB | 0644 |
|
dtptngen.h | File | 25.08 KB | 0644 |
|
dtrule.h | File | 8.68 KB | 0644 |
|
edits.h | File | 20.74 KB | 0644 |
|
enumset.h | File | 2.08 KB | 0644 |
|
errorcode.h | File | 4.84 KB | 0644 |
|
fieldpos.h | File | 8.69 KB | 0644 |
|
filteredbrk.h | File | 5.37 KB | 0644 |
|
fmtable.h | File | 24.42 KB | 0644 |
|
format.h | File | 12.5 KB | 0644 |
|
formattedvalue.h | File | 10.27 KB | 0644 |
|
fpositer.h | File | 3.04 KB | 0644 |
|
gender.h | File | 3.33 KB | 0644 |
|
gregocal.h | File | 31.71 KB | 0644 |
|
icudataver.h | File | 1.03 KB | 0644 |
|
icuplug.h | File | 11.88 KB | 0644 |
|
idna.h | File | 12.7 KB | 0644 |
|
listformatter.h | File | 9.47 KB | 0644 |
|
localebuilder.h | File | 11.27 KB | 0644 |
|
localematcher.h | File | 22.5 KB | 0644 |
|
localpointer.h | File | 19.69 KB | 0644 |
|
locdspnm.h | File | 7.12 KB | 0644 |
|
locid.h | File | 47.4 KB | 0644 |
|
measfmt.h | File | 11.33 KB | 0644 |
|
measunit.h | File | 93.31 KB | 0644 |
|
measure.h | File | 4.32 KB | 0644 |
|
messagepattern.h | File | 33.71 KB | 0644 |
|
msgfmt.h | File | 44.11 KB | 0644 |
|
normalizer2.h | File | 34.03 KB | 0644 |
|
normlzr.h | File | 30.94 KB | 0644 |
|
nounit.h | File | 2.69 KB | 0644 |
|
numberformatter.h | File | 86.31 KB | 0644 |
|
numberrangeformatter.h | File | 30.14 KB | 0644 |
|
numfmt.h | File | 49.81 KB | 0644 |
|
numsys.h | File | 7.19 KB | 0644 |
|
parseerr.h | File | 3.08 KB | 0644 |
|
parsepos.h | File | 5.56 KB | 0644 |
|
platform.h | File | 28.08 KB | 0644 |
|
plurfmt.h | File | 25.2 KB | 0644 |
|
plurrule.h | File | 18.39 KB | 0644 |
|
ptypes.h | File | 3.49 KB | 0644 |
|
putil.h | File | 6.33 KB | 0644 |
|
rbbi.h | File | 26.58 KB | 0644 |
|
rbnf.h | File | 48.73 KB | 0644 |
|
rbtz.h | File | 15.6 KB | 0644 |
|
regex.h | File | 84.36 KB | 0644 |
|
region.h | File | 9.18 KB | 0644 |
|
reldatefmt.h | File | 22.62 KB | 0644 |
|
rep.h | File | 9.37 KB | 0644 |
|
resbund.h | File | 18.07 KB | 0644 |
|
schriter.h | File | 6.32 KB | 0644 |
|
scientificnumberformatter.h | File | 6.4 KB | 0644 |
|
search.h | File | 22.22 KB | 0644 |
|
selfmt.h | File | 14.3 KB | 0644 |
|
simpleformatter.h | File | 12.59 KB | 0644 |
|
simpletz.h | File | 45.44 KB | 0644 |
|
smpdtfmt.h | File | 70.97 KB | 0644 |
|
sortkey.h | File | 11.18 KB | 0644 |
|
std_string.h | File | 1.05 KB | 0644 |
|
strenum.h | File | 9.92 KB | 0644 |
|
stringoptions.h | File | 5.79 KB | 0644 |
|
stringpiece.h | File | 7.38 KB | 0644 |
|
stringtriebuilder.h | File | 15.33 KB | 0644 |
|
stsearch.h | File | 21.3 KB | 0644 |
|
symtable.h | File | 4.27 KB | 0644 |
|
tblcoll.h | File | 36.61 KB | 0644 |
|
timezone.h | File | 41.02 KB | 0644 |
|
tmunit.h | File | 3.38 KB | 0644 |
|
tmutamt.h | File | 4.9 KB | 0644 |
|
tmutfmt.h | File | 7.85 KB | 0644 |
|
translit.h | File | 65.82 KB | 0644 |
|
tzfmt.h | File | 42.89 KB | 0644 |
|
tznames.h | File | 16.85 KB | 0644 |
|
tzrule.h | File | 35.37 KB | 0644 |
|
tztrans.h | File | 6.12 KB | 0644 |
|
ubidi.h | File | 89.56 KB | 0644 |
|
ubiditransform.h | File | 12.65 KB | 0644 |
|
ubrk.h | File | 23.97 KB | 0644 |
|
ucal.h | File | 56.9 KB | 0644 |
|
ucasemap.h | File | 15.18 KB | 0644 |
|
ucat.h | File | 5.36 KB | 0644 |
|
uchar.h | File | 140.56 KB | 0644 |
|
ucharstrie.h | File | 22.58 KB | 0644 |
|
ucharstriebuilder.h | File | 7.21 KB | 0644 |
|
uchriter.h | File | 13.2 KB | 0644 |
|
uclean.h | File | 11.21 KB | 0644 |
|
ucnv.h | File | 83.09 KB | 0644 |
|
ucnv_cb.h | File | 6.59 KB | 0644 |
|
ucnv_err.h | File | 20.99 KB | 0644 |
|
ucnvsel.h | File | 6.14 KB | 0644 |
|
ucol.h | File | 61.46 KB | 0644 |
|
ucoleitr.h | File | 9.46 KB | 0644 |
|
uconfig.h | File | 12.07 KB | 0644 |
|
ucpmap.h | File | 5.53 KB | 0644 |
|
ucptrie.h | File | 22.46 KB | 0644 |
|
ucsdet.h | File | 14.67 KB | 0644 |
|
ucurr.h | File | 16.12 KB | 0644 |
|
udat.h | File | 60.88 KB | 0644 |
|
udata.h | File | 15.56 KB | 0644 |
|
udateintervalformat.h | File | 10.03 KB | 0644 |
|
udatpg.h | File | 26.01 KB | 0644 |
|
udisplaycontext.h | File | 5.89 KB | 0644 |
|
uenum.h | File | 7.78 KB | 0644 |
|
ufieldpositer.h | File | 4.36 KB | 0644 |
|
uformattable.h | File | 10.94 KB | 0644 |
|
uformattedvalue.h | File | 12.14 KB | 0644 |
|
ugender.h | File | 2 KB | 0644 |
|
uidna.h | File | 33.37 KB | 0644 |
|
uiter.h | File | 22.77 KB | 0644 |
|
uldnames.h | File | 10.45 KB | 0644 |
|
ulistformatter.h | File | 8.83 KB | 0644 |
|
uloc.h | File | 52.54 KB | 0644 |
|
ulocdata.h | File | 11.26 KB | 0644 |
|
umachine.h | File | 14.53 KB | 0644 |
|
umisc.h | File | 1.33 KB | 0644 |
|
umsg.h | File | 24.23 KB | 0644 |
|
umutablecptrie.h | File | 8.24 KB | 0644 |
|
unifilt.h | File | 3.96 KB | 0644 |
|
unifunct.h | File | 4.04 KB | 0644 |
|
unimatch.h | File | 6.1 KB | 0644 |
|
unirepl.h | File | 3.38 KB | 0644 |
|
uniset.h | File | 64.9 KB | 0644 |
|
unistr.h | File | 170.43 KB | 0644 |
|
unorm.h | File | 20.52 KB | 0644 |
|
unorm2.h | File | 24.66 KB | 0644 |
|
unum.h | File | 53.62 KB | 0644 |
|
unumberformatter.h | File | 25.36 KB | 0644 |
|
unumsys.h | File | 7.21 KB | 0644 |
|
uobject.h | File | 10.68 KB | 0644 |
|
upluralrules.h | File | 7.88 KB | 0644 |
|
uregex.h | File | 72.05 KB | 0644 |
|
uregion.h | File | 9.84 KB | 0644 |
|
ureldatefmt.h | File | 17.26 KB | 0644 |
|
urename.h | File | 130.97 KB | 0644 |
|
urep.h | File | 5.38 KB | 0644 |
|
ures.h | File | 36.54 KB | 0644 |
|
uscript.h | File | 26.87 KB | 0644 |
|
usearch.h | File | 38.12 KB | 0644 |
|
uset.h | File | 40 KB | 0644 |
|
usetiter.h | File | 9.55 KB | 0644 |
|
ushape.h | File | 18 KB | 0644 |
|
uspoof.h | File | 65.9 KB | 0644 |
|
usprep.h | File | 8.14 KB | 0644 |
|
ustdio.h | File | 38.54 KB | 0644 |
|
ustream.h | File | 1.89 KB | 0644 |
|
ustring.h | File | 72.47 KB | 0644 |
|
ustringtrie.h | File | 3.15 KB | 0644 |
|
utext.h | File | 58.13 KB | 0644 |
|
utf.h | File | 7.86 KB | 0644 |
|
utf16.h | File | 23.32 KB | 0644 |
|
utf32.h | File | 763 B | 0644 |
|
utf8.h | File | 30.96 KB | 0644 |
|
utf_old.h | File | 45.83 KB | 0644 |
|
utmscale.h | File | 13.78 KB | 0644 |
|
utrace.h | File | 15.73 KB | 0644 |
|
utrans.h | File | 25.52 KB | 0644 |
|
utypes.h | File | 30.74 KB | 0644 |
|
uvernum.h | File | 6.67 KB | 0644 |
|
uversion.h | File | 6 KB | 0644 |
|
vtzone.h | File | 20.3 KB | 0644 |
|