404

[ Avaa Bypassed ]




Upload:

Command:

elspacio@18.119.164.231: ~ $
// © 2016 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
/*
 *******************************************************************************
 * Copyright (C) 1996-2014, International Business Machines Corporation and
 * others. All Rights Reserved.
 *******************************************************************************
 */

#ifndef CANITER_H
#define CANITER_H

#include "unicode/utypes.h"

#if U_SHOW_CPLUSPLUS_API

#if !UCONFIG_NO_NORMALIZATION

#include "unicode/uobject.h"
#include "unicode/unistr.h"

/**
 * \file
 * \brief C++ API: Canonical Iterator
 */
 
/** Should permutation skip characters with combining class zero
 *  Should be either TRUE or FALSE. This is a compile time option
 *  @stable ICU 2.4
 */
#ifndef CANITER_SKIP_ZEROES
#define CANITER_SKIP_ZEROES TRUE
#endif

U_NAMESPACE_BEGIN

class Hashtable;
class Normalizer2;
class Normalizer2Impl;

/**
 * This class allows one to iterate through all the strings that are canonically equivalent to a given
 * string. For example, here are some sample results:
Results for: {LATIN CAPITAL LETTER A WITH RING ABOVE}{LATIN SMALL LETTER D}{COMBINING DOT ABOVE}{COMBINING CEDILLA}
1: \\u0041\\u030A\\u0064\\u0307\\u0327
 = {LATIN CAPITAL LETTER A}{COMBINING RING ABOVE}{LATIN SMALL LETTER D}{COMBINING DOT ABOVE}{COMBINING CEDILLA}
2: \\u0041\\u030A\\u0064\\u0327\\u0307
 = {LATIN CAPITAL LETTER A}{COMBINING RING ABOVE}{LATIN SMALL LETTER D}{COMBINING CEDILLA}{COMBINING DOT ABOVE}
3: \\u0041\\u030A\\u1E0B\\u0327
 = {LATIN CAPITAL LETTER A}{COMBINING RING ABOVE}{LATIN SMALL LETTER D WITH DOT ABOVE}{COMBINING CEDILLA}
4: \\u0041\\u030A\\u1E11\\u0307
 = {LATIN CAPITAL LETTER A}{COMBINING RING ABOVE}{LATIN SMALL LETTER D WITH CEDILLA}{COMBINING DOT ABOVE}
5: \\u00C5\\u0064\\u0307\\u0327
 = {LATIN CAPITAL LETTER A WITH RING ABOVE}{LATIN SMALL LETTER D}{COMBINING DOT ABOVE}{COMBINING CEDILLA}
6: \\u00C5\\u0064\\u0327\\u0307
 = {LATIN CAPITAL LETTER A WITH RING ABOVE}{LATIN SMALL LETTER D}{COMBINING CEDILLA}{COMBINING DOT ABOVE}
7: \\u00C5\\u1E0B\\u0327
 = {LATIN CAPITAL LETTER A WITH RING ABOVE}{LATIN SMALL LETTER D WITH DOT ABOVE}{COMBINING CEDILLA}
8: \\u00C5\\u1E11\\u0307
 = {LATIN CAPITAL LETTER A WITH RING ABOVE}{LATIN SMALL LETTER D WITH CEDILLA}{COMBINING DOT ABOVE}
9: \\u212B\\u0064\\u0307\\u0327
 = {ANGSTROM SIGN}{LATIN SMALL LETTER D}{COMBINING DOT ABOVE}{COMBINING CEDILLA}
10: \\u212B\\u0064\\u0327\\u0307
 = {ANGSTROM SIGN}{LATIN SMALL LETTER D}{COMBINING CEDILLA}{COMBINING DOT ABOVE}
11: \\u212B\\u1E0B\\u0327
 = {ANGSTROM SIGN}{LATIN SMALL LETTER D WITH DOT ABOVE}{COMBINING CEDILLA}
12: \\u212B\\u1E11\\u0307
 = {ANGSTROM SIGN}{LATIN SMALL LETTER D WITH CEDILLA}{COMBINING DOT ABOVE}
 *<br>Note: the code is intended for use with small strings, and is not suitable for larger ones,
 * since it has not been optimized for that situation.
 * Note, CanonicalIterator is not intended to be subclassed.
 * @author M. Davis
 * @author C++ port by V. Weinstein
 * @stable ICU 2.4
 */
class U_COMMON_API CanonicalIterator U_FINAL : public UObject {
public:
    /**
     * Construct a CanonicalIterator object
     * @param source    string to get results for
     * @param status    Fill-in parameter which receives the status of this operation.
     * @stable ICU 2.4
     */
    CanonicalIterator(const UnicodeString &source, UErrorCode &status);

    /** Destructor
     *  Cleans pieces
     * @stable ICU 2.4
     */
    virtual ~CanonicalIterator();

    /**
     * Gets the NFD form of the current source we are iterating over.
     * @return gets the source: NOTE: it is the NFD form of source
     * @stable ICU 2.4
     */
    UnicodeString getSource();

    /**
     * Resets the iterator so that one can start again from the beginning.
     * @stable ICU 2.4
     */
    void reset();

    /**
     * Get the next canonically equivalent string.
     * <br><b>Warning: The strings are not guaranteed to be in any particular order.</b>
     * @return the next string that is canonically equivalent. A bogus string is returned when
     * the iteration is done.
     * @stable ICU 2.4
     */
    UnicodeString next();

    /**
     * Set a new source for this iterator. Allows object reuse.
     * @param newSource     the source string to iterate against. This allows the same iterator to be used
     *                     while changing the source string, saving object creation.
     * @param status        Fill-in parameter which receives the status of this operation.
     * @stable ICU 2.4
     */
    void setSource(const UnicodeString &newSource, UErrorCode &status);

#ifndef U_HIDE_INTERNAL_API
    /**
     * Dumb recursive implementation of permutation.
     * TODO: optimize
     * @param source     the string to find permutations for
     * @param skipZeros  determine if skip zeros
     * @param result     the results in a set.
     * @param status       Fill-in parameter which receives the status of this operation.
     * @internal
     */
    static void U_EXPORT2 permute(UnicodeString &source, UBool skipZeros, Hashtable *result, UErrorCode &status);
#endif  /* U_HIDE_INTERNAL_API */

    /**
     * ICU "poor man's RTTI", returns a UClassID for this class.
     *
     * @stable ICU 2.2
     */
    static UClassID U_EXPORT2 getStaticClassID();

    /**
     * ICU "poor man's RTTI", returns a UClassID for the actual class.
     *
     * @stable ICU 2.2
     */
    virtual UClassID getDynamicClassID() const;

private:
    // ===================== PRIVATES ==============================
    // private default constructor
    CanonicalIterator();


    /**
     * Copy constructor. Private for now.
     * @internal (private)
     */
    CanonicalIterator(const CanonicalIterator& other);

    /**
     * Assignment operator. Private for now.
     * @internal (private)
     */
    CanonicalIterator& operator=(const CanonicalIterator& other);

    // fields
    UnicodeString source;
    UBool done;

    // 2 dimensional array holds the pieces of the string with
    // their different canonically equivalent representations
    UnicodeString **pieces;
    int32_t pieces_length;
    int32_t *pieces_lengths;

    // current is used in iterating to combine pieces
    int32_t *current;
    int32_t current_length;

    // transient fields
    UnicodeString buffer;

    const Normalizer2 &nfd;
    const Normalizer2Impl &nfcImpl;

    // we have a segment, in NFD. Find all the strings that are canonically equivalent to it.
    UnicodeString *getEquivalents(const UnicodeString &segment, int32_t &result_len, UErrorCode &status); //private String[] getEquivalents(String segment)

    //Set getEquivalents2(String segment);
    Hashtable *getEquivalents2(Hashtable *fillinResult, const char16_t *segment, int32_t segLen, UErrorCode &status);
    //Hashtable *getEquivalents2(const UnicodeString &segment, int32_t segLen, UErrorCode &status);

    /**
     * See if the decomposition of cp2 is at segment starting at segmentPos
     * (with canonical rearrangment!)
     * If so, take the remainder, and return the equivalents
     */
    //Set extract(int comp, String segment, int segmentPos, StringBuffer buffer);
    Hashtable *extract(Hashtable *fillinResult, UChar32 comp, const char16_t *segment, int32_t segLen, int32_t segmentPos, UErrorCode &status);
    //Hashtable *extract(UChar32 comp, const UnicodeString &segment, int32_t segLen, int32_t segmentPos, UErrorCode &status);

    void cleanPieces();

};

U_NAMESPACE_END

#endif /* #if !UCONFIG_NO_NORMALIZATION */

#endif /* U_SHOW_CPLUSPLUS_API */

#endif

Filemanager

Name Type Size Permission Actions
alphaindex.h File 26.48 KB 0644
appendable.h File 8.49 KB 0644
basictz.h File 9.15 KB 0644
brkiter.h File 27.8 KB 0644
bytestream.h File 9.6 KB 0644
bytestrie.h File 20.77 KB 0644
bytestriebuilder.h File 7.08 KB 0644
calendar.h File 105.74 KB 0644
caniter.h File 7.43 KB 0644
casemap.h File 25.33 KB 0644
char16ptr.h File 7.22 KB 0644
chariter.h File 24.05 KB 0644
choicfmt.h File 23.91 KB 0644
coleitr.h File 13.76 KB 0644
coll.h File 56.23 KB 0644
compactdecimalformat.h File 6.88 KB 0644
curramt.h File 3.76 KB 0644
currpinf.h File 7.3 KB 0644
currunit.h File 4.05 KB 0644
datefmt.h File 40.67 KB 0644
dbbi.h File 1.19 KB 0644
dcfmtsym.h File 20.13 KB 0644
decimfmt.h File 87.38 KB 0644
docmain.h File 6.97 KB 0644
dtfmtsym.h File 37.7 KB 0644
dtintrv.h File 3.84 KB 0644
dtitvfmt.h File 46.63 KB 0644
dtitvinf.h File 18.51 KB 0644
dtptngen.h File 25.08 KB 0644
dtrule.h File 8.68 KB 0644
edits.h File 20.74 KB 0644
enumset.h File 2.08 KB 0644
errorcode.h File 4.84 KB 0644
fieldpos.h File 8.69 KB 0644
filteredbrk.h File 5.37 KB 0644
fmtable.h File 24.42 KB 0644
format.h File 12.5 KB 0644
formattedvalue.h File 10.27 KB 0644
fpositer.h File 3.04 KB 0644
gender.h File 3.33 KB 0644
gregocal.h File 31.71 KB 0644
icudataver.h File 1.03 KB 0644
icuplug.h File 11.88 KB 0644
idna.h File 12.7 KB 0644
listformatter.h File 9.47 KB 0644
localebuilder.h File 11.27 KB 0644
localematcher.h File 22.5 KB 0644
localpointer.h File 19.69 KB 0644
locdspnm.h File 7.12 KB 0644
locid.h File 47.4 KB 0644
measfmt.h File 11.33 KB 0644
measunit.h File 93.31 KB 0644
measure.h File 4.32 KB 0644
messagepattern.h File 33.71 KB 0644
msgfmt.h File 44.11 KB 0644
normalizer2.h File 34.03 KB 0644
normlzr.h File 30.94 KB 0644
nounit.h File 2.69 KB 0644
numberformatter.h File 86.31 KB 0644
numberrangeformatter.h File 30.14 KB 0644
numfmt.h File 49.81 KB 0644
numsys.h File 7.19 KB 0644
parseerr.h File 3.08 KB 0644
parsepos.h File 5.56 KB 0644
platform.h File 28.08 KB 0644
plurfmt.h File 25.2 KB 0644
plurrule.h File 18.39 KB 0644
ptypes.h File 3.49 KB 0644
putil.h File 6.33 KB 0644
rbbi.h File 26.58 KB 0644
rbnf.h File 48.73 KB 0644
rbtz.h File 15.6 KB 0644
regex.h File 84.36 KB 0644
region.h File 9.18 KB 0644
reldatefmt.h File 22.62 KB 0644
rep.h File 9.37 KB 0644
resbund.h File 18.07 KB 0644
schriter.h File 6.32 KB 0644
scientificnumberformatter.h File 6.4 KB 0644
search.h File 22.22 KB 0644
selfmt.h File 14.3 KB 0644
simpleformatter.h File 12.59 KB 0644
simpletz.h File 45.44 KB 0644
smpdtfmt.h File 70.97 KB 0644
sortkey.h File 11.18 KB 0644
std_string.h File 1.05 KB 0644
strenum.h File 9.92 KB 0644
stringoptions.h File 5.79 KB 0644
stringpiece.h File 7.38 KB 0644
stringtriebuilder.h File 15.33 KB 0644
stsearch.h File 21.3 KB 0644
symtable.h File 4.27 KB 0644
tblcoll.h File 36.61 KB 0644
timezone.h File 41.02 KB 0644
tmunit.h File 3.38 KB 0644
tmutamt.h File 4.9 KB 0644
tmutfmt.h File 7.85 KB 0644
translit.h File 65.82 KB 0644
tzfmt.h File 42.89 KB 0644
tznames.h File 16.85 KB 0644
tzrule.h File 35.37 KB 0644
tztrans.h File 6.12 KB 0644
ubidi.h File 89.56 KB 0644
ubiditransform.h File 12.65 KB 0644
ubrk.h File 23.97 KB 0644
ucal.h File 56.9 KB 0644
ucasemap.h File 15.18 KB 0644
ucat.h File 5.36 KB 0644
uchar.h File 140.56 KB 0644
ucharstrie.h File 22.58 KB 0644
ucharstriebuilder.h File 7.21 KB 0644
uchriter.h File 13.2 KB 0644
uclean.h File 11.21 KB 0644
ucnv.h File 83.09 KB 0644
ucnv_cb.h File 6.59 KB 0644
ucnv_err.h File 20.99 KB 0644
ucnvsel.h File 6.14 KB 0644
ucol.h File 61.46 KB 0644
ucoleitr.h File 9.46 KB 0644
uconfig.h File 12.07 KB 0644
ucpmap.h File 5.53 KB 0644
ucptrie.h File 22.46 KB 0644
ucsdet.h File 14.67 KB 0644
ucurr.h File 16.12 KB 0644
udat.h File 60.88 KB 0644
udata.h File 15.56 KB 0644
udateintervalformat.h File 10.03 KB 0644
udatpg.h File 26.01 KB 0644
udisplaycontext.h File 5.89 KB 0644
uenum.h File 7.78 KB 0644
ufieldpositer.h File 4.36 KB 0644
uformattable.h File 10.94 KB 0644
uformattedvalue.h File 12.14 KB 0644
ugender.h File 2 KB 0644
uidna.h File 33.37 KB 0644
uiter.h File 22.77 KB 0644
uldnames.h File 10.45 KB 0644
ulistformatter.h File 8.83 KB 0644
uloc.h File 52.54 KB 0644
ulocdata.h File 11.26 KB 0644
umachine.h File 14.53 KB 0644
umisc.h File 1.33 KB 0644
umsg.h File 24.23 KB 0644
umutablecptrie.h File 8.24 KB 0644
unifilt.h File 3.96 KB 0644
unifunct.h File 4.04 KB 0644
unimatch.h File 6.1 KB 0644
unirepl.h File 3.38 KB 0644
uniset.h File 64.9 KB 0644
unistr.h File 170.43 KB 0644
unorm.h File 20.52 KB 0644
unorm2.h File 24.66 KB 0644
unum.h File 53.62 KB 0644
unumberformatter.h File 25.36 KB 0644
unumsys.h File 7.21 KB 0644
uobject.h File 10.68 KB 0644
upluralrules.h File 7.88 KB 0644
uregex.h File 72.05 KB 0644
uregion.h File 9.84 KB 0644
ureldatefmt.h File 17.26 KB 0644
urename.h File 130.97 KB 0644
urep.h File 5.38 KB 0644
ures.h File 36.54 KB 0644
uscript.h File 26.87 KB 0644
usearch.h File 38.12 KB 0644
uset.h File 40 KB 0644
usetiter.h File 9.55 KB 0644
ushape.h File 18 KB 0644
uspoof.h File 65.9 KB 0644
usprep.h File 8.14 KB 0644
ustdio.h File 38.54 KB 0644
ustream.h File 1.89 KB 0644
ustring.h File 72.47 KB 0644
ustringtrie.h File 3.15 KB 0644
utext.h File 58.13 KB 0644
utf.h File 7.86 KB 0644
utf16.h File 23.32 KB 0644
utf32.h File 763 B 0644
utf8.h File 30.96 KB 0644
utf_old.h File 45.83 KB 0644
utmscale.h File 13.78 KB 0644
utrace.h File 15.73 KB 0644
utrans.h File 25.52 KB 0644
utypes.h File 30.74 KB 0644
uvernum.h File 6.67 KB 0644
uversion.h File 6 KB 0644
vtzone.h File 20.3 KB 0644