// © 2016 and later: Unicode, Inc. and others. // License & terms of use: http://www.unicode.org/copyright.html /* ******************************************************************************* * Copyright (C) 2010-2012, International Business Machines * Corporation and others. All Rights Reserved. ******************************************************************************* * file name: idna.h * encoding: UTF-8 * tab size: 8 (not used) * indentation:4 * * created on: 2010mar05 * created by: Markus W. Scherer */ #ifndef __IDNA_H__ #define __IDNA_H__ /** * \file * \brief C++ API: Internationalizing Domain Names in Applications (IDNA) */ #include "unicode/utypes.h" #if U_SHOW_CPLUSPLUS_API #if !UCONFIG_NO_IDNA #include "unicode/bytestream.h" #include "unicode/stringpiece.h" #include "unicode/uidna.h" #include "unicode/unistr.h" U_NAMESPACE_BEGIN class IDNAInfo; /** * Abstract base class for IDNA processing. * See http://www.unicode.org/reports/tr46/ * and http://www.ietf.org/rfc/rfc3490.txt * * The IDNA class is not intended for public subclassing. * * This C++ API currently only implements UTS #46. * The uidna.h C API implements both UTS #46 (functions using UIDNA service object) * and IDNA2003 (functions that do not use a service object). * @stable ICU 4.6 */ class U_COMMON_API IDNA : public UObject { public: /** * Destructor. * @stable ICU 4.6 */ ~IDNA(); /** * Returns an IDNA instance which implements UTS #46. * Returns an unmodifiable instance, owned by the caller. * Cache it for multiple operations, and delete it when done. * The instance is thread-safe, that is, it can be used concurrently. * * UTS #46 defines Unicode IDNA Compatibility Processing, * updated to the latest version of Unicode and compatible with both * IDNA2003 and IDNA2008. * * The worker functions use transitional processing, including deviation mappings, * unless UIDNA_NONTRANSITIONAL_TO_ASCII or UIDNA_NONTRANSITIONAL_TO_UNICODE * is used in which case the deviation characters are passed through without change. * * Disallowed characters are mapped to U+FFFD. * * For available options see the uidna.h header. * Operations with the UTS #46 instance do not support the * UIDNA_ALLOW_UNASSIGNED option. * * By default, the UTS #46 implementation allows all ASCII characters (as valid or mapped). * When the UIDNA_USE_STD3_RULES option is used, ASCII characters other than * letters, digits, hyphen (LDH) and dot/full stop are disallowed and mapped to U+FFFD. * * @param options Bit set to modify the processing and error checking. * See option bit set values in uidna.h. * @param errorCode Standard ICU error code. Its input value must * pass the U_SUCCESS() test, or else the function returns * immediately. Check for U_FAILURE() on output or use with * function chaining. (See User Guide for details.) * @return the UTS #46 IDNA instance, if successful * @stable ICU 4.6 */ static IDNA * createUTS46Instance(uint32_t options, UErrorCode &errorCode); /** * Converts a single domain name label into its ASCII form for DNS lookup. * If any processing step fails, then info.hasErrors() will be true and * the result might not be an ASCII string. * The label might be modified according to the types of errors. * Labels with severe errors will be left in (or turned into) their Unicode form. * * The UErrorCode indicates an error only in exceptional cases, * such as a U_MEMORY_ALLOCATION_ERROR. * * @param label Input domain name label * @param dest Destination string object * @param info Output container of IDNA processing details. * @param errorCode Standard ICU error code. Its input value must * pass the U_SUCCESS() test, or else the function returns * immediately. Check for U_FAILURE() on output or use with * function chaining. (See User Guide for details.) * @return dest * @stable ICU 4.6 */ virtual UnicodeString & labelToASCII(const UnicodeString &label, UnicodeString &dest, IDNAInfo &info, UErrorCode &errorCode) const = 0; /** * Converts a single domain name label into its Unicode form for human-readable display. * If any processing step fails, then info.hasErrors() will be true. * The label might be modified according to the types of errors. * * The UErrorCode indicates an error only in exceptional cases, * such as a U_MEMORY_ALLOCATION_ERROR. * * @param label Input domain name label * @param dest Destination string object * @param info Output container of IDNA processing details. * @param errorCode Standard ICU error code. Its input value must * pass the U_SUCCESS() test, or else the function returns * immediately. Check for U_FAILURE() on output or use with * function chaining. (See User Guide for details.) * @return dest * @stable ICU 4.6 */ virtual UnicodeString & labelToUnicode(const UnicodeString &label, UnicodeString &dest, IDNAInfo &info, UErrorCode &errorCode) const = 0; /** * Converts a whole domain name into its ASCII form for DNS lookup. * If any processing step fails, then info.hasErrors() will be true and * the result might not be an ASCII string. * The domain name might be modified according to the types of errors. * Labels with severe errors will be left in (or turned into) their Unicode form. * * The UErrorCode indicates an error only in exceptional cases, * such as a U_MEMORY_ALLOCATION_ERROR. * * @param name Input domain name * @param dest Destination string object * @param info Output container of IDNA processing details. * @param errorCode Standard ICU error code. Its input value must * pass the U_SUCCESS() test, or else the function returns * immediately. Check for U_FAILURE() on output or use with * function chaining. (See User Guide for details.) * @return dest * @stable ICU 4.6 */ virtual UnicodeString & nameToASCII(const UnicodeString &name, UnicodeString &dest, IDNAInfo &info, UErrorCode &errorCode) const = 0; /** * Converts a whole domain name into its Unicode form for human-readable display. * If any processing step fails, then info.hasErrors() will be true. * The domain name might be modified according to the types of errors. * * The UErrorCode indicates an error only in exceptional cases, * such as a U_MEMORY_ALLOCATION_ERROR. * * @param name Input domain name * @param dest Destination string object * @param info Output container of IDNA processing details. * @param errorCode Standard ICU error code. Its input value must * pass the U_SUCCESS() test, or else the function returns * immediately. Check for U_FAILURE() on output or use with * function chaining. (See User Guide for details.) * @return dest * @stable ICU 4.6 */ virtual UnicodeString & nameToUnicode(const UnicodeString &name, UnicodeString &dest, IDNAInfo &info, UErrorCode &errorCode) const = 0; // UTF-8 versions of the processing methods ---------------------------- *** /** * Converts a single domain name label into its ASCII form for DNS lookup. * UTF-8 version of labelToASCII(), same behavior. * * @param label Input domain name label * @param dest Destination byte sink; Flush()ed if successful * @param info Output container of IDNA processing details. * @param errorCode Standard ICU error code. Its input value must * pass the U_SUCCESS() test, or else the function returns * immediately. Check for U_FAILURE() on output or use with * function chaining. (See User Guide for details.) * @return dest * @stable ICU 4.6 */ virtual void labelToASCII_UTF8(StringPiece label, ByteSink &dest, IDNAInfo &info, UErrorCode &errorCode) const; /** * Converts a single domain name label into its Unicode form for human-readable display. * UTF-8 version of labelToUnicode(), same behavior. * * @param label Input domain name label * @param dest Destination byte sink; Flush()ed if successful * @param info Output container of IDNA processing details. * @param errorCode Standard ICU error code. Its input value must * pass the U_SUCCESS() test, or else the function returns * immediately. Check for U_FAILURE() on output or use with * function chaining. (See User Guide for details.) * @return dest * @stable ICU 4.6 */ virtual void labelToUnicodeUTF8(StringPiece label, ByteSink &dest, IDNAInfo &info, UErrorCode &errorCode) const; /** * Converts a whole domain name into its ASCII form for DNS lookup. * UTF-8 version of nameToASCII(), same behavior. * * @param name Input domain name * @param dest Destination byte sink; Flush()ed if successful * @param info Output container of IDNA processing details. * @param errorCode Standard ICU error code. Its input value must * pass the U_SUCCESS() test, or else the function returns * immediately. Check for U_FAILURE() on output or use with * function chaining. (See User Guide for details.) * @return dest * @stable ICU 4.6 */ virtual void nameToASCII_UTF8(StringPiece name, ByteSink &dest, IDNAInfo &info, UErrorCode &errorCode) const; /** * Converts a whole domain name into its Unicode form for human-readable display. * UTF-8 version of nameToUnicode(), same behavior. * * @param name Input domain name * @param dest Destination byte sink; Flush()ed if successful * @param info Output container of IDNA processing details. * @param errorCode Standard ICU error code. Its input value must * pass the U_SUCCESS() test, or else the function returns * immediately. Check for U_FAILURE() on output or use with * function chaining. (See User Guide for details.) * @return dest * @stable ICU 4.6 */ virtual void nameToUnicodeUTF8(StringPiece name, ByteSink &dest, IDNAInfo &info, UErrorCode &errorCode) const; }; class UTS46; /** * Output container for IDNA processing errors. * The IDNAInfo class is not suitable for subclassing. * @stable ICU 4.6 */ class U_COMMON_API IDNAInfo : public UMemory { public: /** * Constructor for stack allocation. * @stable ICU 4.6 */ IDNAInfo() : errors(0), labelErrors(0), isTransDiff(false), isBiDi(false), isOkBiDi(true) {} /** * Were there IDNA processing errors? * @return true if there were processing errors * @stable ICU 4.6 */ UBool hasErrors() const { return errors!=0; } /** * Returns a bit set indicating IDNA processing errors. * See UIDNA_ERROR_... constants in uidna.h. * @return bit set of processing errors * @stable ICU 4.6 */ uint32_t getErrors() const { return errors; } /** * Returns true if transitional and nontransitional processing produce different results. * This is the case when the input label or domain name contains * one or more deviation characters outside a Punycode label (see UTS #46). * <ul> * <li>With nontransitional processing, such characters are * copied to the destination string. * <li>With transitional processing, such characters are * mapped (sharp s/sigma) or removed (joiner/nonjoiner). * </ul> * @return true if transitional and nontransitional processing produce different results * @stable ICU 4.6 */ UBool isTransitionalDifferent() const { return isTransDiff; } private: friend class UTS46; IDNAInfo(const IDNAInfo &other) = delete; // no copying IDNAInfo &operator=(const IDNAInfo &other) = delete; // no copying void reset() { errors=labelErrors=0; isTransDiff=false; isBiDi=false; isOkBiDi=true; } uint32_t errors, labelErrors; UBool isTransDiff; UBool isBiDi; UBool isOkBiDi; }; U_NAMESPACE_END #endif // UCONFIG_NO_IDNA #endif /* U_SHOW_CPLUSPLUS_API */ #endif // __IDNA_H__
Name | Type | Size | Permission | Actions |
---|---|---|---|---|
alphaindex.h | File | 26.54 KB | 0644 |
|
appendable.h | File | 8.54 KB | 0644 |
|
basictz.h | File | 9.99 KB | 0644 |
|
brkiter.h | File | 27.86 KB | 0644 |
|
bytestream.h | File | 10.75 KB | 0644 |
|
bytestrie.h | File | 20.8 KB | 0644 |
|
bytestriebuilder.h | File | 7.48 KB | 0644 |
|
calendar.h | File | 106.52 KB | 0644 |
|
caniter.h | File | 7.47 KB | 0644 |
|
casemap.h | File | 25.42 KB | 0644 |
|
char16ptr.h | File | 7.22 KB | 0644 |
|
chariter.h | File | 24.06 KB | 0644 |
|
choicfmt.h | File | 24 KB | 0644 |
|
coleitr.h | File | 13.78 KB | 0644 |
|
coll.h | File | 56.3 KB | 0644 |
|
compactdecimalformat.h | File | 6.88 KB | 0644 |
|
curramt.h | File | 3.67 KB | 0644 |
|
currpinf.h | File | 7.3 KB | 0644 |
|
currunit.h | File | 4.02 KB | 0644 |
|
datefmt.h | File | 40.72 KB | 0644 |
|
dbbi.h | File | 1.19 KB | 0644 |
|
dcfmtsym.h | File | 20.94 KB | 0644 |
|
decimfmt.h | File | 87.54 KB | 0644 |
|
displayoptions.h | File | 7.08 KB | 0644 |
|
docmain.h | File | 7.3 KB | 0644 |
|
dtfmtsym.h | File | 38.23 KB | 0644 |
|
dtintrv.h | File | 3.85 KB | 0644 |
|
dtitvfmt.h | File | 49.26 KB | 0644 |
|
dtitvinf.h | File | 18.63 KB | 0644 |
|
dtptngen.h | File | 28.64 KB | 0644 |
|
dtrule.h | File | 8.69 KB | 0644 |
|
edits.h | File | 20.73 KB | 0644 |
|
enumset.h | File | 2.08 KB | 0644 |
|
errorcode.h | File | 4.84 KB | 0644 |
|
fieldpos.h | File | 8.7 KB | 0644 |
|
filteredbrk.h | File | 5.37 KB | 0644 |
|
fmtable.h | File | 24.45 KB | 0644 |
|
format.h | File | 12.5 KB | 0644 |
|
formattednumber.h | File | 6.15 KB | 0644 |
|
formattedvalue.h | File | 9.75 KB | 0644 |
|
fpositer.h | File | 3.03 KB | 0644 |
|
gender.h | File | 3.35 KB | 0644 |
|
gregocal.h | File | 30.03 KB | 0644 |
|
icudataver.h | File | 1.02 KB | 0644 |
|
icuplug.h | File | 12.1 KB | 0644 |
|
idna.h | File | 12.71 KB | 0644 |
|
listformatter.h | File | 8.59 KB | 0644 |
|
localebuilder.h | File | 11.08 KB | 0644 |
|
localematcher.h | File | 26.83 KB | 0644 |
|
localpointer.h | File | 19.44 KB | 0644 |
|
locdspnm.h | File | 7.12 KB | 0644 |
|
locid.h | File | 48.27 KB | 0644 |
|
measfmt.h | File | 11.42 KB | 0644 |
|
measunit.h | File | 107.38 KB | 0644 |
|
measure.h | File | 4.69 KB | 0644 |
|
messagepattern.h | File | 33.72 KB | 0644 |
|
msgfmt.h | File | 44.21 KB | 0644 |
|
normalizer2.h | File | 34.73 KB | 0644 |
|
normlzr.h | File | 30.97 KB | 0644 |
|
nounit.h | File | 2.25 KB | 0644 |
|
numberformatter.h | File | 90.03 KB | 0644 |
|
numberrangeformatter.h | File | 25.32 KB | 0644 |
|
numfmt.h | File | 50.26 KB | 0644 |
|
numsys.h | File | 7.23 KB | 0644 |
|
parseerr.h | File | 3.08 KB | 0644 |
|
parsepos.h | File | 5.57 KB | 0644 |
|
platform.h | File | 27.8 KB | 0644 |
|
plurfmt.h | File | 25.25 KB | 0644 |
|
plurrule.h | File | 20.64 KB | 0644 |
|
ptypes.h | File | 3.49 KB | 0644 |
|
putil.h | File | 6.32 KB | 0644 |
|
rbbi.h | File | 32.07 KB | 0644 |
|
rbnf.h | File | 49.92 KB | 0644 |
|
rbtz.h | File | 15.77 KB | 0644 |
|
regex.h | File | 84.45 KB | 0644 |
|
region.h | File | 9.2 KB | 0644 |
|
reldatefmt.h | File | 22.36 KB | 0644 |
|
rep.h | File | 9.38 KB | 0644 |
|
resbund.h | File | 18.11 KB | 0644 |
|
schriter.h | File | 6.1 KB | 0644 |
|
scientificnumberformatter.h | File | 6.44 KB | 0644 |
|
search.h | File | 22.24 KB | 0644 |
|
selfmt.h | File | 14.35 KB | 0644 |
|
simpleformatter.h | File | 12.6 KB | 0644 |
|
simplenumberformatter.h | File | 8.88 KB | 0644 |
|
simpletz.h | File | 45.65 KB | 0644 |
|
smpdtfmt.h | File | 71.85 KB | 0644 |
|
sortkey.h | File | 11.19 KB | 0644 |
|
std_string.h | File | 1.05 KB | 0644 |
|
strenum.h | File | 9.96 KB | 0644 |
|
stringoptions.h | File | 5.79 KB | 0644 |
|
stringpiece.h | File | 10.05 KB | 0644 |
|
stringtriebuilder.h | File | 15.5 KB | 0644 |
|
stsearch.h | File | 21.44 KB | 0644 |
|
symtable.h | File | 4.28 KB | 0644 |
|
tblcoll.h | File | 36.94 KB | 0644 |
|
timezone.h | File | 45.67 KB | 0644 |
|
tmunit.h | File | 3.4 KB | 0644 |
|
tmutamt.h | File | 4.91 KB | 0644 |
|
tmutfmt.h | File | 7.42 KB | 0644 |
|
translit.h | File | 65.83 KB | 0644 |
|
tzfmt.h | File | 42.96 KB | 0644 |
|
tznames.h | File | 16.85 KB | 0644 |
|
tzrule.h | File | 34.86 KB | 0644 |
|
tztrans.h | File | 6.13 KB | 0644 |
|
ubidi.h | File | 89.61 KB | 0644 |
|
ubiditransform.h | File | 12.71 KB | 0644 |
|
ubrk.h | File | 24.43 KB | 0644 |
|
ucal.h | File | 64.28 KB | 0644 |
|
ucasemap.h | File | 15.21 KB | 0644 |
|
ucat.h | File | 5.35 KB | 0644 |
|
uchar.h | File | 145.7 KB | 0644 |
|
ucharstrie.h | File | 22.56 KB | 0644 |
|
ucharstriebuilder.h | File | 7.48 KB | 0644 |
|
uchriter.h | File | 13.42 KB | 0644 |
|
uclean.h | File | 11.21 KB | 0644 |
|
ucnv.h | File | 83.46 KB | 0644 |
|
ucnv_cb.h | File | 6.58 KB | 0644 |
|
ucnv_err.h | File | 20.98 KB | 0644 |
|
ucnvsel.h | File | 6.24 KB | 0644 |
|
ucol.h | File | 62.7 KB | 0644 |
|
ucoleitr.h | File | 9.82 KB | 0644 |
|
uconfig.h | File | 12.31 KB | 0644 |
|
ucpmap.h | File | 5.54 KB | 0644 |
|
ucptrie.h | File | 22.51 KB | 0644 |
|
ucsdet.h | File | 14.69 KB | 0644 |
|
ucurr.h | File | 16.72 KB | 0644 |
|
udat.h | File | 62.36 KB | 0644 |
|
udata.h | File | 15.63 KB | 0644 |
|
udateintervalformat.h | File | 11.93 KB | 0644 |
|
udatpg.h | File | 30.13 KB | 0644 |
|
udisplaycontext.h | File | 5.94 KB | 0644 |
|
udisplayoptions.h | File | 8.86 KB | 0644 |
|
uenum.h | File | 7.79 KB | 0644 |
|
ufieldpositer.h | File | 4.41 KB | 0644 |
|
uformattable.h | File | 10.97 KB | 0644 |
|
uformattednumber.h | File | 8.09 KB | 0644 |
|
uformattedvalue.h | File | 12.25 KB | 0644 |
|
ugender.h | File | 2.06 KB | 0644 |
|
uidna.h | File | 33.43 KB | 0644 |
|
uiter.h | File | 22.75 KB | 0644 |
|
uldnames.h | File | 10.48 KB | 0644 |
|
ulistformatter.h | File | 10.78 KB | 0644 |
|
uloc.h | File | 54.66 KB | 0644 |
|
ulocale.h | File | 6.35 KB | 0644 |
|
ulocbuilder.h | File | 16.72 KB | 0644 |
|
ulocdata.h | File | 11.3 KB | 0644 |
|
umachine.h | File | 15 KB | 0644 |
|
umisc.h | File | 1.34 KB | 0644 |
|
umsg.h | File | 24.25 KB | 0644 |
|
umutablecptrie.h | File | 8.3 KB | 0644 |
|
unifilt.h | File | 4 KB | 0644 |
|
unifunct.h | File | 4.05 KB | 0644 |
|
unimatch.h | File | 6.1 KB | 0644 |
|
unirepl.h | File | 3.38 KB | 0644 |
|
uniset.h | File | 66.85 KB | 0644 |
|
unistr.h | File | 171.35 KB | 0644 |
|
unorm.h | File | 20.55 KB | 0644 |
|
unorm2.h | File | 25.71 KB | 0644 |
|
unum.h | File | 55.16 KB | 0644 |
|
unumberformatter.h | File | 19.68 KB | 0644 |
|
unumberoptions.h | File | 5.23 KB | 0644 |
|
unumberrangeformatter.h | File | 15.35 KB | 0644 |
|
unumsys.h | File | 7.26 KB | 0644 |
|
uobject.h | File | 10.66 KB | 0644 |
|
upluralrules.h | File | 8.79 KB | 0644 |
|
uregex.h | File | 71.99 KB | 0644 |
|
uregion.h | File | 9.81 KB | 0644 |
|
ureldatefmt.h | File | 16.98 KB | 0644 |
|
urename.h | File | 140.82 KB | 0644 |
|
urep.h | File | 5.38 KB | 0644 |
|
ures.h | File | 36.65 KB | 0644 |
|
uscript.h | File | 27.8 KB | 0644 |
|
usearch.h | File | 39.21 KB | 0644 |
|
uset.h | File | 45.61 KB | 0644 |
|
usetiter.h | File | 9.63 KB | 0644 |
|
ushape.h | File | 18 KB | 0644 |
|
usimplenumberformatter.h | File | 7.46 KB | 0644 |
|
uspoof.h | File | 80.32 KB | 0644 |
|
usprep.h | File | 8.19 KB | 0644 |
|
ustdio.h | File | 38.56 KB | 0644 |
|
ustream.h | File | 1.89 KB | 0644 |
|
ustring.h | File | 72.13 KB | 0644 |
|
ustringtrie.h | File | 3.15 KB | 0644 |
|
utext.h | File | 58.1 KB | 0644 |
|
utf.h | File | 7.87 KB | 0644 |
|
utf16.h | File | 23.35 KB | 0644 |
|
utf32.h | File | 763 B | 0644 |
|
utf8.h | File | 30.83 KB | 0644 |
|
utf_old.h | File | 45.8 KB | 0644 |
|
utmscale.h | File | 13.78 KB | 0644 |
|
utrace.h | File | 17.18 KB | 0644 |
|
utrans.h | File | 25.54 KB | 0644 |
|
utypes.h | File | 31.06 KB | 0644 |
|
uvernum.h | File | 6.33 KB | 0644 |
|
uversion.h | File | 5.99 KB | 0644 |
|
vtzone.h | File | 20.69 KB | 0644 |
|