scuffed-code/icu4c/source/common/punycode.h

// © 2016 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
/*
*******************************************************************************
*
*   Copyright (C) 2002-2003, International Business Machines
*   Corporation and others.  All Rights Reserved.
*
*******************************************************************************
*   file name:  punycode.h
*   encoding:   UTF-8
*   tab size:   8 (not used)
*   indentation:4
*
*   created on: 2002jan31
*   created by: Markus W. Scherer
*/

/* This ICU code derived from: */
/*
punycode.c 0.4.0 (2001-Nov-17-Sat)
http://www.cs.berkeley.edu/~amc/idn/
Adam M. Costello
http://www.nicemice.net/amc/
*/

#ifndef __PUNYCODE_H__
#define __PUNYCODE_H__

#include "unicode/utypes.h"

#if !UCONFIG_NO_IDNA

/**
 * u_strToPunycode() converts Unicode to Punycode.
 *
 * The input string must not contain single, unpaired surrogates.
 * The output will be represented as an array of ASCII code points.
 *
 * The output string is NUL-terminated according to normal ICU
 * string output rules.
 *
 * @param src Input Unicode string.
 *            This function handles a limited amount of code points
 *            (the limit is >=64).
 *            U_INDEX_OUTOFBOUNDS_ERROR is set if the limit is exceeded.
 * @param srcLength Number of UChars in src, or -1 if NUL-terminated.
 * @param dest Output Punycode array.
 * @param destCapacity Size of dest.
 * @param caseFlags Vector of boolean values, one per input UChar,
 *                  indicating that the corresponding character is to be
 *                  marked for the decoder optionally
 *                  uppercasing (TRUE) or lowercasing (FALSE)
 *                  the character.
 *                  ASCII characters are output directly in the case as marked.
 *                  Flags corresponding to trail surrogates are ignored.
 *                  If caseFlags==NULL then input characters are not
 *                  case-mapped.
 * @param pErrorCode ICU in/out error code parameter.
 *                   U_INVALID_CHAR_FOUND if src contains
 *                   unmatched single surrogates.
 *                   U_INDEX_OUTOFBOUNDS_ERROR if src contains
 *                   too many code points.
 * @return Number of ASCII characters in puny.
 *
 * @see u_strFromPunycode
 */
U_CFUNC int32_t
u_strToPunycode(const UChar *src, int32_t srcLength,
                UChar *dest, int32_t destCapacity,
                const UBool *caseFlags,
                UErrorCode *pErrorCode);

/**
 * u_strFromPunycode() converts Punycode to Unicode.
 * The Unicode string will be at most as long (in UChars)
 * than the Punycode string (in chars).
 *
 * @param src Input Punycode string.
 * @param srcLength Length of puny, or -1 if NUL-terminated
 * @param dest Output Unicode string buffer.
 * @param destCapacity Size of dest in number of UChars,
 *                     and of caseFlags in numbers of UBools.
 * @param caseFlags Output array for case flags as
 *                  defined by the Punycode string.
 *                  The caller should uppercase (TRUE) or lowercase (FASLE)
 *                  the corresponding character in dest.
 *                  For supplementary characters, only the lead surrogate
 *                  is marked, and FALSE is stored for the trail surrogate.
 *                  This is redundant and not necessary for ASCII characters
 *                  because they are already in the case indicated.
 *                  Can be NULL if the case flags are not needed.
 * @param pErrorCode ICU in/out error code parameter.
 *                   U_INVALID_CHAR_FOUND if a non-ASCII character
 *                   precedes the last delimiter ('-'),
 *                   or if an invalid character (not a-zA-Z0-9) is found
 *                   after the last delimiter.
 *                   U_ILLEGAL_CHAR_FOUND if the delta sequence is ill-formed.
 * @return Number of UChars written to dest.
 *
 * @see u_strToPunycode
 */
U_CFUNC int32_t
u_strFromPunycode(const UChar *src, int32_t srcLength,
                  UChar *dest, int32_t destCapacity,
                  UBool *caseFlags,
                  UErrorCode *pErrorCode);

#endif /* #if !UCONFIG_NO_IDNA */

#endif

/*
 * Hey, Emacs, please set the following:
 *
 * Local Variables:
 * indent-tabs-mode: nil
 * End:
 *
 */
ICU-12764 icu4c utf-8 source files, update Copyright notices. X-SVN-Rev: 39583 2017-01-20 00:20:31 +00:00			`// © 2016 and later: Unicode, Inc. and others.`
ICU-12564 Update copyright notice in trunk X-SVN-Rev: 38848 2016-06-15 18:58:17 +00:00			`// License & terms of use: http://www.unicode.org/copyright.html`
ICU-2194 IDNA API X-SVN-Rev: 11194 2003-02-28 21:35:25 +00:00			`/*`
			`*******************************************************************************`
			`*`
ICU-12564 Reverted r38761 and r38762, because we want to prepend the Unicode copyright for existing source files, instead of replacing copyright comments. X-SVN-Rev: 38776 2016-05-31 21:45:07 +00:00			`* Copyright (C) 2002-2003, International Business Machines`
			`* Corporation and others. All Rights Reserved.`
ICU-2194 IDNA API X-SVN-Rev: 11194 2003-02-28 21:35:25 +00:00			`*`
			`*******************************************************************************`
			`* file name: punycode.h`
ICU-12764 UTF-8 source files, update file encoding comments. X-SVN-Rev: 39641 2017-02-03 18:57:23 +00:00			`* encoding: UTF-8`
ICU-2194 IDNA API X-SVN-Rev: 11194 2003-02-28 21:35:25 +00:00			`* tab size: 8 (not used)`
			`* indentation:4`
			`*`
			`* created on: 2002jan31`
			`* created by: Markus W. Scherer`
			`*/`

			`/* This ICU code derived from: */`
			`/*`
			`punycode.c 0.4.0 (2001-Nov-17-Sat)`
			`http://www.cs.berkeley.edu/~amc/idn/`
			`Adam M. Costello`
			`http://www.nicemice.net/amc/`
			`*/`

			`#ifndef __PUNYCODE_H__`
			`#define __PUNYCODE_H__`

			`#include "unicode/utypes.h"`

ICU-2860 add UCONFIG_NO_NORMALIZATION and UCONFIG_NO_IDNA X-SVN-Rev: 11809 2003-05-06 01:37:52 +00:00			`#if !UCONFIG_NO_IDNA`

ICU-2194 IDNA API X-SVN-Rev: 11194 2003-02-28 21:35:25 +00:00			`/**`
			`* u_strToPunycode() converts Unicode to Punycode.`
			`*`
			`* The input string must not contain single, unpaired surrogates.`
			`* The output will be represented as an array of ASCII code points.`
			`*`
			`* The output string is NUL-terminated according to normal ICU`
			`* string output rules.`
			`*`
			`* @param src Input Unicode string.`
			`* This function handles a limited amount of code points`
			`* (the limit is >=64).`
			`* U_INDEX_OUTOFBOUNDS_ERROR is set if the limit is exceeded.`
			`* @param srcLength Number of UChars in src, or -1 if NUL-terminated.`
			`* @param dest Output Punycode array.`
			`* @param destCapacity Size of dest.`
			`* @param caseFlags Vector of boolean values, one per input UChar,`
			`* indicating that the corresponding character is to be`
			`* marked for the decoder optionally`
			`* uppercasing (TRUE) or lowercasing (FALSE)`
			`* the character.`
			`* ASCII characters are output directly in the case as marked.`
			`* Flags corresponding to trail surrogates are ignored.`
			`* If caseFlags==NULL then input characters are not`
			`* case-mapped.`
			`* @param pErrorCode ICU in/out error code parameter.`
			`* U_INVALID_CHAR_FOUND if src contains`
			`* unmatched single surrogates.`
			`* U_INDEX_OUTOFBOUNDS_ERROR if src contains`
			`* too many code points.`
			`* @return Number of ASCII characters in puny.`
			`*`
			`* @see u_strFromPunycode`
			`*/`
			`U_CFUNC int32_t`
			`u_strToPunycode(const UChar *src, int32_t srcLength,`
			`UChar *dest, int32_t destCapacity,`
			`const UBool *caseFlags,`
			`UErrorCode *pErrorCode);`

			`/**`
			`* u_strFromPunycode() converts Punycode to Unicode.`
			`* The Unicode string will be at most as long (in UChars)`
			`* than the Punycode string (in chars).`
			`*`
			`* @param src Input Punycode string.`
			`* @param srcLength Length of puny, or -1 if NUL-terminated`
			`* @param dest Output Unicode string buffer.`
			`* @param destCapacity Size of dest in number of UChars,`
			`* and of caseFlags in numbers of UBools.`
			`* @param caseFlags Output array for case flags as`
			`* defined by the Punycode string.`
			`* The caller should uppercase (TRUE) or lowercase (FASLE)`
			`* the corresponding character in dest.`
			`* For supplementary characters, only the lead surrogate`
			`* is marked, and FALSE is stored for the trail surrogate.`
			`* This is redundant and not necessary for ASCII characters`
			`* because they are already in the case indicated.`
			`* Can be NULL if the case flags are not needed.`
			`* @param pErrorCode ICU in/out error code parameter.`
			`* U_INVALID_CHAR_FOUND if a non-ASCII character`
			`* precedes the last delimiter ('-'),`
			`* or if an invalid character (not a-zA-Z0-9) is found`
			`* after the last delimiter.`
			`* U_ILLEGAL_CHAR_FOUND if the delta sequence is ill-formed.`
			`* @return Number of UChars written to dest.`
			`*`
			`* @see u_strToPunycode`
			`*/`
			`U_CFUNC int32_t`
			`u_strFromPunycode(const UChar *src, int32_t srcLength,`
			`UChar *dest, int32_t destCapacity,`
			`UBool *caseFlags,`
			`UErrorCode *pErrorCode);`

ICU-2860 add UCONFIG_NO_NORMALIZATION and UCONFIG_NO_IDNA X-SVN-Rev: 11809 2003-05-06 01:37:52 +00:00			`#endif /* #if !UCONFIG_NO_IDNA */`

ICU-2194 IDNA API X-SVN-Rev: 11194 2003-02-28 21:35:25 +00:00			`#endif`

			`/*`
			`* Hey, Emacs, please set the following:`
			`*`
			`* Local Variables:`
			`* indent-tabs-mode: nil`
			`* End:`
			`*`
			`*/`