2 *******************************************************************************
4 * Copyright (C) 2003-2007, International Business Machines
5 * Corporation and others. All Rights Reserved.
7 *******************************************************************************
8 * file name: idnaref.cpp
10 * tab size: 8 (not used)
13 * created on: 2003feb1
14 * created by: Ram Viswanadha
17 #include "unicode/utypes.h"
19 #if !UCONFIG_NO_IDNA && !UCONFIG_NO_TRANSLITERATION
28 #include "unicode/ustring.h"
/* The official IDNA ACE prefix is "xn--" */
31 static const UChar ACE_PREFIX
[] ={ 0x0078,0x006E,0x002d,0x002d } ;
32 #define ACE_PREFIX_LENGTH 4
34 #define MAX_LABEL_LENGTH 63
/* A label may be at most MAX_LABEL_LENGTH (63) code units long; the working buffers below are sized with headroom */
37 #define MAX_LABEL_BUFFER_SIZE 100
38 #define MAX_IDN_BUFFER_SIZE 300
40 #define CAPITAL_A 0x0041
41 #define CAPITAL_Z 0x005A
42 #define LOWER_CASE_DELTA 0x0020
43 #define FULL_STOP 0x002E
47 startsWithPrefix(const UChar
* src
, int32_t srcLength
){
48 UBool startsWithPrefix
= TRUE
;
50 if(srcLength
< ACE_PREFIX_LENGTH
){
54 for(int8_t i
=0; i
< ACE_PREFIX_LENGTH
; i
++){
55 if(u_tolower(src
[i
]) != ACE_PREFIX
[i
]){
56 startsWithPrefix
= FALSE
;
59 return startsWithPrefix
;
63 toASCIILower(UChar ch
){
64 if(CAPITAL_A
<= ch
&& ch
<= CAPITAL_Z
){
65 return ch
+ LOWER_CASE_DELTA
;
71 compareCaseInsensitiveASCII(const UChar
* s1
, int32_t s1Len
,
72 const UChar
* s2
, int32_t s2Len
){
74 return (s1Len
> s2Len
) ? s1Len
: s2Len
;
79 for(int32_t i
=0;/* no condition */;i
++) {
80 /* If we reach the ends of both strings then they match */
88 /* Case-insensitive comparison */
90 rc
=(int32_t)toASCIILower(c1
)-(int32_t)toASCIILower(c2
);
99 static UErrorCode
getError(enum punycode_status status
){
101 case punycode_success
:
103 case punycode_bad_input
: /* Input is invalid. */
104 return U_INVALID_CHAR_FOUND
;
105 case punycode_big_output
: /* Output would exceed the space provided. */
106 return U_BUFFER_OVERFLOW_ERROR
;
107 case punycode_overflow
: /* Input requires wider integers to process. */
108 return U_INDEX_OUTOFBOUNDS_ERROR
;
110 return U_INTERNAL_PROGRAM_ERROR
;
114 static inline int32_t convertASCIIToUChars(const char* src
,UChar
* dest
, int32_t length
){
116 for(i
=0;i
<length
;i
++){
121 static inline int32_t convertUCharsToASCII(const UChar
* src
,char* dest
, int32_t length
){
123 for(i
=0;i
<length
;i
++){
124 dest
[i
] = (char)src
[i
];
128 // wrapper around the reference Punycode implementation
129 static int32_t convertToPuny(const UChar
* src
, int32_t srcLength
,
130 UChar
* dest
, int32_t destCapacity
,
132 uint32_t b1Stack
[MAX_LABEL_BUFFER_SIZE
];
133 int32_t b1Len
= 0, b1Capacity
= MAX_LABEL_BUFFER_SIZE
;
134 uint32_t* b1
= b1Stack
;
135 char b2Stack
[MAX_LABEL_BUFFER_SIZE
];
137 int32_t b2Len
=MAX_LABEL_BUFFER_SIZE
;
138 punycode_status error
;
139 unsigned char* caseFlags
= NULL
;
141 u_strToUTF32((UChar32
*)b1
,b1Capacity
,&b1Len
,src
,srcLength
,&status
);
142 if(status
== U_BUFFER_OVERFLOW_ERROR
){
143 // redo processing of string
144 /* we do not have enough room so grow the buffer*/
145 b1
= (uint32_t*) uprv_malloc(b1Len
* sizeof(uint32_t));
147 status
= U_MEMORY_ALLOCATION_ERROR
;
151 status
= U_ZERO_ERROR
; // reset error
153 u_strToUTF32((UChar32
*)b1
,b1Len
,&b1Len
,src
,srcLength
,&status
);
155 if(U_FAILURE(status
)){
159 //caseFlags = (unsigned char*) uprv_malloc(b1Len *sizeof(unsigned char));
161 error
= punycode_encode(b1Len
,b1
,caseFlags
, (uint32_t*)&b2Len
, b2
);
162 status
= getError(error
);
164 if(status
== U_BUFFER_OVERFLOW_ERROR
){
165 /* we do not have enough room so grow the buffer*/
166 b2
= (char*) uprv_malloc( b2Len
* sizeof(char));
168 status
= U_MEMORY_ALLOCATION_ERROR
;
172 status
= U_ZERO_ERROR
; // reset error
174 punycode_status error
= punycode_encode(b1Len
,b1
,caseFlags
, (uint32_t*)&b2Len
, b2
);
175 status
= getError(error
);
177 if(U_FAILURE(status
)){
181 if(b2Len
< destCapacity
){
182 convertASCIIToUChars(b2
,dest
,b2Len
);
184 status
=U_BUFFER_OVERFLOW_ERROR
;
194 uprv_free(caseFlags
);
199 static int32_t convertFromPuny( const UChar
* src
, int32_t srcLength
,
200 UChar
* dest
, int32_t destCapacity
,
202 char b1Stack
[MAX_LABEL_BUFFER_SIZE
];
206 convertUCharsToASCII(src
, b1
,srcLength
);
208 uint32_t b2Stack
[MAX_LABEL_BUFFER_SIZE
];
209 uint32_t* b2
= b2Stack
;
210 int32_t b2Len
=MAX_LABEL_BUFFER_SIZE
;
211 unsigned char* caseFlags
= NULL
; //(unsigned char*) uprv_malloc(srcLength * sizeof(unsigned char*));
212 punycode_status error
= punycode_decode(srcLength
,b1
,(uint32_t*)&b2Len
,b2
,caseFlags
);
213 status
= getError(error
);
214 if(status
== U_BUFFER_OVERFLOW_ERROR
){
215 b2
= (uint32_t*) uprv_malloc(b2Len
* sizeof(uint32_t));
217 status
= U_MEMORY_ALLOCATION_ERROR
;
220 error
= punycode_decode(srcLength
,b1
,(uint32_t*)&b2Len
,b2
,caseFlags
);
221 status
= getError(error
);
224 if(U_FAILURE(status
)){
228 u_strFromUTF32(dest
,destCapacity
,&destLen
,(UChar32
*)b2
,b2Len
,&status
);
237 uprv_free(caseFlags
);
243 U_CFUNC
int32_t U_EXPORT2
244 idnaref_toASCII(const UChar
* src
, int32_t srcLength
,
245 UChar
* dest
, int32_t destCapacity
,
247 UParseError
* parseError
,
250 if(status
== NULL
|| U_FAILURE(*status
)){
253 if((src
== NULL
) || (srcLength
< -1) || (destCapacity
<0) || (!dest
&& destCapacity
> 0)){
254 *status
= U_ILLEGAL_ARGUMENT_ERROR
;
257 UChar b1Stack
[MAX_LABEL_BUFFER_SIZE
], b2Stack
[MAX_LABEL_BUFFER_SIZE
];
258 //initialize pointers to stack buffers
259 UChar
*b1
= b1Stack
, *b2
= b2Stack
;
260 int32_t b1Len
=0, b2Len
=0,
261 b1Capacity
= MAX_LABEL_BUFFER_SIZE
,
262 b2Capacity
= MAX_LABEL_BUFFER_SIZE
,
266 UBool allowUnassigned
= (UBool
)((options
& IDNAREF_ALLOW_UNASSIGNED
) != 0);
267 UBool useSTD3ASCIIRules
= (UBool
)((options
& IDNAREF_USE_STD3_RULES
) != 0);
269 UBool
* caseFlags
= NULL
;
271 // assume the source contains all ascii codepoints
272 UBool srcIsASCII
= TRUE
;
273 // assume the source contains all LDH codepoints
274 UBool srcIsLDH
= TRUE
;
277 NamePrepTransform
* prep
= TestIDNA::getInstance(*status
);
279 if(U_FAILURE(*status
)){
284 srcLength
= u_strlen(src
);
286 if(srcLength
> b1Capacity
){
287 b1
= (UChar
*) uprv_malloc(srcLength
* U_SIZEOF_UCHAR
);
289 *status
= U_MEMORY_ALLOCATION_ERROR
;
292 b1Capacity
= srcLength
;
295 for( j
=0;j
<srcLength
;j
++){
299 b1
[b1Len
++] = src
[j
];
303 b1Len
= prep
->process(src
,srcLength
,b1
, b1Capacity
,allowUnassigned
,parseError
,*status
);
305 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
306 // redo processing of string
307 /* we do not have enough room so grow the buffer*/
311 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
313 *status
= U_MEMORY_ALLOCATION_ERROR
;
317 *status
= U_ZERO_ERROR
; // reset error
319 b1Len
= prep
->process(src
,srcLength
,b1
, b1Len
,allowUnassigned
, parseError
, *status
);
322 if(U_FAILURE(*status
)){
327 *status
= U_IDNA_ZERO_LENGTH_LABEL_ERROR
;
333 for( j
=0;j
<b1Len
;j
++){
334 if(b1
[j
] > 0x7F){// check if output of usprep_prepare is all ASCII
336 }else if(prep
->isLDHChar(b1
[j
])==FALSE
){ // if the char is in ASCII range verify that it is an LDH character{
341 if(useSTD3ASCIIRules
== TRUE
){
343 if( srcIsLDH
== FALSE
/* source contains some non-LDH characters */
344 || b1
[0] == HYPHEN
|| b1
[b1Len
-1] == HYPHEN
){
345 *status
= U_IDNA_STD3_ASCII_RULES_ERROR
;
350 if(b1Len
<= destCapacity
){
351 uprv_memmove(dest
, b1
, b1Len
* U_SIZEOF_UCHAR
);
358 // step 5 : verify the sequence does not begin with ACE prefix
359 if(!startsWithPrefix(b1
,b1Len
)){
361 //step 6: encode the sequence with punycode
362 //caseFlags = (UBool*) uprv_malloc(b1Len * sizeof(UBool));
364 b2Len
= convertToPuny(b1
,b1Len
, b2
,b2Capacity
,*status
);
365 //b2Len = u_strToPunycode(b2,b2Capacity,b1,b1Len, caseFlags, status);
366 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
367 // redo processing of string
368 /* we do not have enough room so grow the buffer*/
369 b2
= (UChar
*) uprv_malloc(b2Len
* U_SIZEOF_UCHAR
);
371 *status
= U_MEMORY_ALLOCATION_ERROR
;
375 *status
= U_ZERO_ERROR
; // reset error
377 b2Len
= convertToPuny(b1
, b1Len
, b2
, b2Len
, *status
);
378 //b2Len = u_strToPunycode(b2,b2Len,b1,b1Len, caseFlags, status);
382 if(U_FAILURE(*status
)){
385 reqLength
= b2Len
+ACE_PREFIX_LENGTH
;
387 if(reqLength
> destCapacity
){
388 *status
= U_BUFFER_OVERFLOW_ERROR
;
391 //Step 7: prepend the ACE prefix
392 uprv_memcpy(dest
,ACE_PREFIX
,ACE_PREFIX_LENGTH
* U_SIZEOF_UCHAR
);
393 //Step 6: copy the contents in b2 into dest
394 uprv_memcpy(dest
+ACE_PREFIX_LENGTH
, b2
, b2Len
* U_SIZEOF_UCHAR
);
397 *status
= U_IDNA_ACE_PREFIX_ERROR
;
402 if(reqLength
> MAX_LABEL_LENGTH
){
403 *status
= U_IDNA_LABEL_TOO_LONG_ERROR
;
413 uprv_free(caseFlags
);
417 return u_terminateUChars(dest
, destCapacity
, reqLength
, status
);
421 U_CFUNC
int32_t U_EXPORT2
422 idnaref_toUnicode(const UChar
* src
, int32_t srcLength
,
423 UChar
* dest
, int32_t destCapacity
,
425 UParseError
* parseError
,
428 if(status
== NULL
|| U_FAILURE(*status
)){
431 if((src
== NULL
) || (srcLength
< -1) || (destCapacity
<0) || (!dest
&& destCapacity
> 0)){
432 *status
= U_ILLEGAL_ARGUMENT_ERROR
;
438 UChar b1Stack
[MAX_LABEL_BUFFER_SIZE
], b2Stack
[MAX_LABEL_BUFFER_SIZE
], b3Stack
[MAX_LABEL_BUFFER_SIZE
];
440 //initialize pointers to stack buffers
441 UChar
*b1
= b1Stack
, *b2
= b2Stack
, *b1Prime
=NULL
, *b3
=b3Stack
;
442 int32_t b1Len
, b2Len
, b1PrimeLen
, b3Len
,
443 b1Capacity
= MAX_LABEL_BUFFER_SIZE
,
444 b2Capacity
= MAX_LABEL_BUFFER_SIZE
,
445 b3Capacity
= MAX_LABEL_BUFFER_SIZE
,
447 // UParseError parseError;
449 NamePrepTransform
* prep
= TestIDNA::getInstance(*status
);
451 UBool
* caseFlags
= NULL
;
454 UBool allowUnassigned
= (UBool
)((options
& IDNAREF_ALLOW_UNASSIGNED
) != 0);
455 UBool useSTD3ASCIIRules
= (UBool
)((options
& IDNAREF_USE_STD3_RULES
) != 0);
457 UBool srcIsASCII
= TRUE
;
458 UBool srcIsLDH
= TRUE
;
461 if(U_FAILURE(*status
)){
464 // step 1: find out if all the codepoints in src are ASCII
467 for(;src
[srcLength
]!=0;){
468 if(src
[srcLength
]> 0x7f){
470 }if(prep
->isLDHChar(src
[srcLength
])==FALSE
){
471 // here we do not assemble surrogates
472 // since we know that LDH code points
473 // are in the ASCII range only
480 for(int32_t j
=0; j
<srcLength
; j
++){
483 }else if(prep
->isLDHChar(src
[j
])==FALSE
){
484 // here we do not assemble surrogates
485 // since we know that LDH code points
486 // are in the ASCII range only
493 if(srcIsASCII
== FALSE
){
494 // step 2: process the string
495 b1Len
= prep
->process(src
,srcLength
,b1
,b1Capacity
,allowUnassigned
, parseError
, *status
);
496 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
497 // redo processing of string
498 /* we do not have enough room so grow the buffer*/
499 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
501 *status
= U_MEMORY_ALLOCATION_ERROR
;
505 *status
= U_ZERO_ERROR
; // reset error
507 b1Len
= prep
->process(src
,srcLength
,b1
, b1Len
,allowUnassigned
, parseError
, *status
);
510 if(U_FAILURE(*status
)){
515 // copy everything to b1
516 if(srcLength
< b1Capacity
){
517 uprv_memmove(b1
,src
, srcLength
* U_SIZEOF_UCHAR
);
519 /* we do not have enough room so grow the buffer*/
520 b1
= (UChar
*) uprv_malloc(srcLength
* U_SIZEOF_UCHAR
);
522 *status
= U_MEMORY_ALLOCATION_ERROR
;
525 uprv_memmove(b1
,src
, srcLength
* U_SIZEOF_UCHAR
);
529 //step 3: verify ACE Prefix
530 if(startsWithPrefix(src
,srcLength
)){
532 //step 4: Remove the ACE Prefix
533 b1Prime
= b1
+ ACE_PREFIX_LENGTH
;
534 b1PrimeLen
= b1Len
- ACE_PREFIX_LENGTH
;
536 //step 5: Decode using punycode
537 b2Len
= convertFromPuny(b1Prime
,b1PrimeLen
, b2
, b2Capacity
, *status
);
538 //b2Len = u_strFromPunycode(b2, b2Capacity,b1Prime,b1PrimeLen, caseFlags, status);
540 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
541 // redo processing of string
542 /* we do not have enough room so grow the buffer*/
543 b2
= (UChar
*) uprv_malloc(b2Len
* U_SIZEOF_UCHAR
);
545 *status
= U_MEMORY_ALLOCATION_ERROR
;
549 *status
= U_ZERO_ERROR
; // reset error
551 b2Len
= convertFromPuny(b1Prime
,b1PrimeLen
, b2
, b2Len
, *status
);
552 //b2Len = u_strFromPunycode(b2, b2Len,b1Prime,b1PrimeLen,caseFlags, status);
556 //step 6:Apply toASCII
557 b3Len
= idnaref_toASCII(b2
,b2Len
,b3
,b3Capacity
,options
,parseError
, status
);
559 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
560 // redo processing of string
561 /* we do not have enough room so grow the buffer*/
562 b3
= (UChar
*) uprv_malloc(b3Len
* U_SIZEOF_UCHAR
);
564 *status
= U_MEMORY_ALLOCATION_ERROR
;
568 *status
= U_ZERO_ERROR
; // reset error
570 b3Len
= idnaref_toASCII(b2
,b2Len
,b3
,b3Len
, options
, parseError
, status
);
574 if(U_FAILURE(*status
)){
579 if(compareCaseInsensitiveASCII(b1
, b1Len
, b3
, b3Len
) !=0){
580 *status
= U_IDNA_VERIFICATION_ERROR
;
584 //step 8: return output of step 5
586 if(b2Len
<= destCapacity
) {
587 uprv_memmove(dest
, b2
, b2Len
* U_SIZEOF_UCHAR
);
590 // verify that STD3 ASCII rules are satisfied
591 if(useSTD3ASCIIRules
== TRUE
){
592 if( srcIsLDH
== FALSE
/* source contains some non-LDH characters */
593 || src
[0] == HYPHEN
|| src
[srcLength
-1] == HYPHEN
){
594 *status
= U_IDNA_STD3_ASCII_RULES_ERROR
;
596 /* populate the parseError struct */
598 // failPos is always set the index of failure
599 uprv_syntaxError(src
,failPos
, srcLength
,parseError
);
600 }else if(src
[0] == HYPHEN
){
601 // fail position is 0
602 uprv_syntaxError(src
,0,srcLength
,parseError
);
604 // the last index in the source is always length-1
605 uprv_syntaxError(src
, (srcLength
>0) ? srcLength
-1 : srcLength
, srcLength
,parseError
);
611 //copy the source to destination
612 if(srcLength
<= destCapacity
){
613 uprv_memmove(dest
,src
,srcLength
* U_SIZEOF_UCHAR
);
615 reqLength
= srcLength
;
626 uprv_free(caseFlags
);
630 return u_terminateUChars(dest
, destCapacity
, reqLength
, status
);
635 getNextSeparator(UChar
*src
,int32_t srcLength
,NamePrepTransform
* prep
,
643 *limit
= src
+ i
; // point to null
647 if(prep
->isLabelSeparator(src
[i
],*status
)){
648 *limit
= src
+ (i
+1); // go past the delimiter
655 for(i
=0;i
<srcLength
;i
++){
656 if(prep
->isLabelSeparator(src
[i
],*status
)){
657 *limit
= src
+ (i
+1); // go past the delimiter
661 // we have not found the delimiter
663 *limit
= src
+srcLength
;
670 U_CFUNC
int32_t U_EXPORT2
671 idnaref_IDNToASCII( const UChar
* src
, int32_t srcLength
,
672 UChar
* dest
, int32_t destCapacity
,
674 UParseError
* parseError
,
677 if(status
== NULL
|| U_FAILURE(*status
)){
680 if((src
== NULL
) || (srcLength
< -1) || (destCapacity
<0) || (!dest
&& destCapacity
> 0)){
681 *status
= U_ILLEGAL_ARGUMENT_ERROR
;
685 int32_t reqLength
= 0;
686 // UParseError parseError;
688 NamePrepTransform
* prep
= TestIDNA::getInstance(*status
);
690 //initialize pointers to stack buffers
691 UChar b1Stack
[MAX_LABEL_BUFFER_SIZE
];
693 int32_t b1Len
, labelLen
;
694 UChar
* delimiter
= (UChar
*)src
;
695 UChar
* labelStart
= (UChar
*)src
;
696 int32_t remainingLen
= srcLength
;
697 int32_t b1Capacity
= MAX_LABEL_BUFFER_SIZE
;
700 // UBool allowUnassigned = (UBool)((options & IDNAREF_ALLOW_UNASSIGNED) != 0);
701 // UBool useSTD3ASCIIRules = (UBool)((options & IDNAREF_USE_STD3_RULES) != 0);
704 if(U_FAILURE(*status
)){
716 labelLen
= getNextSeparator(labelStart
, -1, prep
, &delimiter
, &done
, status
);
718 if(!(labelLen
==0 && done
)){// make sure this is not a root label separator.
720 b1Len
= idnaref_toASCII(labelStart
, labelLen
, b1
, b1Capacity
,
721 options
, parseError
, status
);
723 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
724 // redo processing of string
725 /* we do not have enough room so grow the buffer*/
726 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
728 *status
= U_MEMORY_ALLOCATION_ERROR
;
732 *status
= U_ZERO_ERROR
; // reset error
734 b1Len
= idnaref_toASCII(labelStart
, labelLen
, b1
, b1Len
,
735 options
, parseError
, status
);
740 if(U_FAILURE(*status
)){
743 int32_t tempLen
= (reqLength
+ b1Len
);
745 if( tempLen
< destCapacity
){
746 uprv_memmove(dest
+reqLength
, b1
, b1Len
* U_SIZEOF_UCHAR
);
751 // add the label separator
753 if(reqLength
< destCapacity
){
754 dest
[reqLength
] = FULL_STOP
;
759 labelStart
= delimiter
;
764 if(delimiter
== src
+srcLength
){
768 labelLen
= getNextSeparator(labelStart
, remainingLen
, prep
, &delimiter
, &done
, status
);
770 b1Len
= idnaref_toASCII(labelStart
, labelLen
, b1
, b1Capacity
,
771 options
,parseError
, status
);
773 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
774 // redo processing of string
775 /* we do not have enough room so grow the buffer*/
776 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
778 *status
= U_MEMORY_ALLOCATION_ERROR
;
782 *status
= U_ZERO_ERROR
; // reset error
784 b1Len
= idnaref_toASCII(labelStart
, labelLen
, b1
, b1Len
,
785 options
, parseError
, status
);
789 if(U_FAILURE(*status
)){
792 int32_t tempLen
= (reqLength
+ b1Len
);
794 if( tempLen
< destCapacity
){
795 uprv_memmove(dest
+reqLength
, b1
, b1Len
* U_SIZEOF_UCHAR
);
800 // add the label separator
802 if(reqLength
< destCapacity
){
803 dest
[reqLength
] = FULL_STOP
;
808 labelStart
= delimiter
;
809 remainingLen
= srcLength
- (delimiter
- src
);
822 return u_terminateUChars(dest
, destCapacity
, reqLength
, status
);
825 U_CFUNC
int32_t U_EXPORT2
826 idnaref_IDNToUnicode( const UChar
* src
, int32_t srcLength
,
827 UChar
* dest
, int32_t destCapacity
,
829 UParseError
* parseError
,
832 if(status
== NULL
|| U_FAILURE(*status
)){
835 if((src
== NULL
) || (srcLength
< -1) || (destCapacity
<0) || (!dest
&& destCapacity
> 0)){
836 *status
= U_ILLEGAL_ARGUMENT_ERROR
;
840 int32_t reqLength
= 0;
844 NamePrepTransform
* prep
= TestIDNA::getInstance(*status
);
846 //initialize pointers to stack buffers
847 UChar b1Stack
[MAX_LABEL_BUFFER_SIZE
];
849 int32_t b1Len
, labelLen
;
850 UChar
* delimiter
= (UChar
*)src
;
851 UChar
* labelStart
= (UChar
*)src
;
852 int32_t remainingLen
= srcLength
;
853 int32_t b1Capacity
= MAX_LABEL_BUFFER_SIZE
;
856 // UBool allowUnassigned = (UBool)((options & IDNAREF_ALLOW_UNASSIGNED) != 0);
857 // UBool useSTD3ASCIIRules = (UBool)((options & IDNAREF_USE_STD3_RULES) != 0);
859 if(U_FAILURE(*status
)){
870 labelLen
= getNextSeparator(labelStart
, -1, prep
, &delimiter
, &done
, status
);
872 if(labelLen
==0 && done
==FALSE
){
873 *status
= U_IDNA_ZERO_LENGTH_LABEL_ERROR
;
875 b1Len
= idnaref_toUnicode(labelStart
, labelLen
, b1
, b1Capacity
,
876 options
, parseError
, status
);
878 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
879 // redo processing of string
880 /* we do not have enough room so grow the buffer*/
881 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
883 *status
= U_MEMORY_ALLOCATION_ERROR
;
887 *status
= U_ZERO_ERROR
; // reset error
889 b1Len
= idnaref_toUnicode( labelStart
, labelLen
, b1
, b1Len
,
890 options
, parseError
, status
);
894 if(U_FAILURE(*status
)){
897 int32_t tempLen
= (reqLength
+ b1Len
);
899 if( tempLen
< destCapacity
){
900 uprv_memmove(dest
+reqLength
, b1
, b1Len
* U_SIZEOF_UCHAR
);
904 // add the label separator
906 if(reqLength
< destCapacity
){
907 dest
[reqLength
] = FULL_STOP
;
912 labelStart
= delimiter
;
917 if(delimiter
== src
+srcLength
){
921 labelLen
= getNextSeparator(labelStart
, remainingLen
, prep
, &delimiter
, &done
, status
);
923 if(labelLen
==0 && done
==FALSE
){
924 *status
= U_IDNA_ZERO_LENGTH_LABEL_ERROR
;
927 b1Len
= idnaref_toUnicode( labelStart
,labelLen
, b1
, b1Capacity
,
928 options
, parseError
, status
);
930 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
931 // redo processing of string
932 /* we do not have enough room so grow the buffer*/
933 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
935 *status
= U_MEMORY_ALLOCATION_ERROR
;
939 *status
= U_ZERO_ERROR
; // reset error
941 b1Len
= idnaref_toUnicode( labelStart
, labelLen
, b1
, b1Len
,
942 options
, parseError
, status
);
946 if(U_FAILURE(*status
)){
949 int32_t tempLen
= (reqLength
+ b1Len
);
951 if( tempLen
< destCapacity
){
952 uprv_memmove(dest
+reqLength
, b1
, b1Len
* U_SIZEOF_UCHAR
);
957 // add the label separator
959 if(reqLength
< destCapacity
){
960 dest
[reqLength
] = FULL_STOP
;
965 labelStart
= delimiter
;
966 remainingLen
= srcLength
- (delimiter
- src
);
978 return u_terminateUChars(dest
, destCapacity
, reqLength
, status
);
981 U_CFUNC
int32_t U_EXPORT2
982 idnaref_compare( const UChar
*s1
, int32_t length1
,
983 const UChar
*s2
, int32_t length2
,
987 if(status
== NULL
|| U_FAILURE(*status
)){
991 UChar b1Stack
[MAX_IDN_BUFFER_SIZE
], b2Stack
[MAX_IDN_BUFFER_SIZE
];
992 UChar
*b1
= b1Stack
, *b2
= b2Stack
;
993 int32_t b1Len
, b2Len
, b1Capacity
= MAX_IDN_BUFFER_SIZE
, b2Capacity
= MAX_IDN_BUFFER_SIZE
;
996 UParseError parseError
;
998 b1Len
= idnaref_IDNToASCII(s1
, length1
, b1
, b1Capacity
, options
, &parseError
, status
);
999 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
1000 // redo processing of string
1001 /* we do not have enough room so grow the buffer*/
1002 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
1004 *status
= U_MEMORY_ALLOCATION_ERROR
;
1008 *status
= U_ZERO_ERROR
; // reset error
1010 b1Len
= idnaref_IDNToASCII(s1
,length1
,b1
,b1Len
, options
, &parseError
, status
);
1014 b2Len
= idnaref_IDNToASCII(s2
,length2
,b2
,b2Capacity
,options
, &parseError
, status
);
1015 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
1016 // redo processing of string
1017 /* we do not have enough room so grow the buffer*/
1018 b2
= (UChar
*) uprv_malloc(b2Len
* U_SIZEOF_UCHAR
);
1020 *status
= U_MEMORY_ALLOCATION_ERROR
;
1024 *status
= U_ZERO_ERROR
; // reset error
1026 b2Len
= idnaref_IDNToASCII(s2
,length2
,b2
,b2Len
,options
, &parseError
, status
);
1029 // when toASCII is applied all label separators are replaced with FULL_STOP
1030 result
= compareCaseInsensitiveASCII(b1
,b1Len
,b2
,b2Len
);
#endif /* #if !UCONFIG_NO_IDNA && !UCONFIG_NO_TRANSLITERATION */