2 *******************************************************************************
4 * Copyright (C) 2003-2007, International Business Machines
5 * Corporation and others. All Rights Reserved.
7 *******************************************************************************
8 * file name: idnaref.cpp
10 * tab size: 8 (not used)
13 * created on: 2003feb1
14 * created by: Ram Viswanadha
17 #include "unicode/utypes.h"
19 #if !UCONFIG_NO_IDNA && !UCONFIG_NO_TRANSLITERATION
28 #include "unicode/ustring.h"
30 /* The official IDNA ACE prefix is "xn--" */
31 static const UChar ACE_PREFIX
[] ={ 0x0078,0x006E,0x002d,0x002d } ;
32 #define ACE_PREFIX_LENGTH 4
34 #define MAX_LABEL_LENGTH 63
36 /* The Max length of the labels should not be more than 64 */
37 #define MAX_LABEL_BUFFER_SIZE 100
38 #define MAX_IDN_BUFFER_SIZE 300
40 #define CAPITAL_A 0x0041
41 #define CAPITAL_Z 0x005A
42 #define LOWER_CASE_DELTA 0x0020
43 #define FULL_STOP 0x002E
47 startsWithPrefix(const UChar
* src
, int32_t srcLength
){
48 UBool startsWithPrefix
= TRUE
;
50 if(srcLength
< ACE_PREFIX_LENGTH
){
54 for(int8_t i
=0; i
< ACE_PREFIX_LENGTH
; i
++){
55 if(u_tolower(src
[i
]) != ACE_PREFIX
[i
]){
56 startsWithPrefix
= FALSE
;
59 return startsWithPrefix
;
63 toASCIILower(UChar ch
){
64 if(CAPITAL_A
<= ch
&& ch
<= CAPITAL_Z
){
65 return ch
+ LOWER_CASE_DELTA
;
71 compareCaseInsensitiveASCII(const UChar
* s1
, int32_t s1Len
,
72 const UChar
* s2
, int32_t s2Len
){
74 return (s1Len
> s2Len
) ? s1Len
: s2Len
;
79 for(int32_t i
=0;/* no condition */;i
++) {
80 /* If we reach the ends of both strings then they match */
88 /* Case-insensitive comparison */
90 rc
=(int32_t)toASCIILower(c1
)-(int32_t)toASCIILower(c2
);
99 static UErrorCode
getError(enum punycode_status status
){
101 case punycode_success
:
103 case punycode_bad_input
: /* Input is invalid. */
104 return U_INVALID_CHAR_FOUND
;
105 case punycode_big_output
: /* Output would exceed the space provided. */
106 return U_BUFFER_OVERFLOW_ERROR
;
107 case punycode_overflow
: /* Input requires wider integers to process. */
108 return U_INDEX_OUTOFBOUNDS_ERROR
;
110 return U_INTERNAL_PROGRAM_ERROR
;
114 static inline int32_t convertASCIIToUChars(const char* src
,UChar
* dest
, int32_t length
){
116 for(i
=0;i
<length
;i
++){
121 static inline int32_t convertUCharsToASCII(const UChar
* src
,char* dest
, int32_t length
){
123 for(i
=0;i
<length
;i
++){
124 dest
[i
] = (char)src
[i
];
128 // wrapper around the reference Punycode implementation
129 static int32_t convertToPuny(const UChar
* src
, int32_t srcLength
,
130 UChar
* dest
, int32_t destCapacity
,
132 uint32_t b1Stack
[MAX_LABEL_BUFFER_SIZE
];
133 int32_t b1Len
= 0, b1Capacity
= MAX_LABEL_BUFFER_SIZE
;
134 uint32_t* b1
= b1Stack
;
135 char b2Stack
[MAX_LABEL_BUFFER_SIZE
];
137 int32_t b2Len
=MAX_LABEL_BUFFER_SIZE
;
138 punycode_status error
;
139 unsigned char* caseFlags
= NULL
;
141 u_strToUTF32((UChar32
*)b1
,b1Capacity
,&b1Len
,src
,srcLength
,&status
);
142 if(status
== U_BUFFER_OVERFLOW_ERROR
){
143 // redo processing of string
144 /* we do not have enough room so grow the buffer*/
145 b1
= (uint32_t*) uprv_malloc(b1Len
* sizeof(uint32_t));
147 status
= U_MEMORY_ALLOCATION_ERROR
;
151 status
= U_ZERO_ERROR
; // reset error
153 u_strToUTF32((UChar32
*)b1
,b1Len
,&b1Len
,src
,srcLength
,&status
);
155 if(U_FAILURE(status
)){
159 //caseFlags = (unsigned char*) uprv_malloc(b1Len *sizeof(unsigned char));
161 error
= punycode_encode(b1Len
,b1
,caseFlags
, (uint32_t*)&b2Len
, b2
);
162 status
= getError(error
);
164 if(status
== U_BUFFER_OVERFLOW_ERROR
){
165 /* we do not have enough room so grow the buffer*/
166 b2
= (char*) uprv_malloc( b2Len
* sizeof(char));
168 status
= U_MEMORY_ALLOCATION_ERROR
;
172 status
= U_ZERO_ERROR
; // reset error
174 punycode_status error
= punycode_encode(b1Len
,b1
,caseFlags
, (uint32_t*)&b2Len
, b2
);
175 status
= getError(error
);
177 if(U_FAILURE(status
)){
181 if(b2Len
< destCapacity
){
182 convertASCIIToUChars(b2
,dest
,b2Len
);
184 status
=U_BUFFER_OVERFLOW_ERROR
;
194 uprv_free(caseFlags
);
199 static int32_t convertFromPuny( const UChar
* src
, int32_t srcLength
,
200 UChar
* dest
, int32_t destCapacity
,
202 char b1Stack
[MAX_LABEL_BUFFER_SIZE
];
206 convertUCharsToASCII(src
, b1
,srcLength
);
208 uint32_t b2Stack
[MAX_LABEL_BUFFER_SIZE
];
209 uint32_t* b2
= b2Stack
;
210 int32_t b2Len
=MAX_LABEL_BUFFER_SIZE
;
211 unsigned char* caseFlags
= NULL
; //(unsigned char*) uprv_malloc(srcLength * sizeof(unsigned char*));
212 punycode_status error
= punycode_decode(srcLength
,b1
,(uint32_t*)&b2Len
,b2
,caseFlags
);
213 status
= getError(error
);
214 if(status
== U_BUFFER_OVERFLOW_ERROR
){
215 b2
= (uint32_t*) uprv_malloc(b2Len
* sizeof(uint32_t));
217 status
= U_MEMORY_ALLOCATION_ERROR
;
220 error
= punycode_decode(srcLength
,b1
,(uint32_t*)&b2Len
,b2
,caseFlags
);
221 status
= getError(error
);
224 if(U_FAILURE(status
)){
228 u_strFromUTF32(dest
,destCapacity
,&destLen
,(UChar32
*)b2
,b2Len
,&status
);
237 uprv_free(caseFlags
);
243 U_CFUNC
int32_t U_EXPORT2
244 idnaref_toASCII(const UChar
* src
, int32_t srcLength
,
245 UChar
* dest
, int32_t destCapacity
,
247 UParseError
* parseError
,
250 if(status
== NULL
|| U_FAILURE(*status
)){
253 if((src
== NULL
) || (srcLength
< -1) || (destCapacity
<0) || (!dest
&& destCapacity
> 0)){
254 *status
= U_ILLEGAL_ARGUMENT_ERROR
;
257 UChar b1Stack
[MAX_LABEL_BUFFER_SIZE
], b2Stack
[MAX_LABEL_BUFFER_SIZE
];
258 //initialize pointers to stack buffers
259 UChar
*b1
= b1Stack
, *b2
= b2Stack
;
260 int32_t b1Len
=0, b2Len
=0,
261 b1Capacity
= MAX_LABEL_BUFFER_SIZE
,
262 b2Capacity
= MAX_LABEL_BUFFER_SIZE
,
266 UBool allowUnassigned
= (UBool
)((options
& IDNAREF_ALLOW_UNASSIGNED
) != 0);
267 UBool useSTD3ASCIIRules
= (UBool
)((options
& IDNAREF_USE_STD3_RULES
) != 0);
269 UBool
* caseFlags
= NULL
;
271 // assume the source contains all ascii codepoints
272 UBool srcIsASCII
= TRUE
;
273 // assume the source contains all LDH codepoints
274 UBool srcIsLDH
= TRUE
;
278 srcLength
= u_strlen(src
);
282 for( j
=0;j
<srcLength
;j
++){
286 b1
[b1Len
++] = src
[j
];
289 NamePrepTransform
* prep
= TestIDNA::getInstance(*status
);
291 if(U_FAILURE(*status
)){
295 b1Len
= prep
->process(src
,srcLength
,b1
, b1Capacity
,allowUnassigned
,parseError
,*status
);
297 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
298 // redo processing of string
299 /* we do not have enough room so grow the buffer*/
300 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
302 *status
= U_MEMORY_ALLOCATION_ERROR
;
306 *status
= U_ZERO_ERROR
; // reset error
308 b1Len
= prep
->process(src
,srcLength
,b1
, b1Len
,allowUnassigned
, parseError
, *status
);
311 if(U_FAILURE(*status
)){
316 *status
= U_IDNA_ZERO_LENGTH_LABEL_ERROR
;
322 for( j
=0;j
<b1Len
;j
++){
323 if(b1
[j
] > 0x7F){// check if output of usprep_prepare is all ASCII
325 }else if(prep
->isLDHChar(b1
[j
])==FALSE
){ // if the char is in ASCII range verify that it is an LDH character{
330 if(useSTD3ASCIIRules
== TRUE
){
332 if( srcIsLDH
== FALSE
/* source contains some non-LDH characters */
333 || b1
[0] == HYPHEN
|| b1
[b1Len
-1] == HYPHEN
){
334 *status
= U_IDNA_STD3_ASCII_RULES_ERROR
;
339 if(b1Len
<= destCapacity
){
340 uprv_memmove(dest
, b1
, b1Len
* U_SIZEOF_UCHAR
);
347 // step 5 : verify the sequence does not begin with ACE prefix
348 if(!startsWithPrefix(b1
,b1Len
)){
350 //step 6: encode the sequence with punycode
351 //caseFlags = (UBool*) uprv_malloc(b1Len * sizeof(UBool));
353 b2Len
= convertToPuny(b1
,b1Len
, b2
,b2Capacity
,*status
);
354 //b2Len = u_strToPunycode(b2,b2Capacity,b1,b1Len, caseFlags, status);
355 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
356 // redo processing of string
357 /* we do not have enough room so grow the buffer*/
358 b2
= (UChar
*) uprv_malloc(b2Len
* U_SIZEOF_UCHAR
);
360 *status
= U_MEMORY_ALLOCATION_ERROR
;
364 *status
= U_ZERO_ERROR
; // reset error
366 b2Len
= convertToPuny(b1
, b1Len
, b2
, b2Len
, *status
);
367 //b2Len = u_strToPunycode(b2,b2Len,b1,b1Len, caseFlags, status);
371 if(U_FAILURE(*status
)){
374 reqLength
= b2Len
+ACE_PREFIX_LENGTH
;
376 if(reqLength
> destCapacity
){
377 *status
= U_BUFFER_OVERFLOW_ERROR
;
380 //Step 7: prepend the ACE prefix
381 uprv_memcpy(dest
,ACE_PREFIX
,ACE_PREFIX_LENGTH
* U_SIZEOF_UCHAR
);
382 //Step 6: copy the contents in b2 into dest
383 uprv_memcpy(dest
+ACE_PREFIX_LENGTH
, b2
, b2Len
* U_SIZEOF_UCHAR
);
386 *status
= U_IDNA_ACE_PREFIX_ERROR
;
391 if(reqLength
> MAX_LABEL_LENGTH
){
392 *status
= U_IDNA_LABEL_TOO_LONG_ERROR
;
402 uprv_free(caseFlags
);
406 return u_terminateUChars(dest
, destCapacity
, reqLength
, status
);
410 U_CFUNC
int32_t U_EXPORT2
411 idnaref_toUnicode(const UChar
* src
, int32_t srcLength
,
412 UChar
* dest
, int32_t destCapacity
,
414 UParseError
* parseError
,
417 if(status
== NULL
|| U_FAILURE(*status
)){
420 if((src
== NULL
) || (srcLength
< -1) || (destCapacity
<0) || (!dest
&& destCapacity
> 0)){
421 *status
= U_ILLEGAL_ARGUMENT_ERROR
;
427 UChar b1Stack
[MAX_LABEL_BUFFER_SIZE
], b2Stack
[MAX_LABEL_BUFFER_SIZE
], b3Stack
[MAX_LABEL_BUFFER_SIZE
];
429 //initialize pointers to stack buffers
430 UChar
*b1
= b1Stack
, *b2
= b2Stack
, *b1Prime
=NULL
, *b3
=b3Stack
;
431 int32_t b1Len
, b2Len
, b1PrimeLen
, b3Len
,
432 b1Capacity
= MAX_LABEL_BUFFER_SIZE
,
433 b2Capacity
= MAX_LABEL_BUFFER_SIZE
,
434 b3Capacity
= MAX_LABEL_BUFFER_SIZE
,
436 // UParseError parseError;
438 NamePrepTransform
* prep
= TestIDNA::getInstance(*status
);
440 UBool
* caseFlags
= NULL
;
443 UBool allowUnassigned
= (UBool
)((options
& IDNAREF_ALLOW_UNASSIGNED
) != 0);
444 UBool useSTD3ASCIIRules
= (UBool
)((options
& IDNAREF_USE_STD3_RULES
) != 0);
446 UBool srcIsASCII
= TRUE
;
447 UBool srcIsLDH
= TRUE
;
450 if(U_FAILURE(*status
)){
453 // step 1: find out if all the codepoints in src are ASCII
456 for(;src
[srcLength
]!=0;){
457 if(src
[srcLength
]> 0x7f){
459 }if(prep
->isLDHChar(src
[srcLength
])==FALSE
){
460 // here we do not assemble surrogates
461 // since we know that LDH code points
462 // are in the ASCII range only
469 for(int32_t j
=0; j
<srcLength
; j
++){
472 }else if(prep
->isLDHChar(src
[j
])==FALSE
){
473 // here we do not assemble surrogates
474 // since we know that LDH code points
475 // are in the ASCII range only
482 if(srcIsASCII
== FALSE
){
483 // step 2: process the string
484 b1Len
= prep
->process(src
,srcLength
,b1
,b1Capacity
,allowUnassigned
, parseError
, *status
);
485 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
486 // redo processing of string
487 /* we do not have enough room so grow the buffer*/
488 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
490 *status
= U_MEMORY_ALLOCATION_ERROR
;
494 *status
= U_ZERO_ERROR
; // reset error
496 b1Len
= prep
->process(src
,srcLength
,b1
, b1Len
,allowUnassigned
, parseError
, *status
);
499 if(U_FAILURE(*status
)){
504 // copy everything to b1
505 if(srcLength
< b1Capacity
){
506 uprv_memmove(b1
,src
, srcLength
* U_SIZEOF_UCHAR
);
508 /* we do not have enough room so grow the buffer*/
509 b1
= (UChar
*) uprv_malloc(srcLength
* U_SIZEOF_UCHAR
);
511 *status
= U_MEMORY_ALLOCATION_ERROR
;
514 uprv_memmove(b1
,src
, srcLength
* U_SIZEOF_UCHAR
);
518 //step 3: verify ACE Prefix
519 if(startsWithPrefix(src
,srcLength
)){
521 //step 4: Remove the ACE Prefix
522 b1Prime
= b1
+ ACE_PREFIX_LENGTH
;
523 b1PrimeLen
= b1Len
- ACE_PREFIX_LENGTH
;
525 //step 5: Decode using punycode
526 b2Len
= convertFromPuny(b1Prime
,b1PrimeLen
, b2
, b2Capacity
, *status
);
527 //b2Len = u_strFromPunycode(b2, b2Capacity,b1Prime,b1PrimeLen, caseFlags, status);
529 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
530 // redo processing of string
531 /* we do not have enough room so grow the buffer*/
532 b2
= (UChar
*) uprv_malloc(b2Len
* U_SIZEOF_UCHAR
);
534 *status
= U_MEMORY_ALLOCATION_ERROR
;
538 *status
= U_ZERO_ERROR
; // reset error
540 b2Len
= convertFromPuny(b1Prime
,b1PrimeLen
, b2
, b2Len
, *status
);
541 //b2Len = u_strFromPunycode(b2, b2Len,b1Prime,b1PrimeLen,caseFlags, status);
545 //step 6:Apply toASCII
546 b3Len
= idnaref_toASCII(b2
,b2Len
,b3
,b3Capacity
,options
,parseError
, status
);
548 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
549 // redo processing of string
550 /* we do not have enough room so grow the buffer*/
551 b3
= (UChar
*) uprv_malloc(b3Len
* U_SIZEOF_UCHAR
);
553 *status
= U_MEMORY_ALLOCATION_ERROR
;
557 *status
= U_ZERO_ERROR
; // reset error
559 b3Len
= idnaref_toASCII(b2
,b2Len
,b3
,b3Len
, options
, parseError
, status
);
563 if(U_FAILURE(*status
)){
568 if(compareCaseInsensitiveASCII(b1
, b1Len
, b3
, b3Len
) !=0){
569 *status
= U_IDNA_VERIFICATION_ERROR
;
573 //step 8: return output of step 5
575 if(b2Len
<= destCapacity
) {
576 uprv_memmove(dest
, b2
, b2Len
* U_SIZEOF_UCHAR
);
579 // verify that STD3 ASCII rules are satisfied
580 if(useSTD3ASCIIRules
== TRUE
){
581 if( srcIsLDH
== FALSE
/* source contains some non-LDH characters */
582 || src
[0] == HYPHEN
|| src
[srcLength
-1] == HYPHEN
){
583 *status
= U_IDNA_STD3_ASCII_RULES_ERROR
;
585 /* populate the parseError struct */
587 // failPos is always set the index of failure
588 uprv_syntaxError(src
,failPos
, srcLength
,parseError
);
589 }else if(src
[0] == HYPHEN
){
590 // fail position is 0
591 uprv_syntaxError(src
,0,srcLength
,parseError
);
593 // the last index in the source is always length-1
594 uprv_syntaxError(src
, (srcLength
>0) ? srcLength
-1 : srcLength
, srcLength
,parseError
);
600 //copy the source to destination
601 if(srcLength
<= destCapacity
){
602 uprv_memmove(dest
,src
,srcLength
* U_SIZEOF_UCHAR
);
604 reqLength
= srcLength
;
615 uprv_free(caseFlags
);
617 // The RFC states that
619 // ToUnicode never fails. If any step fails, then the original input
620 // is returned immediately in that step.
622 // So if any step fails lets copy source to destination
623 if(U_FAILURE(*status
)){
624 //copy the source to destination
625 if(dest
&& srcLength
<= destCapacity
){
626 if(srcLength
== -1) {
627 uprv_memmove(dest
,src
,u_strlen(src
)* U_SIZEOF_UCHAR
);
629 uprv_memmove(dest
,src
,srcLength
* U_SIZEOF_UCHAR
);
632 reqLength
= srcLength
;
633 *status
= U_ZERO_ERROR
;
635 return u_terminateUChars(dest
, destCapacity
, reqLength
, status
);
640 getNextSeparator(UChar
*src
,int32_t srcLength
,NamePrepTransform
* prep
,
648 *limit
= src
+ i
; // point to null
652 if(prep
->isLabelSeparator(src
[i
],*status
)){
653 *limit
= src
+ (i
+1); // go past the delimiter
660 for(i
=0;i
<srcLength
;i
++){
661 if(prep
->isLabelSeparator(src
[i
],*status
)){
662 *limit
= src
+ (i
+1); // go past the delimiter
666 // we have not found the delimiter
668 *limit
= src
+srcLength
;
675 U_CFUNC
int32_t U_EXPORT2
676 idnaref_IDNToASCII( const UChar
* src
, int32_t srcLength
,
677 UChar
* dest
, int32_t destCapacity
,
679 UParseError
* parseError
,
682 if(status
== NULL
|| U_FAILURE(*status
)){
685 if((src
== NULL
) || (srcLength
< -1) || (destCapacity
<0) || (!dest
&& destCapacity
> 0)){
686 *status
= U_ILLEGAL_ARGUMENT_ERROR
;
690 int32_t reqLength
= 0;
691 // UParseError parseError;
693 NamePrepTransform
* prep
= TestIDNA::getInstance(*status
);
695 //initialize pointers to stack buffers
696 UChar b1Stack
[MAX_LABEL_BUFFER_SIZE
];
698 int32_t b1Len
, labelLen
;
699 UChar
* delimiter
= (UChar
*)src
;
700 UChar
* labelStart
= (UChar
*)src
;
701 int32_t remainingLen
= srcLength
;
702 int32_t b1Capacity
= MAX_LABEL_BUFFER_SIZE
;
705 // UBool allowUnassigned = (UBool)((options & IDNAREF_ALLOW_UNASSIGNED) != 0);
706 // UBool useSTD3ASCIIRules = (UBool)((options & IDNAREF_USE_STD3_RULES) != 0);
709 if(U_FAILURE(*status
)){
721 labelLen
= getNextSeparator(labelStart
, -1, prep
, &delimiter
, &done
, status
);
723 if(!(labelLen
==0 && done
)){// make sure this is not a root label separator.
725 b1Len
= idnaref_toASCII(labelStart
, labelLen
, b1
, b1Capacity
,
726 options
, parseError
, status
);
728 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
729 // redo processing of string
730 /* we do not have enough room so grow the buffer*/
731 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
733 *status
= U_MEMORY_ALLOCATION_ERROR
;
737 *status
= U_ZERO_ERROR
; // reset error
739 b1Len
= idnaref_toASCII(labelStart
, labelLen
, b1
, b1Len
,
740 options
, parseError
, status
);
745 if(U_FAILURE(*status
)){
748 int32_t tempLen
= (reqLength
+ b1Len
);
750 if( tempLen
< destCapacity
){
751 uprv_memmove(dest
+reqLength
, b1
, b1Len
* U_SIZEOF_UCHAR
);
756 // add the label separator
758 if(reqLength
< destCapacity
){
759 dest
[reqLength
] = FULL_STOP
;
764 labelStart
= delimiter
;
769 if(delimiter
== src
+srcLength
){
773 labelLen
= getNextSeparator(labelStart
, remainingLen
, prep
, &delimiter
, &done
, status
);
775 b1Len
= idnaref_toASCII(labelStart
, labelLen
, b1
, b1Capacity
,
776 options
,parseError
, status
);
778 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
779 // redo processing of string
780 /* we do not have enough room so grow the buffer*/
781 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
783 *status
= U_MEMORY_ALLOCATION_ERROR
;
787 *status
= U_ZERO_ERROR
; // reset error
789 b1Len
= idnaref_toASCII(labelStart
, labelLen
, b1
, b1Len
,
790 options
, parseError
, status
);
794 if(U_FAILURE(*status
)){
797 int32_t tempLen
= (reqLength
+ b1Len
);
799 if( tempLen
< destCapacity
){
800 uprv_memmove(dest
+reqLength
, b1
, b1Len
* U_SIZEOF_UCHAR
);
805 // add the label separator
807 if(reqLength
< destCapacity
){
808 dest
[reqLength
] = FULL_STOP
;
813 labelStart
= delimiter
;
814 remainingLen
= srcLength
- (delimiter
- src
);
827 return u_terminateUChars(dest
, destCapacity
, reqLength
, status
);
830 U_CFUNC
int32_t U_EXPORT2
831 idnaref_IDNToUnicode( const UChar
* src
, int32_t srcLength
,
832 UChar
* dest
, int32_t destCapacity
,
834 UParseError
* parseError
,
837 if(status
== NULL
|| U_FAILURE(*status
)){
840 if((src
== NULL
) || (srcLength
< -1) || (destCapacity
<0) || (!dest
&& destCapacity
> 0)){
841 *status
= U_ILLEGAL_ARGUMENT_ERROR
;
845 int32_t reqLength
= 0;
849 NamePrepTransform
* prep
= TestIDNA::getInstance(*status
);
851 //initialize pointers to stack buffers
852 UChar b1Stack
[MAX_LABEL_BUFFER_SIZE
];
854 int32_t b1Len
, labelLen
;
855 UChar
* delimiter
= (UChar
*)src
;
856 UChar
* labelStart
= (UChar
*)src
;
857 int32_t remainingLen
= srcLength
;
858 int32_t b1Capacity
= MAX_LABEL_BUFFER_SIZE
;
861 // UBool allowUnassigned = (UBool)((options & IDNAREF_ALLOW_UNASSIGNED) != 0);
862 // UBool useSTD3ASCIIRules = (UBool)((options & IDNAREF_USE_STD3_RULES) != 0);
864 if(U_FAILURE(*status
)){
875 labelLen
= getNextSeparator(labelStart
, -1, prep
, &delimiter
, &done
, status
);
877 if(labelLen
==0 && done
==FALSE
){
878 *status
= U_IDNA_ZERO_LENGTH_LABEL_ERROR
;
880 b1Len
= idnaref_toUnicode(labelStart
, labelLen
, b1
, b1Capacity
,
881 options
, parseError
, status
);
883 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
884 // redo processing of string
885 /* we do not have enough room so grow the buffer*/
886 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
888 *status
= U_MEMORY_ALLOCATION_ERROR
;
892 *status
= U_ZERO_ERROR
; // reset error
894 b1Len
= idnaref_toUnicode( labelStart
, labelLen
, b1
, b1Len
,
895 options
, parseError
, status
);
899 if(U_FAILURE(*status
)){
902 int32_t tempLen
= (reqLength
+ b1Len
);
904 if( tempLen
< destCapacity
){
905 uprv_memmove(dest
+reqLength
, b1
, b1Len
* U_SIZEOF_UCHAR
);
909 // add the label separator
911 if(reqLength
< destCapacity
){
912 dest
[reqLength
] = FULL_STOP
;
917 labelStart
= delimiter
;
922 if(delimiter
== src
+srcLength
){
926 labelLen
= getNextSeparator(labelStart
, remainingLen
, prep
, &delimiter
, &done
, status
);
928 if(labelLen
==0 && done
==FALSE
){
929 *status
= U_IDNA_ZERO_LENGTH_LABEL_ERROR
;
932 b1Len
= idnaref_toUnicode( labelStart
,labelLen
, b1
, b1Capacity
,
933 options
, parseError
, status
);
935 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
936 // redo processing of string
937 /* we do not have enough room so grow the buffer*/
938 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
940 *status
= U_MEMORY_ALLOCATION_ERROR
;
944 *status
= U_ZERO_ERROR
; // reset error
946 b1Len
= idnaref_toUnicode( labelStart
, labelLen
, b1
, b1Len
,
947 options
, parseError
, status
);
951 if(U_FAILURE(*status
)){
954 int32_t tempLen
= (reqLength
+ b1Len
);
956 if( tempLen
< destCapacity
){
957 uprv_memmove(dest
+reqLength
, b1
, b1Len
* U_SIZEOF_UCHAR
);
962 // add the label separator
964 if(reqLength
< destCapacity
){
965 dest
[reqLength
] = FULL_STOP
;
970 labelStart
= delimiter
;
971 remainingLen
= srcLength
- (delimiter
- src
);
983 return u_terminateUChars(dest
, destCapacity
, reqLength
, status
);
986 U_CFUNC
int32_t U_EXPORT2
987 idnaref_compare( const UChar
*s1
, int32_t length1
,
988 const UChar
*s2
, int32_t length2
,
992 if(status
== NULL
|| U_FAILURE(*status
)){
996 UChar b1Stack
[MAX_IDN_BUFFER_SIZE
], b2Stack
[MAX_IDN_BUFFER_SIZE
];
997 UChar
*b1
= b1Stack
, *b2
= b2Stack
;
998 int32_t b1Len
, b2Len
, b1Capacity
= MAX_IDN_BUFFER_SIZE
, b2Capacity
= MAX_IDN_BUFFER_SIZE
;
1001 UParseError parseError
;
1003 b1Len
= idnaref_IDNToASCII(s1
, length1
, b1
, b1Capacity
, options
, &parseError
, status
);
1004 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
1005 // redo processing of string
1006 /* we do not have enough room so grow the buffer*/
1007 b1
= (UChar
*) uprv_malloc(b1Len
* U_SIZEOF_UCHAR
);
1009 *status
= U_MEMORY_ALLOCATION_ERROR
;
1013 *status
= U_ZERO_ERROR
; // reset error
1015 b1Len
= idnaref_IDNToASCII(s1
,length1
,b1
,b1Len
, options
, &parseError
, status
);
1019 b2Len
= idnaref_IDNToASCII(s2
,length2
,b2
,b2Capacity
,options
, &parseError
, status
);
1020 if(*status
== U_BUFFER_OVERFLOW_ERROR
){
1021 // redo processing of string
1022 /* we do not have enough room so grow the buffer*/
1023 b2
= (UChar
*) uprv_malloc(b2Len
* U_SIZEOF_UCHAR
);
1025 *status
= U_MEMORY_ALLOCATION_ERROR
;
1029 *status
= U_ZERO_ERROR
; // reset error
1031 b2Len
= idnaref_IDNToASCII(s2
,length2
,b2
,b2Len
,options
, &parseError
, status
);
1034 // when toASCII is applied all label separators are replaced with FULL_STOP
1035 result
= compareCaseInsensitiveASCII(b1
,b1Len
,b2
,b2Len
);
1048 #endif /* #if !UCONFIG_NO_IDNA && !UCONFIG_NO_TRANSLITERATION */