X-Git-Url: https://git.sur5r.net/?a=blobdiff_plain;f=libraries%2Fliblunicode%2Fucstr.c;h=6d947737164344690ce63af5c131966f9186b72b;hb=4ebed09d81ec07faeb78b5da8946624cc825257f;hp=53b1ed349f01ee6d00acae2f925f6dd13828d9ed;hpb=808cb504cecb44124b16e7b9284145f176e97985;p=openldap diff --git a/libraries/liblunicode/ucstr.c b/libraries/liblunicode/ucstr.c index 53b1ed349f..6d94773716 100644 --- a/libraries/liblunicode/ucstr.c +++ b/libraries/liblunicode/ucstr.c @@ -1,16 +1,26 @@ -/* - * Copyright 2000-2003 The OpenLDAP Foundation - * COPYING RESTRICTIONS APPLY. See COPYRIGHT File in top level directory - * of this package for details. +/* $OpenLDAP$ */ +/* This work is part of OpenLDAP Software . + * + * Copyright 1998-2005 The OpenLDAP Foundation. + * All rights reserved. + * + * Redistribution and use in source and binary forms, with or without + * modification, are permitted only as authorized by the OpenLDAP + * Public License. + * + * A copy of this license is available in file LICENSE in the + * top-level directory of the distribution or, alternatively, at + * . */ #include "portable.h" +#include #include #include #include -#include +#include #include #include @@ -100,12 +110,13 @@ struct berval * UTF8bvnormalize( { int i, j, len, clen, outpos, ucsoutlen, outsize, last; char *out, *outtmp, *s; - unsigned long *ucs, *p, *ucsout; + ac_uint4 *ucs, *p, *ucsout; + + static unsigned char mask[] = { + 0, 0x7f, 0x1f, 0x0f, 0x07, 0x03, 0x01 }; unsigned casefold = flags & LDAP_UTF8_CASEFOLD; unsigned approx = flags & LDAP_UTF8_APPROX; - static unsigned char mask[] = { - 0, 0x7f, 0x1f, 0x0f, 0x07, 0x03, 0x01 }; if ( bv == NULL ) { return NULL; @@ -118,9 +129,9 @@ struct berval * UTF8bvnormalize( return ber_dupbv_x( newbv, bv, ctx ); } - /* FIXME: Should first check to see if string is already in - * proper normalized form. This is almost as time consuming - * as the normalization though. + /* Should first check to see if string is already in proper + * normalized form. This is almost as time consuming as + * the normalization though. */ /* finish off everything up to character before first non-ascii */ @@ -137,7 +148,7 @@ struct berval * UTF8bvnormalize( out[outpos++] = TOLOWER( s[i-1] ); } if ( i == len ) { - out[outpos++] = TOLOWER( s[len - 1] ); + out[outpos++] = TOLOWER( s[len-1] ); out[outpos] = '\0'; return ber_str2bv( out, outpos, 0, newbv); } @@ -176,7 +187,7 @@ struct berval * UTF8bvnormalize( /* convert character before first non-ascii to ucs-4 */ if ( i > 0 ) { - *p = casefold ? TOLOWER( s[i - 1] ) : s[i - 1]; + *p = casefold ? TOLOWER( s[i-1] ) : s[i-1]; p++; } @@ -211,7 +222,7 @@ struct berval * UTF8bvnormalize( *p = uctolower( *p ); } p++; - } + } /* normalize ucs of length p - ucs */ uccompatdecomp( ucs, p - ucs, &ucsout, &ucsoutlen, ctx ); if ( approx ) { @@ -250,20 +261,33 @@ struct berval * UTF8bvnormalize( last = i; + /* Allocate more space in out if necessary */ + if (len - i >= outsize - outpos) { + outsize += 1 + ((len - i) - (outsize - outpos)); + outtmp = (char *) realloc(out, outsize); + if (outtmp == NULL) { + free(out); + free(ucs); + return NULL; + } + out = outtmp; + } + /* s[i] is ascii */ /* finish off everything up to char before next non-ascii */ for ( i++; (i < len) && LDAP_UTF8_ISASCII(s + i); i++ ) { out[outpos++] = casefold ? TOLOWER( s[i-1] ) : s[i-1]; } if ( i == len ) { - out[outpos++] = casefold ? TOLOWER( s[len - 1] ) : s[len - 1]; + out[outpos++] = casefold ? TOLOWER( s[len-1] ) : s[len-1]; break; } /* convert character before next non-ascii to ucs-4 */ - *ucs = casefold ? TOLOWER( s[i - 1] ) : s[i - 1]; + *ucs = casefold ? TOLOWER( s[i-1] ) : s[i-1]; p = ucs + 1; - } + } + free( ucs ); out[outpos] = '\0'; return ber_str2bv( out, outpos, 0, newbv ); @@ -279,13 +303,15 @@ int UTF8bvnormcmp( { int i, l1, l2, len, ulen, res = 0; char *s1, *s2, *done; - unsigned long *ucs, *ucsout1, *ucsout2; + ac_uint4 *ucs, *ucsout1, *ucsout2; + unsigned casefold = flags & LDAP_UTF8_CASEFOLD; unsigned norm1 = flags & LDAP_UTF8_ARG1NFC; unsigned norm2 = flags & LDAP_UTF8_ARG2NFC; if (bv1 == NULL) { return bv2 == NULL ? 0 : -1; + } else if (bv2 == NULL) { return 1; } @@ -306,7 +332,7 @@ int UTF8bvnormcmp( if (casefold) { char c1 = TOLOWER(*s1); char c2 = TOLOWER(*s2); - res = c1 - c2; + res = c1 - c2; } else { res = *s1 - *s2; } @@ -319,7 +345,8 @@ int UTF8bvnormcmp( break; } } else if (((len < l1) && !LDAP_UTF8_ISASCII(s1)) || - ((len < l2) && !LDAP_UTF8_ISASCII(s2))) { + ((len < l2) && !LDAP_UTF8_ISASCII(s2))) + { break; } return res; @@ -346,10 +373,9 @@ int UTF8bvnormcmp( l2 -= i - 1; } - /* FIXME: Should first check to see if strings are already in + /* Should first check to see if strings are already in * proper normalized form. */ - ucs = malloc( ( ( norm1 || l1 > l2 ) ? l1 : l2 ) * sizeof(*ucs) ); if ( ucs == NULL ) { return l1 > l2 ? 1 : -1; /* what to do??? */ @@ -357,16 +383,16 @@ int UTF8bvnormcmp( /* * XXYYZ: we convert to ucs4 even though -llunicode - * expects ucs2 in an unsigned long + * expects ucs2 in an ac_uint4 */ /* convert and normalize 1st string */ for ( i = 0, ulen = 0; i < l1; i += len, ulen++ ) { - ucs[ulen] = ldap_x_utf8_to_ucs4( s1 + i ); - if ( ucs[ulen] == LDAP_UCS4_INVALID ) { + ucs[ulen] = ldap_x_utf8_to_ucs4( s1 + i ); + if ( ucs[ulen] == LDAP_UCS4_INVALID ) { free( ucs ); - return -1; /* what to do??? */ - } + return -1; /* what to do??? */ + } len = LDAP_UTF8_CHARLEN( s1 + i ); } @@ -384,12 +410,12 @@ int UTF8bvnormcmp( /* convert and normalize 2nd string */ for ( i = 0, ulen = 0; i < l2; i += len, ulen++ ) { - ucs[ulen] = ldap_x_utf8_to_ucs4( s2 + i ); - if ( ucs[ulen] == LDAP_UCS4_INVALID ) { + ucs[ulen] = ldap_x_utf8_to_ucs4( s2 + i ); + if ( ucs[ulen] == LDAP_UCS4_INVALID ) { free( ucsout1 ); free( ucs ); - return 1; /* what to do??? */ - } + return 1; /* what to do??? */ + } len = LDAP_UTF8_CHARLEN( s2 + i ); }