1 /* a_mbstr.c */ 2 /* Written by Dr Stephen N Henson (steve@openssl.org) for the OpenSSL 3 * project 1999. 4 */ 5 /* ==================================================================== 6 * Copyright (c) 1999 The OpenSSL Project. All rights reserved. 7 * 8 * Redistribution and use in source and binary forms, with or without 9 * modification, are permitted provided that the following conditions 10 * are met: 11 * 12 * 1. Redistributions of source code must retain the above copyright 13 * notice, this list of conditions and the following disclaimer. 14 * 15 * 2. Redistributions in binary form must reproduce the above copyright 16 * notice, this list of conditions and the following disclaimer in 17 * the documentation and/or other materials provided with the 18 * distribution. 19 * 20 * 3. All advertising materials mentioning features or use of this 21 * software must display the following acknowledgment: 22 * "This product includes software developed by the OpenSSL Project 23 * for use in the OpenSSL Toolkit. (http://www.OpenSSL.org/)" 24 * 25 * 4. The names "OpenSSL Toolkit" and "OpenSSL Project" must not be used to 26 * endorse or promote products derived from this software without 27 * prior written permission. For written permission, please contact 28 * licensing@OpenSSL.org. 29 * 30 * 5. Products derived from this software may not be called "OpenSSL" 31 * nor may "OpenSSL" appear in their names without prior written 32 * permission of the OpenSSL Project. 33 * 34 * 6. Redistributions of any form whatsoever must retain the following 35 * acknowledgment: 36 * "This product includes software developed by the OpenSSL Project 37 * for use in the OpenSSL Toolkit (http://www.OpenSSL.org/)" 38 * 39 * THIS SOFTWARE IS PROVIDED BY THE OpenSSL PROJECT ``AS IS'' AND ANY 40 * EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 41 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 42 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE OpenSSL PROJECT OR 43 * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 44 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 45 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; 46 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 47 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, 48 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 49 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED 50 * OF THE POSSIBILITY OF SUCH DAMAGE. 51 * ==================================================================== 52 * 53 * This product includes cryptographic software written by Eric Young 54 * (eay@cryptsoft.com). This product includes software written by Tim 55 * Hudson (tjh@cryptsoft.com). 56 * 57 */ 58 59 #include <stdio.h> 60 #include <ctype.h> 61 #include "cryptlib.h" 62 #include <openssl/asn1.h> 63 64 static int traverse_string(const unsigned char *p, int len, int inform, 65 int (*rfunc)(unsigned long value, void *in), void *arg); 66 static int in_utf8(unsigned long value, void *arg); 67 static int out_utf8(unsigned long value, void *arg); 68 static int type_str(unsigned long value, void *arg); 69 static int cpy_asc(unsigned long value, void *arg); 70 static int cpy_bmp(unsigned long value, void *arg); 71 static int cpy_univ(unsigned long value, void *arg); 72 static int cpy_utf8(unsigned long value, void *arg); 73 static int is_printable(unsigned long value); 74 75 /* These functions take a string in UTF8, ASCII or multibyte form and 76 * a mask of permissible ASN1 string types. It then works out the minimal 77 * type (using the order Printable < IA5 < T61 < BMP < Universal < UTF8) 78 * and creates a string of the correct type with the supplied data. 79 * Yes this is horrible: it has to be :-( 80 * The 'ncopy' form checks minimum and maximum size limits too. 81 */ 82 83 int ASN1_mbstring_copy(ASN1_STRING **out, const unsigned char *in, int len, 84 int inform, unsigned long mask) 85 { 86 return ASN1_mbstring_ncopy(out, in, len, inform, mask, 0, 0); 87 } 88 89 int ASN1_mbstring_ncopy(ASN1_STRING **out, const unsigned char *in, int len, 90 int inform, unsigned long mask, 91 long minsize, long maxsize) 92 { 93 int str_type; 94 int ret; 95 char free_out; 96 int outform, outlen = 0; 97 ASN1_STRING *dest; 98 unsigned char *p; 99 int nchar; 100 char strbuf[32]; 101 int (*cpyfunc)(unsigned long,void *) = NULL; 102 if(len == -1) len = strlen((const char *)in); 103 if(!mask) mask = DIRSTRING_TYPE; 104 105 /* First do a string check and work out the number of characters */ 106 switch(inform) { 107 108 case MBSTRING_BMP: 109 if(len & 1) { 110 ASN1err(ASN1_F_ASN1_MBSTRING_NCOPY, 111 ASN1_R_INVALID_BMPSTRING_LENGTH); 112 return -1; 113 } 114 nchar = len >> 1; 115 break; 116 117 case MBSTRING_UNIV: 118 if(len & 3) { 119 ASN1err(ASN1_F_ASN1_MBSTRING_NCOPY, 120 ASN1_R_INVALID_UNIVERSALSTRING_LENGTH); 121 return -1; 122 } 123 nchar = len >> 2; 124 break; 125 126 case MBSTRING_UTF8: 127 nchar = 0; 128 /* This counts the characters and does utf8 syntax checking */ 129 ret = traverse_string(in, len, MBSTRING_UTF8, in_utf8, &nchar); 130 if(ret < 0) { 131 ASN1err(ASN1_F_ASN1_MBSTRING_NCOPY, 132 ASN1_R_INVALID_UTF8STRING); 133 return -1; 134 } 135 break; 136 137 case MBSTRING_ASC: 138 nchar = len; 139 break; 140 141 default: 142 ASN1err(ASN1_F_ASN1_MBSTRING_NCOPY, ASN1_R_UNKNOWN_FORMAT); 143 return -1; 144 } 145 146 if((minsize > 0) && (nchar < minsize)) { 147 ASN1err(ASN1_F_ASN1_MBSTRING_NCOPY, ASN1_R_STRING_TOO_SHORT); 148 BIO_snprintf(strbuf, sizeof strbuf, "%ld", minsize); 149 ERR_add_error_data(2, "minsize=", strbuf); 150 return -1; 151 } 152 153 if((maxsize > 0) && (nchar > maxsize)) { 154 ASN1err(ASN1_F_ASN1_MBSTRING_NCOPY, ASN1_R_STRING_TOO_LONG); 155 BIO_snprintf(strbuf, sizeof strbuf, "%ld", maxsize); 156 ERR_add_error_data(2, "maxsize=", strbuf); 157 return -1; 158 } 159 160 /* Now work out minimal type (if any) */ 161 if(traverse_string(in, len, inform, type_str, &mask) < 0) { 162 ASN1err(ASN1_F_ASN1_MBSTRING_NCOPY, ASN1_R_ILLEGAL_CHARACTERS); 163 return -1; 164 } 165 166 167 /* Now work out output format and string type */ 168 outform = MBSTRING_ASC; 169 if(mask & B_ASN1_PRINTABLESTRING) str_type = V_ASN1_PRINTABLESTRING; 170 else if(mask & B_ASN1_IA5STRING) str_type = V_ASN1_IA5STRING; 171 else if(mask & B_ASN1_T61STRING) str_type = V_ASN1_T61STRING; 172 else if(mask & B_ASN1_BMPSTRING) { 173 str_type = V_ASN1_BMPSTRING; 174 outform = MBSTRING_BMP; 175 } else if(mask & B_ASN1_UNIVERSALSTRING) { 176 str_type = V_ASN1_UNIVERSALSTRING; 177 outform = MBSTRING_UNIV; 178 } else { 179 str_type = V_ASN1_UTF8STRING; 180 outform = MBSTRING_UTF8; 181 } 182 if(!out) return str_type; 183 if(*out) { 184 free_out = 0; 185 dest = *out; 186 if(dest->data) { 187 dest->length = 0; 188 OPENSSL_free(dest->data); 189 dest->data = NULL; 190 } 191 dest->type = str_type; 192 } else { 193 free_out = 1; 194 dest = ASN1_STRING_type_new(str_type); 195 if(!dest) { 196 ASN1err(ASN1_F_ASN1_MBSTRING_NCOPY, 197 ERR_R_MALLOC_FAILURE); 198 return -1; 199 } 200 *out = dest; 201 } 202 /* If both the same type just copy across */ 203 if(inform == outform) { 204 if(!ASN1_STRING_set(dest, in, len)) { 205 ASN1err(ASN1_F_ASN1_MBSTRING_NCOPY,ERR_R_MALLOC_FAILURE); 206 return -1; 207 } 208 return str_type; 209 } 210 211 /* Work out how much space the destination will need */ 212 switch(outform) { 213 case MBSTRING_ASC: 214 outlen = nchar; 215 cpyfunc = cpy_asc; 216 break; 217 218 case MBSTRING_BMP: 219 outlen = nchar << 1; 220 cpyfunc = cpy_bmp; 221 break; 222 223 case MBSTRING_UNIV: 224 outlen = nchar << 2; 225 cpyfunc = cpy_univ; 226 break; 227 228 case MBSTRING_UTF8: 229 outlen = 0; 230 traverse_string(in, len, inform, out_utf8, &outlen); 231 cpyfunc = cpy_utf8; 232 break; 233 } 234 if(!(p = OPENSSL_malloc(outlen + 1))) { 235 if(free_out) ASN1_STRING_free(dest); 236 ASN1err(ASN1_F_ASN1_MBSTRING_NCOPY,ERR_R_MALLOC_FAILURE); 237 return -1; 238 } 239 dest->length = outlen; 240 dest->data = p; 241 p[outlen] = 0; 242 traverse_string(in, len, inform, cpyfunc, &p); 243 return str_type; 244 } 245 246 /* This function traverses a string and passes the value of each character 247 * to an optional function along with a void * argument. 248 */ 249 250 static int traverse_string(const unsigned char *p, int len, int inform, 251 int (*rfunc)(unsigned long value, void *in), void *arg) 252 { 253 unsigned long value; 254 int ret; 255 while(len) { 256 if(inform == MBSTRING_ASC) { 257 value = *p++; 258 len--; 259 } else if(inform == MBSTRING_BMP) { 260 value = *p++ << 8; 261 value |= *p++; 262 len -= 2; 263 } else if(inform == MBSTRING_UNIV) { 264 value = ((unsigned long)*p++) << 24; 265 value |= ((unsigned long)*p++) << 16; 266 value |= *p++ << 8; 267 value |= *p++; 268 len -= 4; 269 } else { 270 ret = UTF8_getc(p, len, &value); 271 if(ret < 0) return -1; 272 len -= ret; 273 p += ret; 274 } 275 if(rfunc) { 276 ret = rfunc(value, arg); 277 if(ret <= 0) return ret; 278 } 279 } 280 return 1; 281 } 282 283 /* Various utility functions for traverse_string */ 284 285 /* Just count number of characters */ 286 287 static int in_utf8(unsigned long value, void *arg) 288 { 289 int *nchar; 290 nchar = arg; 291 (*nchar)++; 292 return 1; 293 } 294 295 /* Determine size of output as a UTF8 String */ 296 297 static int out_utf8(unsigned long value, void *arg) 298 { 299 int *outlen; 300 outlen = arg; 301 *outlen += UTF8_putc(NULL, -1, value); 302 return 1; 303 } 304 305 /* Determine the "type" of a string: check each character against a 306 * supplied "mask". 307 */ 308 309 static int type_str(unsigned long value, void *arg) 310 { 311 unsigned long types; 312 types = *((unsigned long *)arg); 313 if((types & B_ASN1_PRINTABLESTRING) && !is_printable(value)) 314 types &= ~B_ASN1_PRINTABLESTRING; 315 if((types & B_ASN1_IA5STRING) && (value > 127)) 316 types &= ~B_ASN1_IA5STRING; 317 if((types & B_ASN1_T61STRING) && (value > 0xff)) 318 types &= ~B_ASN1_T61STRING; 319 if((types & B_ASN1_BMPSTRING) && (value > 0xffff)) 320 types &= ~B_ASN1_BMPSTRING; 321 if(!types) return -1; 322 *((unsigned long *)arg) = types; 323 return 1; 324 } 325 326 /* Copy one byte per character ASCII like strings */ 327 328 static int cpy_asc(unsigned long value, void *arg) 329 { 330 unsigned char **p, *q; 331 p = arg; 332 q = *p; 333 *q = (unsigned char) value; 334 (*p)++; 335 return 1; 336 } 337 338 /* Copy two byte per character BMPStrings */ 339 340 static int cpy_bmp(unsigned long value, void *arg) 341 { 342 unsigned char **p, *q; 343 p = arg; 344 q = *p; 345 *q++ = (unsigned char) ((value >> 8) & 0xff); 346 *q = (unsigned char) (value & 0xff); 347 *p += 2; 348 return 1; 349 } 350 351 /* Copy four byte per character UniversalStrings */ 352 353 static int cpy_univ(unsigned long value, void *arg) 354 { 355 unsigned char **p, *q; 356 p = arg; 357 q = *p; 358 *q++ = (unsigned char) ((value >> 24) & 0xff); 359 *q++ = (unsigned char) ((value >> 16) & 0xff); 360 *q++ = (unsigned char) ((value >> 8) & 0xff); 361 *q = (unsigned char) (value & 0xff); 362 *p += 4; 363 return 1; 364 } 365 366 /* Copy to a UTF8String */ 367 368 static int cpy_utf8(unsigned long value, void *arg) 369 { 370 unsigned char **p; 371 int ret; 372 p = arg; 373 /* We already know there is enough room so pass 0xff as the length */ 374 ret = UTF8_putc(*p, 0xff, value); 375 *p += ret; 376 return 1; 377 } 378 379 /* Return 1 if the character is permitted in a PrintableString */ 380 static int is_printable(unsigned long value) 381 { 382 int ch; 383 if(value > 0x7f) return 0; 384 ch = (int) value; 385 /* Note: we can't use 'isalnum' because certain accented 386 * characters may count as alphanumeric in some environments. 387 */ 388 #ifndef CHARSET_EBCDIC 389 if((ch >= 'a') && (ch <= 'z')) return 1; 390 if((ch >= 'A') && (ch <= 'Z')) return 1; 391 if((ch >= '0') && (ch <= '9')) return 1; 392 if ((ch == ' ') || strchr("'()+,-./:=?", ch)) return 1; 393 #else /*CHARSET_EBCDIC*/ 394 if((ch >= os_toascii['a']) && (ch <= os_toascii['z'])) return 1; 395 if((ch >= os_toascii['A']) && (ch <= os_toascii['Z'])) return 1; 396 if((ch >= os_toascii['0']) && (ch <= os_toascii['9'])) return 1; 397 if ((ch == os_toascii[' ']) || strchr("'()+,-./:=?", os_toebcdic[ch])) return 1; 398 #endif /*CHARSET_EBCDIC*/ 399 return 0; 400 }