diff options
Diffstat (limited to 'src/lib/libcrypto/asn1/a_utf8.c')
| -rw-r--r-- | src/lib/libcrypto/asn1/a_utf8.c | 144 |
1 files changed, 53 insertions, 91 deletions
diff --git a/src/lib/libcrypto/asn1/a_utf8.c b/src/lib/libcrypto/asn1/a_utf8.c index c224db4c12..f5e4bec7e0 100644 --- a/src/lib/libcrypto/asn1/a_utf8.c +++ b/src/lib/libcrypto/asn1/a_utf8.c | |||
| @@ -59,11 +59,13 @@ | |||
| 59 | #include <stdio.h> | 59 | #include <stdio.h> |
| 60 | #include "cryptlib.h" | 60 | #include "cryptlib.h" |
| 61 | #include <openssl/asn1.h> | 61 | #include <openssl/asn1.h> |
| 62 | #include "asn1_locl.h" | ||
| 62 | 63 | ||
| 63 | 64 | ||
| 64 | /* UTF8 utilities */ | 65 | /* UTF8 utilities */ |
| 65 | 66 | ||
| 66 | /* This parses a UTF8 string one character at a time. It is passed a pointer | 67 | /* |
| 68 | * This parses a UTF8 string one character at a time. It is passed a pointer | ||
| 67 | * to the string and the length of the string. It sets 'value' to the value of | 69 | * to the string and the length of the string. It sets 'value' to the value of |
| 68 | * the current character. It returns the number of characters read or a | 70 | * the current character. It returns the number of characters read or a |
| 69 | * negative error code: | 71 | * negative error code: |
| @@ -88,6 +90,8 @@ UTF8_getc(const unsigned char *str, int len, unsigned long *val) | |||
| 88 | value = *p++ & 0x7f; | 90 | value = *p++ & 0x7f; |
| 89 | ret = 1; | 91 | ret = 1; |
| 90 | } else if ((*p & 0xe0) == 0xc0) { | 92 | } else if ((*p & 0xe0) == 0xc0) { |
| 93 | if (*p < 0xc2) | ||
| 94 | return -2; | ||
| 91 | if (len < 2) | 95 | if (len < 2) |
| 92 | return -1; | 96 | return -1; |
| 93 | if ((p[1] & 0xc0) != 0x80) | 97 | if ((p[1] & 0xc0) != 0x80) |
| @@ -108,8 +112,11 @@ UTF8_getc(const unsigned char *str, int len, unsigned long *val) | |||
| 108 | value |= *p++ & 0x3f; | 112 | value |= *p++ & 0x3f; |
| 109 | if (value < 0x800) | 113 | if (value < 0x800) |
| 110 | return -4; | 114 | return -4; |
| 115 | /* surrogate pair code points are not valid */ | ||
| 116 | if (value >= 0xd800 && value < 0xe000) | ||
| 117 | return -2; | ||
| 111 | ret = 3; | 118 | ret = 3; |
| 112 | } else if ((*p & 0xf8) == 0xf0) { | 119 | } else if ((*p & 0xf8) == 0xf0 && (*p < 0xf5)) { |
| 113 | if (len < 4) | 120 | if (len < 4) |
| 114 | return -1; | 121 | return -1; |
| 115 | if (((p[1] & 0xc0) != 0x80) || | 122 | if (((p[1] & 0xc0) != 0x80) || |
| @@ -122,116 +129,71 @@ UTF8_getc(const unsigned char *str, int len, unsigned long *val) | |||
| 122 | value |= *p++ & 0x3f; | 129 | value |= *p++ & 0x3f; |
| 123 | if (value < 0x10000) | 130 | if (value < 0x10000) |
| 124 | return -4; | 131 | return -4; |
| 132 | if (value > UNICODE_MAX) | ||
| 133 | return -2; | ||
| 125 | ret = 4; | 134 | ret = 4; |
| 126 | } else if ((*p & 0xfc) == 0xf8) { | 135 | } else |
| 127 | if (len < 5) | 136 | return -2; |
| 128 | return -1; | 137 | *val = value; |
| 129 | if (((p[1] & 0xc0) != 0x80) || | ||
| 130 | ((p[2] & 0xc0) != 0x80) || | ||
| 131 | ((p[3] & 0xc0) != 0x80) || | ||
| 132 | ((p[4] & 0xc0) != 0x80)) | ||
| 133 | return -3; | ||
| 134 | value = ((unsigned long)(*p++ & 0x3)) << 24; | ||
| 135 | value |= ((unsigned long)(*p++ & 0x3f)) << 18; | ||
| 136 | value |= ((unsigned long)(*p++ & 0x3f)) << 12; | ||
| 137 | value |= (*p++ & 0x3f) << 6; | ||
| 138 | value |= *p++ & 0x3f; | ||
| 139 | if (value < 0x200000) | ||
| 140 | return -4; | ||
| 141 | ret = 5; | ||
| 142 | } else if ((*p & 0xfe) == 0xfc) { | ||
| 143 | if (len < 6) | ||
| 144 | return -1; | ||
| 145 | if (((p[1] & 0xc0) != 0x80) || | ||
| 146 | ((p[2] & 0xc0) != 0x80) || | ||
| 147 | ((p[3] & 0xc0) != 0x80) || | ||
| 148 | ((p[4] & 0xc0) != 0x80) || | ||
| 149 | ((p[5] & 0xc0) != 0x80)) | ||
| 150 | return -3; | ||
| 151 | value = ((unsigned long)(*p++ & 0x1)) << 30; | ||
| 152 | value |= ((unsigned long)(*p++ & 0x3f)) << 24; | ||
| 153 | value |= ((unsigned long)(*p++ & 0x3f)) << 18; | ||
| 154 | value |= ((unsigned long)(*p++ & 0x3f)) << 12; | ||
| 155 | value |= (*p++ & 0x3f) << 6; | ||
| 156 | value |= *p++ & 0x3f; | ||
| 157 | if (value < 0x4000000) | ||
| 158 | return -4; | ||
| 159 | ret = 6; | ||
| 160 | } else return -2; | ||
| 161 | *val = value; | ||
| 162 | return ret; | 138 | return ret; |
| 163 | } | 139 | } |
| 164 | 140 | ||
| 165 | /* This takes a character 'value' and writes the UTF8 encoded value in | 141 | /* This takes a Unicode code point 'value' and writes its UTF-8 encoded form |
| 166 | * 'str' where 'str' is a buffer containing 'len' characters. Returns | 142 | * in 'str' where 'str' is a buffer of at least length 'len'. If 'str' |
| 167 | * the number of characters written or -1 if 'len' is too small. 'str' can | 143 | * is NULL, then nothing is written and just the return code is determined. |
| 168 | * be set to NULL in which case it just returns the number of characters. | 144 | |
| 169 | * It will need at most 6 characters. | 145 | * Returns less than zero on error: |
| 146 | * -1 if 'str' is not NULL and 'len' is too small | ||
| 147 | * -2 if 'value' is an invalid character (surrogate or out-of-range) | ||
| 148 | * | ||
| 149 | * Otherwise, returns the number of bytes in 'value's encoded form | ||
| 150 | * (i.e., the number of bytes written to 'str' when it's not NULL). | ||
| 151 | * | ||
| 152 | * It will need at most 4 characters. | ||
| 170 | */ | 153 | */ |
| 171 | 154 | ||
| 172 | int | 155 | int |
| 173 | UTF8_putc(unsigned char *str, int len, unsigned long value) | 156 | UTF8_putc(unsigned char *str, int len, unsigned long value) |
| 174 | { | 157 | { |
| 175 | if (!str) | ||
| 176 | len = 6; /* Maximum we will need */ | ||
| 177 | else if (len <= 0) | ||
| 178 | return -1; | ||
| 179 | if (value < 0x80) { | 158 | if (value < 0x80) { |
| 180 | if (str) | 159 | if (str != NULL) { |
| 181 | *str = (unsigned char)value; | 160 | if (len < 1) |
| 161 | return -1; | ||
| 162 | str[0] = (unsigned char)value; | ||
| 163 | } | ||
| 182 | return 1; | 164 | return 1; |
| 183 | } | 165 | } |
| 184 | if (value < 0x800) { | 166 | if (value < 0x800) { |
| 185 | if (len < 2) | 167 | if (str != NULL) { |
| 186 | return -1; | 168 | if (len < 2) |
| 187 | if (str) { | 169 | return -1; |
| 188 | *str++ = (unsigned char)(((value >> 6) & 0x1f) | 0xc0); | 170 | str[0] = (unsigned char)(((value >> 6) & 0x1f) | 0xc0); |
| 189 | *str = (unsigned char)((value & 0x3f) | 0x80); | 171 | str[1] = (unsigned char)((value & 0x3f) | 0x80); |
| 190 | } | 172 | } |
| 191 | return 2; | 173 | return 2; |
| 192 | } | 174 | } |
| 193 | if (value < 0x10000) { | 175 | if (value < 0x10000) { |
| 194 | if (len < 3) | 176 | if (UNICODE_IS_SURROGATE(value)) |
| 195 | return -1; | 177 | return -2; |
| 196 | if (str) { | 178 | if (str != NULL) { |
| 197 | *str++ = (unsigned char)(((value >> 12) & 0xf) | 0xe0); | 179 | if (len < 3) |
| 198 | *str++ = (unsigned char)(((value >> 6) & 0x3f) | 0x80); | 180 | return -1; |
| 199 | *str = (unsigned char)((value & 0x3f) | 0x80); | 181 | str[0] = (unsigned char)(((value >> 12) & 0xf) | 0xe0); |
| 182 | str[1] = (unsigned char)(((value >> 6) & 0x3f) | 0x80); | ||
| 183 | str[2] = (unsigned char)((value & 0x3f) | 0x80); | ||
| 200 | } | 184 | } |
| 201 | return 3; | 185 | return 3; |
| 202 | } | 186 | } |
| 203 | if (value < 0x200000) { | 187 | if (value <= UNICODE_MAX) { |
| 204 | if (len < 4) | 188 | if (str != NULL) { |
| 205 | return -1; | 189 | if (len < 4) |
| 206 | if (str) { | 190 | return -1; |
| 207 | *str++ = (unsigned char)(((value >> 18) & 0x7) | 0xf0); | 191 | str[0] = (unsigned char)(((value >> 18) & 0x7) | 0xf0); |
| 208 | *str++ = (unsigned char)(((value >> 12) & 0x3f) | 0x80); | 192 | str[1] = (unsigned char)(((value >> 12) & 0x3f) | 0x80); |
| 209 | *str++ = (unsigned char)(((value >> 6) & 0x3f) | 0x80); | 193 | str[2] = (unsigned char)(((value >> 6) & 0x3f) | 0x80); |
| 210 | *str = (unsigned char)((value & 0x3f) | 0x80); | 194 | str[3] = (unsigned char)((value & 0x3f) | 0x80); |
| 211 | } | 195 | } |
| 212 | return 4; | 196 | return 4; |
| 213 | } | 197 | } |
| 214 | if (value < 0x4000000) { | 198 | return -2; |
| 215 | if (len < 5) | ||
| 216 | return -1; | ||
| 217 | if (str) { | ||
| 218 | *str++ = (unsigned char)(((value >> 24) & 0x3) | 0xf8); | ||
| 219 | *str++ = (unsigned char)(((value >> 18) & 0x3f) | 0x80); | ||
| 220 | *str++ = (unsigned char)(((value >> 12) & 0x3f) | 0x80); | ||
| 221 | *str++ = (unsigned char)(((value >> 6) & 0x3f) | 0x80); | ||
| 222 | *str = (unsigned char)((value & 0x3f) | 0x80); | ||
| 223 | } | ||
| 224 | return 5; | ||
| 225 | } | ||
| 226 | if (len < 6) | ||
| 227 | return -1; | ||
| 228 | if (str) { | ||
| 229 | *str++ = (unsigned char)(((value >> 30) & 0x1) | 0xfc); | ||
| 230 | *str++ = (unsigned char)(((value >> 24) & 0x3f) | 0x80); | ||
| 231 | *str++ = (unsigned char)(((value >> 18) & 0x3f) | 0x80); | ||
| 232 | *str++ = (unsigned char)(((value >> 12) & 0x3f) | 0x80); | ||
| 233 | *str++ = (unsigned char)(((value >> 6) & 0x3f) | 0x80); | ||
| 234 | *str = (unsigned char)((value & 0x3f) | 0x80); | ||
| 235 | } | ||
| 236 | return 6; | ||
| 237 | } | 199 | } |
