blob: 4103af3ede16cf4820411e2eeb90c4a2109b4e71 [file] [log] [blame]
/*-
 * Copyright (c) 2003, 2004, 2006 Lev Walkin <vlm@lionet.info>.
 * All rights reserved.
 * Redistribution and modifications are permitted subject to BSD license.
 */
6#include <asn_internal.h>
7#include <UTF8String.h>
8
9/*
10 * UTF8String basic type description.
11 */
Harald Welte41b85d52015-08-31 08:56:53 +020012static const ber_tlv_tag_t asn_DEF_UTF8String_tags[] = {
Harald Welte92c45f32010-06-12 18:59:38 +020013 (ASN_TAG_CLASS_UNIVERSAL | (12 << 2)), /* [UNIVERSAL 12] IMPLICIT ...*/
14 (ASN_TAG_CLASS_UNIVERSAL | (4 << 2)), /* ... OCTET STRING */
15};
16asn_TYPE_descriptor_t asn_DEF_UTF8String = {
17 "UTF8String",
18 "UTF8String",
19 OCTET_STRING_free,
20 UTF8String_print,
21 UTF8String_constraint, /* Check for invalid codes, etc. */
22 OCTET_STRING_decode_ber, /* Implemented in terms of OCTET STRING */
23 OCTET_STRING_encode_der,
24 OCTET_STRING_decode_xer_utf8,
25 OCTET_STRING_encode_xer_utf8,
Harald Welteec0e2172010-07-20 00:03:44 +020026 OCTET_STRING_decode_uper,
27 OCTET_STRING_encode_uper,
Harald Welte41b85d52015-08-31 08:56:53 +020028 OCTET_STRING_decode_aper,
29 OCTET_STRING_encode_aper,
Harald Welte92c45f32010-06-12 18:59:38 +020030 0, /* Use generic outmost tag fetcher */
31 asn_DEF_UTF8String_tags,
32 sizeof(asn_DEF_UTF8String_tags)
33 / sizeof(asn_DEF_UTF8String_tags[0]) - 1,
34 asn_DEF_UTF8String_tags,
35 sizeof(asn_DEF_UTF8String_tags)
36 / sizeof(asn_DEF_UTF8String_tags[0]),
37 0, /* No PER visible constraints */
38 0, 0, /* No members */
39 0 /* No specifics */
40};
41
/*
 * This is the table of length expectations: the number of octets a UTF-8
 * sequence occupies, looked up by a nibble of its first octet.
 *
 * Row 0 is indexed by the high nibble of the first octet:
 *	 1..3	sequence length in octets;
 *	 0	a continuation octet, which may not start a sequence;
 *	-1	consult row 1.
 * Row 1 is only applicable to the long sequences (first octet 0xF0..0xFF)
 * and is indexed by the low nibble of the first octet:
 *	 4..6	sequence length in octets;
 *	-1	the octet may never start a sequence.
 */
static const int UTF8String_ht[2][16] = {
	{ /* High nibble 0x0 .. 0xF */
		/* 0000..0111 */
		1, 1, 1, 1, 1, 1, 1, 1,
		/* 1000..1011(0), 1100..1101(2), 1110(3), 1111(-1) */
		0, 0, 0, 0, 2, 2, 3, -1 },
	{ /* First octet 0xF0 .. 0xFF, low nibble */
		/* 11110000..11110111 */
		4, 4, 4, 4, 4, 4, 4, 4,
		/* 111110xx(5), 1111110x(6), 1111111x(-1) */
		5, 5, 5, 5, 6, 6, -1, -1 }
};
/*
 * Minimal values, indexed by sequence length in octets: a decoded value
 * smaller than UTF8String_mv[n] could have been encoded in fewer than
 * n octets, so an n-octet sequence carrying it is not minimal.
 * Entries 0 and 1 are zero: there is nothing shorter than a single octet.
 */
static const int32_t UTF8String_mv[7] = { 0, 0,
	0x00000080,	/* 2 octets */
	0x00000800,	/* 3 octets */
	0x00010000,	/* 4 octets */
	0x00200000,	/* 5 octets */
	0x04000000	/* 6 octets */
};
64
/*
 * Internal aliases for return codes.
 * All of them are negative, so they cannot be confused with a character
 * count. The values are parenthesized so that they expand safely inside
 * any expression.
 */
#define	U8E_TRUNC	(-1)	/* UTF-8 sequence truncated */
#define	U8E_ILLSTART	(-2)	/* Illegal UTF-8 sequence start */
#define	U8E_NOTCONT	(-3)	/* Continuation expectation failed */
#define	U8E_NOTMIN	(-4)	/* Not minimal length encoding */
#define	U8E_EINVAL	(-5)	/* Invalid arguments */
71
72int
73UTF8String_constraint(asn_TYPE_descriptor_t *td, const void *sptr,
74 asn_app_constraint_failed_f *ctfailcb, void *app_key) {
75 ssize_t len = UTF8String_length((const UTF8String_t *)sptr);
76 switch(len) {
77 case U8E_EINVAL:
Harald Welteec0e2172010-07-20 00:03:44 +020078 _ASN_CTFAIL(app_key, td, sptr,
Harald Welte92c45f32010-06-12 18:59:38 +020079 "%s: value not given", td->name);
80 break;
81 case U8E_TRUNC:
Harald Welteec0e2172010-07-20 00:03:44 +020082 _ASN_CTFAIL(app_key, td, sptr,
Harald Welte92c45f32010-06-12 18:59:38 +020083 "%s: truncated UTF-8 sequence (%s:%d)",
84 td->name, __FILE__, __LINE__);
85 break;
86 case U8E_ILLSTART:
Harald Welteec0e2172010-07-20 00:03:44 +020087 _ASN_CTFAIL(app_key, td, sptr,
Harald Welte92c45f32010-06-12 18:59:38 +020088 "%s: UTF-8 illegal start of encoding (%s:%d)",
89 td->name, __FILE__, __LINE__);
90 break;
91 case U8E_NOTCONT:
Harald Welteec0e2172010-07-20 00:03:44 +020092 _ASN_CTFAIL(app_key, td, sptr,
Harald Welte92c45f32010-06-12 18:59:38 +020093 "%s: UTF-8 not continuation (%s:%d)",
94 td->name, __FILE__, __LINE__);
95 break;
96 case U8E_NOTMIN:
Harald Welteec0e2172010-07-20 00:03:44 +020097 _ASN_CTFAIL(app_key, td, sptr,
Harald Welte92c45f32010-06-12 18:59:38 +020098 "%s: UTF-8 not minimal sequence (%s:%d)",
99 td->name, __FILE__, __LINE__);
100 break;
101 }
102 return (len < 0) ? -1 : 0;
103}
104
105static ssize_t
106UTF8String__process(const UTF8String_t *st, uint32_t *dst, size_t dstlen) {
107 size_t length;
108 uint8_t *buf = st->buf;
109 uint8_t *end = buf + st->size;
110 uint32_t *dstend = dst + dstlen;
111
112 for(length = 0; buf < end; length++) {
113 int ch = *buf;
114 uint8_t *cend;
115 int32_t value;
116 int want;
117
118 /* Compute the sequence length */
119 want = UTF8String_ht[0][ch >> 4];
120 switch(want) {
121 case -1:
122 /* Second half of the table, long sequence */
123 want = UTF8String_ht[1][ch & 0x0F];
124 if(want != -1) break;
125 /* Fall through */
126 case 0:
127 return U8E_ILLSTART;
128 }
129
130 /* assert(want >= 1 && want <= 6) */
131
132 /* Check character sequence length */
133 if(buf + want > end) return U8E_TRUNC;
134
135 value = ch & (0xff >> want);
136 cend = buf + want;
137 for(buf++; buf < cend; buf++) {
138 ch = *buf;
139 if(ch < 0x80 || ch > 0xbf) return U8E_NOTCONT;
140 value = (value << 6) | (ch & 0x3F);
141 }
142 if(value < UTF8String_mv[want])
143 return U8E_NOTMIN;
144 if(dst < dstend)
145 *dst++ = value; /* Record value */
146 }
147
148 if(dst < dstend) *dst = 0; /* zero-terminate */
149
150 return length;
151}
152
153
154ssize_t
155UTF8String_length(const UTF8String_t *st) {
156 if(st && st->buf) {
157 return UTF8String__process(st, 0, 0);
158 } else {
159 return U8E_EINVAL;
160 }
161}
162
163size_t
164UTF8String_to_wcs(const UTF8String_t *st, uint32_t *dst, size_t dstlen) {
165 if(st && st->buf) {
166 ssize_t ret = UTF8String__process(st, dst, dstlen);
167 return (ret < 0) ? 0 : ret;
168 } else {
169 return 0;
170 }
171}
172
173int
174UTF8String_print(asn_TYPE_descriptor_t *td, const void *sptr, int ilevel,
175 asn_app_consume_bytes_f *cb, void *app_key) {
176 const UTF8String_t *st = (const UTF8String_t *)sptr;
177
178 (void)td; /* Unused argument */
179 (void)ilevel; /* Unused argument */
180
181 if(st && st->buf) {
182 return (cb(st->buf, st->size, app_key) < 0) ? -1 : 0;
183 } else {
184 return (cb("<absent>", 8, app_key) < 0) ? -1 : 0;
185 }
186}