blob: 15969b1eb240b8263efd9027a4dbca74c6284f32 [file] [log] [blame]
Lev Walkinf15320b2004-06-03 03:38:44 +00001/*-
Lev Walkin4902f052006-10-16 12:18:10 +00002 * Copyright (c) 2003, 2006 Lev Walkin <vlm@lionet.info>. All rights reserved.
Lev Walkinf15320b2004-06-03 03:38:44 +00003 * Redistribution and modifications are permitted subject to BSD license.
4 */
Lev Walkina9cc46e2004-09-22 16:06:28 +00005#include <asn_internal.h>
Lev Walkinf15320b2004-06-03 03:38:44 +00006#include <TeletexString.h>
7
8/*
9 * TeletexString basic type description.
10 */
Wim Lewis18c2ec92014-07-29 11:30:10 -070011static const ber_tlv_tag_t asn_DEF_TeletexString_tags[] = {
Lev Walkin188ed2c2004-09-13 08:31:01 +000012 (ASN_TAG_CLASS_UNIVERSAL | (20 << 2)), /* [UNIVERSAL 20] IMPLICIT ...*/
13 (ASN_TAG_CLASS_UNIVERSAL | (4 << 2)), /* ... OCTET STRING */
Lev Walkinf15320b2004-06-03 03:38:44 +000014};
Lev Walkin5e033762004-09-29 13:26:15 +000015asn_TYPE_descriptor_t asn_DEF_TeletexString = {
Lev Walkinf15320b2004-06-03 03:38:44 +000016 "TeletexString",
Lev Walkindc06f6b2004-10-20 15:50:55 +000017 "TeletexString",
Lev Walkina9cc46e2004-09-22 16:06:28 +000018 OCTET_STRING_free,
19 OCTET_STRING_print, /* non-ascii string */
Lev Walkincd2f48e2017-08-10 02:14:59 -070020 OCTET_STRING_compare,
Lev Walkinf15320b2004-06-03 03:38:44 +000021 asn_generic_unknown_constraint,
22 OCTET_STRING_decode_ber, /* Implemented in terms of OCTET STRING */
Lev Walkindc06f6b2004-10-20 15:50:55 +000023 OCTET_STRING_encode_der,
24 OCTET_STRING_decode_xer_hex,
25 OCTET_STRING_encode_xer,
Lev Walkincc159472017-07-06 08:26:36 -070026#ifdef ASN_DISABLE_OER_SUPPORT
27 0,
28 0,
29#else
Lev Walkin1d76f3c2017-07-25 07:58:05 -070030 OCTET_STRING_decode_oer,
31 OCTET_STRING_encode_oer,
Lev Walkincc159472017-07-06 08:26:36 -070032#endif /* ASN_DISABLE_OER_SUPPORT */
Lev Walkinb33425f2017-07-14 14:59:52 +040033#ifdef ASN_DISABLE_PER_SUPPORT
34 0,
35 0,
36#else
37 OCTET_STRING_decode_uper,
38 OCTET_STRING_encode_uper,
39#endif /* ASN_DISABLE_PER_SUPPORT */
Lev Walkinf15320b2004-06-03 03:38:44 +000040 0, /* Use generic outmost tag fetcher */
Lev Walkin5e033762004-09-29 13:26:15 +000041 asn_DEF_TeletexString_tags,
42 sizeof(asn_DEF_TeletexString_tags)
43 / sizeof(asn_DEF_TeletexString_tags[0]) - 1,
44 asn_DEF_TeletexString_tags,
45 sizeof(asn_DEF_TeletexString_tags)
46 / sizeof(asn_DEF_TeletexString_tags[0]),
Lev Walkin76780762017-07-07 10:07:30 -070047 0, /* No OER visible constraints */
Lev Walkin59b176e2005-11-26 11:25:14 +000048 0, /* No PER visible constraints */
Lev Walkin449f8322004-08-20 13:23:42 +000049 0, 0, /* No members */
Lev Walkind9bd7752004-06-05 08:17:50 +000050 0 /* No specifics */
Lev Walkinf15320b2004-06-03 03:38:44 +000051};
52
Lev Walkin4902f052006-10-16 12:18:10 +000053/*
54 * Here is a formal attempt at creating a mapping from TeletexString
55 * (T61String) of the latest ASN.1 standard (X.680:2002) into the Unicode
56 * character set. -- Lev Walkin <vlm@lionet.info>
57 *
58 * The first thing to keep in mind is that TeletexString (T61String)
59 * is defined in ASN.1, and is not really a T.61 string.
60 * The T.61 standard is withdrawn by ITU-T and is no longer an authoritative
61 * reference. See http://www.itu.int/rec/T-REC-T.61
62 *
63 * The X.680 specifies TeletexString (T61String) as a combination of the
64 * character sets specified by the registration numbers listed in
65 * ISO International Register of Coded Character Sets to be used with
66 * Escape Sequences (ISO-2375):
67 * 6, 87, 102, 103, 106, 107, 126, 144, 150, 153, 156, 164, 165, 168,
68 * plus SPACE and DELETE characters.
69 * In addition to that, the X.680 Table 6 NOTE 2 allows using register entries
70 * 6 and 156 instead of 102 and 103.
71 *
72 * The ISO Register itself is available at http://www.itscj.ipsj.or.jp/ISO-IR/
73 *
74 * #6 is ASCII. http://www.itscj.ipsj.or.jp/ISO-IR/006.pdf
75 * Escapes into:
76 * G0: ESC 2/8 4/2 ("(B")
77 * G1: ESC 2/9 4/2 (")B")
78 * The range is [0x21 .. 0x7e]. Conversion into Unicode
79 * is simple, because it has one-to-one correspondence.
80 * #87 is a "Japanese Graphic Character Set for Information Interchange".
81 * Is a multiple-byte set of 6877 characters.
82 * The character set is JIS X 0208-1983 (originally JIS C 6226-1983).
83 * Escapes into:
84 * G0: ESC 2/4 4/2 ("$B")
85 * G1: ESC 2/4 2/9 4/2 ("$)B")
86 * G2: ESC 2/4 2/10 4/2 ("$*B")
87 * G3: ESC 2/4 2/11 4/2 ("$+B")
88 * #102 is "Teletex Primary Set of Graphic Characters" and is almost ASCII.
89 * Escapes into:
90 * G0: ESC 2/8 7/5 ("(u")
91 * G1: ESC 2/9 7/5 (")u")
92 * G2: ESC 2/10 7/5 ("*u")
93 * G3: ESC 2/11 7/5 ("+u")
 *    It is almost identical to ASCII, except that the ASCII position for '$'
 *    (DOLLAR SIGN) is filled with '¤' (CURRENCY SIGN), which is U+00A4.
96 * Also, ASCII positions for '`', '\', '^', '{', '}', '~' are marked
97 * as "should not be used".
98 * #103 is a supplementary set of characters used in combination with #102.
99 * Escapes into:
100 * G0: ESC 2/8 7/6 ("(v")
101 * G1: ESC 2/9 7/6 (")v")
102 * G2: ESC 2/10 7/6 ("*v")
103 * G3: ESC 2/11 7/6 ("+v")
104 * Some characters in that character set are combining characters,
105 * which can only be restrictively used with certain basic Latin letters.
106 * It can be thought of as a subset of #156 with the exception of 4/12
107 * which is UNDERLINE in #103 and absent in #156.
108 * #106 is a primary set of control functions, used in combination with #107.
109 * Escapes into:
110 * C0: ESC 2/1 4/5 ("!E")
111 * This set is so short I can list it here:
112 * 0x08 BS BACKSPACE -- same as Unicode
113 * 0x0a LF LINE FEED -- same as Unicode
114 * 0x0c FF FORM FEED -- same as Unicode
115 * 0x0d CR CARRIAGE RETURN -- same as Unicode
116 * 0x0e LS1 LOCKING SHIFT ONE
117 * 0x0f LS0 LOCKING SHIFT ZERO
118 * 0x19 SS2 SINGLE SHIFT TWO
119 * 0x1a SUB SUBSTITUTE CHARACTER
120 * 0x1b ESC ESCAPE -- same as Unicode
121 * 0x1d SS3 SINGLE SHIFT THREE
 *    The LS1 and LS0 are two magical functions which, respectively, invoke
 *    the currently designated G1 or G0 set into positions 2/1 to 7/14.
124 * The SS2 and SS3, respectively, invoke one character of the
125 * currently designated set G2 and G3.
126 * The SUB is wholly equivalent to U+001a (SUBSTITUTE)
127 * #107 is a supplementary set of control functions, used with #106.
128 * Escapes into:
129 * C1: ESC 2/2 4/8 ('"H')
130 * This set contains three special control codes:
131 * 0x8b PLD PARTIAL LINE DOWN -- similar to <SUB>
 *      0x8c PLU PARTIAL LINE UP -- similar to <SUP>
133 * 0x9b CSI CONTROL SEQUENCE INTRODUCER
 *    This set is so exotic that we can probably safely ignore it.
135 * #126 is a "Right-hand Part of the Latin/Greek Alphabet".
 *    Comprises 90 characters, including accented letters.
137 * Escapes into:
138 * G1: ESC 2/13 4/6 ("-F")
139 * G2: ESC 2/14 4/6 (".F")
140 * G3: ESC 2/15 4/6 ("/F")
141 * Note: This Registration is a subset of ISO-IR 227.
142 * #144 is a "Cyrillic part of the Latin/Cyrillic Alphabet".
 *    Comprises 95 characters.
144 * Escapes into:
145 * G1: ESC 2/13 4/12 ("-L")
146 * G2: ESC 2/14 4/12 (".L")
147 * G3: ESC 2/15 4/12 ("/L")
148 * #150 is a "Greek Primary Set of Graphic Characters".
 *    Comprises 94 characters.
150 * Escapes into:
151 * G0: ESC 2/8 2/1 4/0 ("(!@")
152 * G1: ESC 2/9 2/1 4/0 (")!@")
153 * G2: ESC 2/10 2/1 4/0 ("*!@")
154 * G3: ESC 2/11 2/1 4/0 ("+!@")
155 * #153 is a "Basic Cyrillic Character Set for 8-bit codes".
 *    Comprises 68 characters.
157 * Escapes into:
158 * G1: ESC 2/13 4/15 ("-O")
159 * G2: ESC 2/14 4/15 (".O")
160 * G3: ESC 2/15 4/15 ("/O")
161 * #156 is a "Supplementary Set of ISO/IEC 6937:1992" for use with #6
 *    Comprises 87 characters.
163 * Escapes into:
164 * G1: ESC 2/13 5/2 ("-R")
165 * G2: ESC 2/14 5/2 (".R")
166 * G3: ESC 2/15 5/2 ("/R")
167 * #164 is a "Hebrew Supplementary Set of Graphic Characters"
 *    Comprises 27 characters.
169 * Escapes into:
170 * G1: ESC 2/13 5/3 ("-S")
171 * G2: ESC 2/14 5/3 (".S")
172 * G3: ESC 2/15 5/3 ("/S")
173 * #165 is a set of "Codes of the Chinese graphic character set"
174 * Is a multiple-byte set of 8446 characters.
175 * Escapes into:
176 * G0: ESC 2/4 2/8 4/5 ("$(E")
177 * G1: ESC 2/4 2/9 4/5 ("$)E")
178 * G2: ESC 2/4 2/10 4/5 ("$*E")
179 * G3: ESC 2/4 2/11 4/5 ("$+E")
180 * #168 is a "Japanese Graphic Character Set for Information Interchange"
181 * A multiple-byte set of 6879 characters updated from #87.
182 * Escapes into:
183 * G0: ESC 2/6 4/0 ESC 2/4 4/2 ("&@" "$B")
184 * G1: ESC 2/6 4/0 ESC 2/4 2/9 4/2 ("&@" "$)B")
185 * G2: ESC 2/6 4/0 ESC 2/4 2/10 4/2 ("&@" "$*B")
186 * G3: ESC 2/6 4/0 ESC 2/4 2/11 4/2 ("&@" "$+B")
187 */
188