annotate libcoding/utf8_decode2.c @ 33:a91fb88a57b2 default tip

add INSTALL document
author Mychaela Falconia <falcon@freecalypso.org>
date Fri, 14 Jun 2024 20:29:17 +0000
parents e56bb9f09ff1
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
1 /*
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
2 * This library module implements the function for converting UTF-8 input
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
3 * to UCS-2 in outgoing SMS composition.
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
4 */
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
5
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
6 #include <sys/types.h>
23
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
7 #include <ctype.h>
0
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
8
23
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
9 static int
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
10 handle_escape(ipp, outp)
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
11 u_char **ipp;
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
12 unsigned *outp;
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
13 {
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
14 unsigned c, n, acc;
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
15
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
16 c = *(*ipp)++;
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
17 switch (c) {
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
18 case '"':
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
19 case '\\':
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
20 *outp = c;
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
21 return(0);
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
22 case 'n':
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
23 *outp = '\n';
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
24 return(0);
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
25 case 'r':
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
26 *outp = '\r';
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
27 return(0);
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
28 case 'u':
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
29 acc = 0;
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
30 for (n = 0; n < 4; n++) {
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
31 c = *(*ipp)++;
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
32 if (!isxdigit(c))
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
33 return(-3);
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
34 acc <<= 4;
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
35 acc |= decode_hex_digit(c);
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
36 }
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
37 *outp = acc;
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
38 return(0);
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
39 default:
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
40 return(-3);
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
41 }
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
42 }
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
43
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
44 utf8_to_ucs2(inbuf, outbuf, outmax, outlenp, allow_escape)
0
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
45 u_char *inbuf;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
46 u_short *outbuf;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
47 unsigned outmax, *outlenp;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
48 {
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
49 u_char *ip = inbuf;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
50 u_short *op = outbuf;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
51 unsigned outcnt = 0, c, n, uni;
23
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
52 int rc;
0
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
53
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
54 while (c = *ip++) {
23
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
55 if (c == '\\' && allow_escape) {
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
56 rc = handle_escape(&ip, &uni);
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
57 if (rc < 0)
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
58 return(rc);
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
59 goto gotuni;
e56bb9f09ff1 sms-encode-text: port over -e option from fcup-smsend
Mychaela Falconia <falcon@freecalypso.org>
parents: 0
diff changeset
60 }
0
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
61 if (c < 0x80) {
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
62 uni = c;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
63 goto gotuni;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
64 }
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
65 if (c < 0xC0 || c > 0xEF)
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
66 return(-1);
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
67 uni = c & 0x1F;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
68 if (c >= 0xE0)
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
69 n = 2;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
70 else
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
71 n = 1;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
72 for (; n; n--) {
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
73 c = *ip++;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
74 if (c < 0x80 || c > 0xBF)
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
75 return(-1);
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
76 uni <<= 6;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
77 uni |= c & 0x3F;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
78 }
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
79 gotuni: if (outcnt >= outmax)
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
80 return(-2);
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
81 *op++ = uni;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
82 outcnt++;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
83 }
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
84 *outlenp = outcnt;
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
85 return(0);
2d0082216916 libcoding: beginning with a subset of uptools version
Mychaela Falconia <falcon@freecalypso.org>
parents:
diff changeset
86 }