/* Determine the number of screen columns needed for a string.
   Copyright (C) 2000-2002 Free Software Foundation, Inc.

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2, or (at your option)
   any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software Foundation,
   Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.  */

/* Written by Bruno Haible <haible@clisp.cons.org>.  */
19 | ||
#ifdef HAVE_CONFIG_H
# include <config.h>
#endif

/* Specification.  */
#include "mbswidth.h"

/* Get INT_MAX.  */
#include <limits.h>

/* Get MB_CUR_MAX.  */
#include <stdlib.h>

#include <string.h>

/* Get isprint().  */
#include <ctype.h>

/* Get mbstate_t, mbrtowc(), mbsinit(), wcwidth().  */
#if HAVE_WCHAR_H
# include <wchar.h>
#endif

/* Get iswprint(), iswcntrl().  */
#if HAVE_WCTYPE_H
# include <wctype.h>
#endif
/* Fallback for iswprint: when it is neither defined as a macro nor
   reported as available through HAVE_ISWPRINT, treat every wide
   character as printable.  */
#if !defined iswprint && !HAVE_ISWPRINT
# define iswprint(wc) 1
#endif
/* Fallback for iswcntrl: when it is neither defined as a macro nor
   reported as available through HAVE_ISWCNTRL, treat no wide character
   as a control character.  */
#if !defined iswcntrl && !HAVE_ISWCNTRL
# define iswcntrl(wc) 0
#endif
50 | ||
/* Fallback for mbsinit: when it is neither defined as a macro nor
   reported as available through HAVE_MBSINIT, substitute the constant 1,
   i.e. always report the conversion state as being the initial state.
   The argument PS is not evaluated by this replacement.  */
#ifndef mbsinit
# if !HAVE_MBSINIT
# define mbsinit(ps) 1
# endif
#endif
56 | ||
/* HAVE_DECL_WCWIDTH is expected to be defined (to 0 or 1).  If it is not
   defined at all, the bare string literal below ends up at file scope,
   which is not valid C, so the compilation fails instead of silently
   guessing whether wcwidth is declared.  */
#ifndef HAVE_DECL_WCWIDTH
"this configure-time declaration test was not run"
#endif
/* When HAVE_DECL_WCWIDTH is 0, declare wcwidth here.  This is an
   old-style declaration without a parameter list.  */
#if !HAVE_DECL_WCWIDTH
int wcwidth ();
#endif

/* Replacement used only when wcwidth is not already a macro and
   HAVE_WCWIDTH is 0.  */
#ifndef wcwidth
# if !HAVE_WCWIDTH
/* wcwidth doesn't exist, so assume all printable characters have
   width 1.  The null wide character gets width 0, and any character
   that iswprint does not accept gets -1.  */
# define wcwidth(wc) ((wc) == 0 ? 0 : iswprint (wc) ? 1 : -1)
# endif
#endif
71 | ||
/* Get ISPRINT.  */
/* IN_CTYPE_DOMAIN (c) guards the <ctype.h> calls below.  It is the
   constant 1 when STDC_HEADERS is defined, or when isascii is neither a
   macro nor reported through HAVE_ISASCII; otherwise it is isascii (c).  */
#if defined (STDC_HEADERS) || (!defined (isascii) && !defined (HAVE_ISASCII))
# define IN_CTYPE_DOMAIN(c) 1
#else
# define IN_CTYPE_DOMAIN(c) isascii(c)
#endif
/* Undefine to protect against the definition in wctype.h of solaris2.6.  */
#undef ISPRINT
/* ISPRINT (c) is 1 if C passes IN_CTYPE_DOMAIN and isprint, else 0.
   Note that C is expanded twice.  */
#define ISPRINT(c) (IN_CTYPE_DOMAIN (c) && isprint (c))
/* Any earlier definition of ISCNTRL is dropped in the same way.  */
#undef ISCNTRL
/* ISCNTRL (c) is 1 if C passes IN_CTYPE_DOMAIN and iscntrl, else 0.
   Note that C is expanded twice.  */
#define ISCNTRL(c) (IN_CTYPE_DOMAIN (c) && iscntrl (c))
83 | ||
/* Returns the number of screen columns needed to display the
   NUL-terminated multibyte string STRING.  The byte length is measured
   with strlen and the work is delegated to mbsnwidth, to which FLAGS is
   passed unchanged.  If a non-printable character occurs, and
   MBSW_REJECT_UNPRINTABLE is specified, -1 is returned.
   With flags = MBSW_REJECT_INVALID | MBSW_REJECT_UNPRINTABLE, this is
   the multibyte analogue of the wcswidth function.  */
int
mbswidth (const char *string, int flags)
{
  size_t nbytes = strlen (string);

  return mbsnwidth (string, nbytes, flags);
}
94 | ||
95 | /* Returns the number of columns needed to represent the multibyte | |
96 | character string pointed to by STRING of length NBYTES. If a | |
97 | non-printable character occurs, and MBSW_REJECT_UNPRINTABLE is | |
98 | specified, -1 is returned. */ | |
99 | int | |
100 | mbsnwidth (const char *string, size_t nbytes, int flags) | |
101 | { | |
102 | const char *p = string; | |
103 | const char *plimit = p + nbytes; | |
104 | int width; | |
105 | ||
106 | width = 0; | |
107 | #if HAVE_MBRTOWC | |
108 | if (MB_CUR_MAX > 1) | |
109 | { | |
110 | while (p < plimit) | |
111 | switch (*p) | |
112 | { | |
113 | case ' ': case '!': case '"': case '#': case '%': | |
114 | case '&': case '\'': case '(': case ')': case '*': | |
115 | case '+': case ',': case '-': case '.': case '/': | |
116 | case '0': case '1': case '2': case '3': case '4': | |
117 | case '5': case '6': case '7': case '8': case '9': | |
118 | case ':': case ';': case '<': case '=': case '>': | |
119 | case '?': | |
120 | case 'A': case 'B': case 'C': case 'D': case 'E': | |
121 | case 'F': case 'G': case 'H': case 'I': case 'J': | |
122 | case 'K': case 'L': case 'M': case 'N': case 'O': | |
123 | case 'P': case 'Q': case 'R': case 'S': case 'T': | |
124 | case 'U': case 'V': case 'W': case 'X': case 'Y': | |
125 | case 'Z': | |
126 | case '[': case '\\': case ']': case '^': case '_': | |
127 | case 'a': case 'b': case 'c': case 'd': case 'e': | |
128 | case 'f': case 'g': case 'h': case 'i': case 'j': | |
129 | case 'k': case 'l': case 'm': case 'n': case 'o': | |
130 | case 'p': case 'q': case 'r': case 's': case 't': | |
131 | case 'u': case 'v': case 'w': case 'x': case 'y': | |
132 | case 'z': case '{': case '|': case '}': case '~': | |
133 | /* These characters are printable ASCII characters. */ | |
134 | p++; | |
135 | width++; | |
136 | break; | |
137 | default: | |
138 | /* If we have a multibyte sequence, scan it up to its end. */ | |
139 | { | |
140 | mbstate_t mbstate; | |
141 | memset (&mbstate, 0, sizeof mbstate); | |
142 | do | |
143 | { | |
144 | wchar_t wc; | |
145 | size_t bytes; | |
146 | int w; | |
147 | ||
148 | bytes = mbrtowc (&wc, p, plimit - p, &mbstate); | |
149 | ||
150 | if (bytes == (size_t) -1) | |
151 | /* An invalid multibyte sequence was encountered. */ | |
152 | { | |
153 | if (!(flags & MBSW_REJECT_INVALID)) | |
154 | { | |
155 | p++; | |
156 | width++; | |
157 | break; | |
158 | } | |
159 | else | |
160 | return -1; | |
161 | } | |
162 | ||
163 | if (bytes == (size_t) -2) | |
164 | /* An incomplete multibyte character at the end. */ | |
165 | { | |
166 | if (!(flags & MBSW_REJECT_INVALID)) | |
167 | { | |
168 | p = plimit; | |
169 | width++; | |
170 | break; | |
171 | } | |
172 | else | |
173 | return -1; | |
174 | } | |
175 | ||
176 | if (bytes == 0) | |
177 | /* A null wide character was encountered. */ | |
178 | bytes = 1; | |
179 | ||
180 | w = wcwidth (wc); | |
181 | if (w >= 0) | |
182 | /* A printable multibyte character. */ | |
183 | width += w; | |
184 | else | |
185 | /* An unprintable multibyte character. */ | |
186 | if (!(flags & MBSW_REJECT_UNPRINTABLE)) | |
187 | width += (iswcntrl (wc) ? 0 : 1); | |
188 | else | |
189 | return -1; | |
190 | ||
191 | p += bytes; | |
192 | } | |
193 | while (! mbsinit (&mbstate)); | |
194 | } | |
195 | break; | |
196 | } | |
197 | return width; | |
198 | } | |
199 | #endif | |
200 | ||
201 | while (p < plimit) | |
202 | { | |
203 | unsigned char c = (unsigned char) *p++; | |
204 | ||
205 | if (ISPRINT (c)) | |
206 | width++; | |
207 | else if (!(flags & MBSW_REJECT_UNPRINTABLE)) | |
208 | width += (ISCNTRL (c) ? 0 : 1); | |
209 | else | |
210 | return -1; | |
211 | } | |
212 | return width; | |
213 | } |