chiark / gitweb /
Build system overhaul.
[misc] / space.c
CommitLineData
df33ee54
MW
1#include <ctype.h>
2#include <errno.h>
3#include <stdio.h>
4#include <stdlib.h>
5#include <string.h>
6
7#include <sys/types.h>
8#include <sys/stat.h>
9
10#include <fcntl.h>
11#include <getopt.h>
12#include <unistd.h>
13
/* Status codes returned by space() and used as the process exit code.
 * main() keeps the numerically largest status seen, so the values are
 * ordered by severity.
 */
enum {
  OK = 0,			/* nothing to report */
  BADNESS = 1,			/* a whitespace problem was found in a file */
  TROUBLE = 32			/* usage error, or a file could not be processed */
};
19
/* Program name used as the prefix of diagnostics; main() replaces the
 * placeholder with the basename of argv[0].
 */
static const char *ego = "<unset>";

/* Argument given to -i (suffix for the backup copy), or null if none. */
static const char *bkp = NULL;

/* Command-line option bits; see the F_* masks below. */
static unsigned flags = 0u;
#define F_MIDLINETABS	(1u << 0)	/* -m */
#define F_INPLACE	(1u << 1)	/* -i */
#define F_CHECK		(1u << 2)	/* -c */
#define F_BOGUS		(1u << 3)	/* an unrecognized option was seen */
#define F_UNTABIFY	(1u << 4)	/* -u */
#define F_TABIFY	(1u << 5)	/* -t */
#define F_VERBOSE	(1u << 6)	/* -v */
32
33static void usage(FILE *fp)
34 { fprintf(fp, "Usage: %s [-cmtuv] [-i[BKP]] [FILE...]\n\n", ego); }
35
36static char *augment(const char *name, const char *suffix)
37{
38 size_t n = strlen(name), nn = strlen(suffix);
39 char *p = malloc(n + nn + 1);
40
41 if (!p) {
42 fprintf(stderr, "%s: Out of memory!\n", ego);
43 return (0);
44 }
45 memcpy(p, name, n);
46 memcpy(p + n, suffix, nn + 1);
47 return (p);
48}
49
50static FILE *freshname(const char *name, char **newname, mode_t mode)
51{
52 char buf[16];
53 int i;
54 int fd;
55 FILE *fp;
56 char *n;
57
58 for (i = 0; i < 32767; i++) {
59 sprintf(buf, ".new%d", i);
60 if ((n = augment(name, buf)) == 0)
61 goto fail_0;
62 if ((fd = open(n, O_WRONLY | O_CREAT | O_EXCL, mode)) < 0) {
63 if (errno == EEXIST) {
64 free(n);
65 continue;
66 }
67 fprintf(stderr, "%s: Can't create new file for `%s': %s\n",
68 ego, name, strerror(errno));
69 goto fail_1;
70 }
71 goto win;
72 }
73 fprintf(stderr, "%s: Can't find new file to update `%s'\n", ego, name);
74 goto fail_1;
75
76win:
77 if (chmod(n, mode)) {
78 fprintf(stderr, "%s: Can't set permissions on `%s': %s\n",
79 ego, n, strerror(errno));
80 goto fail_2;
81 }
82 if ((fp = fdopen(fd, "w")) == 0) {
83 fprintf(stderr, "%s: fdopen on `%s' failed: %s\n",
84 ego, n, strerror(errno));
85 goto fail_2;
86 }
87 *newname = n;
88 return (fp);
89
90fail_2:
91 close(fd);
92fail_1:
93 free(n);
94fail_0:
95 return (0);
96}
97
/* A growable byte buffer. */
struct buf {
  char *b;			/* storage, or null before the first put() */
  size_t n;			/* number of bytes currently stored */
  size_t sz;			/* number of bytes allocated at `b' */
};
typedef struct buf buf;

/* Static initializer for an empty buffer with no storage. */
#define BUF_INIT { NULL, 0, 0 }
104
105static void reset(buf *b) { b->n = 0; }
106
107static int put(buf *b, int ch)
108{
109 size_t w;
110
111 if (b->n >= b->sz) {
112 if (!b->sz) {
113 w = 64;
114 b->b = malloc(w);
115 } else {
116 w = b->sz * 2;
117 b->b = realloc(b->b, w);
118 }
119 if (!b->b) {
120 fprintf(stderr, "%s: Not enough memory for buffer!\n", ego);
121 return (-1);
122 }
123 b->sz = w;
124 }
125 b->b[b->n++] = ch;
126 return (0);
127}
128
/* The first multiple of 8 strictly greater than column N (tab stops are
 * every 8 columns).  N is expected to be an `unsigned' value.
 */
#define TABSTOP(n) (((n) | 7u) + 1u)
130
131static int space(const char *name)
132{
133 static buf b = BUF_INIT;
134 FILE *fin, *fout = stdout;
135 char *newname = 0, *oldname = 0;
136 int rc = TROUBLE, status = OK;
137 int last = '\n';
138 unsigned nsp = 0, nwsp = 0, hpos = 0, ohpos = 0, nhpos = 0, nl = 1;
139 unsigned i;
140#define f_newline 1u
141#define f_warnspacetab 2u
142#define f_tabify 4u
143#define f_warntabs 8u
144#define f_warnspaces 16u
145#define f_tab 32u
146#define f_bad 64u
147#define f_forced 128u
148 unsigned f = f_newline | (flags & F_TABIFY ? f_tabify : 0);
149 int ch;
150
151 if (strcmp(name, "-") == 0) {
152 if (flags & F_INPLACE) {
153 fprintf(stderr, "%s: Can't modify stdin in-place.\n", ego);
154 goto done_0;
155 }
156 fin = stdin;
157 } else {
158 if ((fin = fopen(name, "r")) == 0) {
159 fprintf(stderr, "%s: Failed to open file `%s': %s.\n",
160 ego, name, strerror(errno));
161 goto done_0;
162 }
163 else if (flags & F_INPLACE) {
164 struct stat st;
165 if (stat(name, &st)) {
166 fprintf(stderr, "%s: Can't stat `%s': %s.\n",
167 ego, name, strerror(errno));
168 goto done_1;
169 }
170 if ((fout = freshname(name, &newname, st.st_mode)) == 0)
171 goto done_1;
172 }
173 }
174 if (flags & F_CHECK)
175 fout = 0;
176
177 for (;;) {
178 ch = getc(fin);
179 switch (ch) {
180 case ' ':
181 nsp++; nwsp++; hpos++;
182 if (put(&b, ' ')) goto done_2;
183 break;
184 case '\t':
185 if (flags & F_UNTABIFY) {
186 if ((flags & F_CHECK) && !(f & f_warntabs)) {
187 fprintf(stderr, "%s:%u: found tab\n", name, nl);
188 f |= f_warntabs;
189 status = BADNESS;
190 }
191 } else if (((flags & F_MIDLINETABS) || (f & f_newline)) && nsp) {
192 if ((flags & F_VERBOSE) && !(f & f_warnspacetab)) {
193 fprintf(stderr, "%s:%u: space followed by tab\n", name, nl);
194 f |= f_warnspacetab;
195 status = BADNESS;
196 }
197 f |= f_tabify | f_forced;
198 }
199 f |= f_tab;
200 nsp = 0; nwsp++; hpos = TABSTOP(hpos);
201 if (put(&b, '\t')) goto done_2;
202 break;
203 case EOF:
204 if (nwsp || !(f & f_newline)) {
205 if (flags & F_VERBOSE)
206 fprintf(stderr, "%s:%u: file ends in mid-line\n", name, nl);
207 status = BADNESS;
208 if (fout) putc('\n', fout);
209 }
210 goto end;
211 case '\n':
212 case '\v':
213 if (nwsp && (flags & F_VERBOSE)) {
214 fprintf(stderr, "%s:%u: trailing whitespace\n", name, nl);
215 status = BADNESS;
216 }
217 if (fout) putc('\n', fout);
218 reset(&b);
219 nsp = nwsp = hpos = ohpos = 0; nl++;
220 f |= f_newline;
221 f &= ~(f_tab | f_warnspacetab | f_warntabs | f_warnspaces);
222 if (flags & F_TABIFY)
223 f |= f_tabify;
224 else
225 f &= ~f_tabify;
226 last = '\n';
227 break;
228 default:
229 if (nwsp) {
230 if (flags & F_UNTABIFY) {
231 if (fout) for (; ohpos < hpos; ohpos++) putc(' ', fout);
232 } else if ((f & f_tabify) &&
233 ((hpos - ohpos >= (last == '.' || last == ':' ?
234 3 : 2)) ||
235 (f & (f_tab | f_newline)))) {
236 i = 0;
237 for (;;) {
238 nhpos = TABSTOP(ohpos);
239 if (nhpos > hpos) break;
240 if (fout) putc('\t', fout);
241 if ((flags & F_VERBOSE) && (flags & F_TABIFY) &&
242 i < b.n && b.b[i] != '\t' &&
243 !(f & (f_warnspaces | f_forced))) {
244 fprintf(stderr, "%s:%u: spaces could be turned into tabs\n",
245 name, nl);
246 f |= f_warnspaces;
247 }
248 ohpos = nhpos;
249 i++;
250 }
251 if (fout)
252 for (; ohpos < hpos; ohpos++) putc(' ', fout);
253 } else if (fout)
254 for (i = 0; i < b.n; i++) putc(b.b[i], fout);
255 }
256 reset(&b);
257 f &= ~(f_newline | f_tab | f_forced);
258 if (!(flags & F_TABIFY) || !(flags & F_MIDLINETABS)) f &= ~f_tabify;
259 nwsp = nsp = 0;
260 hpos++; ohpos = hpos;
261 if (fout) putc(ch, fout);
262 if (ch != '"' && ch != '\'')
263 last = ch;
264 break;
265 }
266 }
267end:;
268
269 if (ferror(fin)) {
270 fprintf(stderr, "%s: Error reading `%s': %s\n",
271 ego, name, strerror(errno));
272 goto done_2;
273 }
274
275 if (fout) {
276 if (fflush(fout) || ferror(fout)) f |= f_bad;
277 if (fout != stdout && fclose(fout)) f |= f_bad;
278 fout = 0;
279 if (f & f_bad) {
280 fprintf(stderr, "%s: Error writing `%s': %s\n",
281 ego, newname, strerror(errno));
282 goto done_2;
283 }
284 }
285
286 if (flags & F_INPLACE) {
287 if (bkp) {
288 if ((oldname = augment(name, bkp)) == 0)
289 goto done_2;
290 if (rename(name, oldname)) {
291 fprintf(stderr, "%s: Failed to back up `%s' as `%s': %s\n",
292 ego, name, oldname, strerror(errno));
293 goto done_2;
294 }
295 }
296 if (rename(newname, name)) {
297 if (oldname) rename(oldname, name);
298 fprintf(stderr, "%s: Failed to install `%s' as `%s': %s\n",
299 ego, newname, name, strerror(errno));
300 goto done_2;
301 }
302 }
303
304 rc = status;
305
306done_2:
307 if (oldname) free(oldname);
308 if (newname) {
309 remove(newname);
310 free(newname);
311 }
312done_1:
313 if (fout && fout != stdout) fclose(fout);
314 fclose(fin);
315done_0:
316 return (rc);
317}
318
/* Return 1 if more than one bit is set in F, and 0 otherwise.  Clearing
 * the lowest set bit with `f & (f - 1)' leaves something behind only when
 * a second bit was set.
 */
static int manysetp(unsigned f)
{
  unsigned rest = f & (f - 1);

  return (rest != 0);
}
320
321int main(int argc, char *argv[])
322{
323 int i;
324 int rc = OK, st;
325
326 if ((ego = strrchr(argv[0], '/')) == 0)
327 ego = argv[0];
328 else
329 ego++;
330
331 for (;;) {
332 if ((i = getopt(argc, argv, "h" "cmtuv" "i::")) < 0)
333 break;
334 switch (i) {
335 case 'h':
336 printf("%s -- remove extraneous spaces from files\n\n", ego);
337 usage(stdout);
338 fputs("Options:\n\
339 -h Print this help text\n\
340 -c Check files for badness, but don't produce other output\n\
341 -m Fix spaces followed by tabs in mid-line\n\
342 -t Tabify file completely\n\
343 -u Untabify file completely\n\
344 -i[BKP] Modify files in place; leave FILEBKP as copy of old FILE\n\
345", stdout);
346 exit(0);
347 case 'i':
348 bkp = optarg;
349 flags |= F_INPLACE;
350 break;
351 case 'm':
352 flags |= F_MIDLINETABS;
353 break;
354 case 'c':
355 flags |= F_CHECK;
356 break;
357 case 't':
358 flags |= F_TABIFY;
359 break;
360 case 'u':
361 flags |= F_UNTABIFY;
362 break;
363 case 'v':
364 flags |= F_VERBOSE;
365 break;
366 default:
367 flags |= F_BOGUS;
368 break;
369 }
370 }
371 if (flags & F_BOGUS) {
372 usage(stderr);
373 exit(TROUBLE);
374 }
375 if (manysetp(flags & (F_CHECK | F_INPLACE))) {
376 fprintf(stderr, "%s: Options -c and -i are mutually exclusive.\n", ego);
377 exit(TROUBLE);
378 }
379 if (manysetp(flags & (F_TABIFY | F_UNTABIFY))) {
380 fprintf(stderr, "%s: Options -t and -u are mutually exclusive.\n", ego);
381 exit(TROUBLE);
382 }
383
384 if (optind == argc) {
385 if (isatty(0)) {
386 fprintf(stderr, "%s: No options given and stdin is a terminal.\n",
387 ego);
388 exit(TROUBLE);
389 }
390 rc = space("-");
391 } else for (i = optind; i < argc; i++) {
392 st = space(argv[i]);
393 if (st > rc) rc = st;
394 }
395 if (rc == BADNESS && !(flags & F_CHECK))
396 rc = OK;
397 return (rc);
398}