]> CyberLeo.Net >> Repos - FreeBSD/releng/8.1.git/blob - usr.bin/xstr/xstr.c
Copy stable/8 to releng/8.1 in preparation for 8.1-RC1.
[FreeBSD/releng/8.1.git] / usr.bin / xstr / xstr.c
1 /*
2  * Copyright (c) 1980, 1993
3  *      The Regents of the University of California.  All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions
7  * are met:
8  * 1. Redistributions of source code must retain the above copyright
9  *    notice, this list of conditions and the following disclaimer.
10  * 2. Redistributions in binary form must reproduce the above copyright
11  *    notice, this list of conditions and the following disclaimer in the
12  *    documentation and/or other materials provided with the distribution.
13  * 3. All advertising materials mentioning features or use of this software
14  *    must display the following acknowledgement:
15  *      This product includes software developed by the University of
16  *      California, Berkeley and its contributors.
17  * 4. Neither the name of the University nor the names of its contributors
18  *    may be used to endorse or promote products derived from this software
19  *    without specific prior written permission.
20  *
21  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31  * SUCH DAMAGE.
32  */
33
34 #include <sys/cdefs.h>
35
36 __FBSDID("$FreeBSD$");
37
38 #ifndef lint
39 static const char copyright[] =
40 "@(#) Copyright (c) 1980, 1993\n\
41         The Regents of the University of California.  All rights reserved.\n";
42 #endif
43
44 #ifndef lint
45 static const char sccsid[] = "@(#)xstr.c        8.1 (Berkeley) 6/9/93";
46 #endif
47
48 #include <sys/types.h>
49
50 #include <ctype.h>
51 #include <err.h>
52 #include <stdio.h>
53 #include <stdlib.h>
54 #include <signal.h>
55 #include <string.h>
56 #include <unistd.h>
57
58 #include "pathnames.h"
59
60 /*
61  * xstr - extract and hash strings in a C program
62  *
63  * Bill Joy UCB
64  * November, 1978
65  */
66
67 #define ignore(a)       ((void) a)
68
69 off_t   tellpt;
70
71 off_t   mesgpt;
72 char    cstrings[] =    "strings";
73 char    *strings =      cstrings;
74
75 int     cflg;
76 int     vflg;
77 int     readstd;
78
79 char lastchr(char *);
80
81 int fgetNUL(char *, int, FILE *);
82 int istail(char *, char *);
83 int octdigit(char);
84 int xgetc(FILE *);
85
86 off_t hashit(char *, int);
87 off_t yankstr(char **);
88
89 static void usage(void);
90
91 void flushsh(void);
92 void found(int, off_t, char *);
93 void inithash(void);
94 void onintr(int);
95 void process(const char *);
96 void prstr(char *);
97 void xsdotc(void);
98
99 int
100 main(int argc, char *argv[])
101 {
102         int c;
103         int fdesc;
104
105         while ((c = getopt(argc, argv, "-cv")) != -1)
106                 switch (c) {
107                 case '-':
108                         readstd++;
109                         break;
110                 case 'c':
111                         cflg++;
112                         break;
113                 case 'v':
114                         vflg++;
115                         break;
116                 default:
117                         usage();
118                 }
119         argc -= optind;
120         argv += optind;
121                 
122         if (signal(SIGINT, SIG_IGN) == SIG_DFL)
123                 signal(SIGINT, onintr);
124         if (cflg || (argc == 0 && !readstd))
125                 inithash();
126         else {
127                 strings = strdup(_PATH_TMP);
128                 if (strings == NULL)
129                         err(1, "strdup() failed");
130                 fdesc = mkstemp(strings);
131                 if (fdesc == -1)
132                         err(1, "Unable to create temporary file");
133                 close(fdesc);
134         }
135
136         while (readstd || argc > 0) {
137                 if (freopen("x.c", "w", stdout) == NULL)
138                         err(1, "x.c");
139                 if (!readstd && freopen(argv[0], "r", stdin) == NULL)
140                         err(2, "%s", argv[0]);
141                 process("x.c");
142                 if (readstd == 0)
143                         argc--, argv++;
144                 else
145                         readstd = 0;
146         };
147         flushsh();
148         if (cflg == 0)
149                 xsdotc();
150         if (strings[0] == '/')
151                 ignore(unlink(strings));
152         exit(0);
153 }
154
155 static void
156 usage(void)
157 {
158         fprintf(stderr, "usage: xstr [-cv] [-] [file ...]\n");
159         exit (1);
160 }
161
162 char linebuf[BUFSIZ];
163
164 void
165 process(const char *name)
166 {
167         char *cp;
168         int c;
169         int incomm = 0;
170         int ret;
171
172         printf("extern char\txstr[];\n");
173         for (;;) {
174                 if (fgets(linebuf, sizeof linebuf, stdin) == NULL) {
175                         if (ferror(stdin))
176                                 err(3, "%s", name);
177                         break;
178                 }
179                 if (linebuf[0] == '#') {
180                         if (linebuf[1] == ' ' && isdigit(linebuf[2]))
181                                 printf("#line%s", &linebuf[1]);
182                         else
183                                 printf("%s", linebuf);
184                         continue;
185                 }
186                 for (cp = linebuf; (c = *cp++);) switch (c) {
187
188                 case '"':
189                         if (incomm)
190                                 goto def;
191                         if ((ret = (int) yankstr(&cp)) == -1)
192                                 goto out;
193                         printf("(&xstr[%d])", ret);
194                         break;
195
196                 case '\'':
197                         if (incomm)
198                                 goto def;
199                         putchar(c);
200                         if (*cp)
201                                 putchar(*cp++);
202                         break;
203
204                 case '/':
205                         if (incomm || *cp != '*')
206                                 goto def;
207                         incomm = 1;
208                         cp++;
209                         printf("/*");
210                         continue;
211
212                 case '*':
213                         if (incomm && *cp == '/') {
214                                 incomm = 0;
215                                 cp++;
216                                 printf("*/");
217                                 continue;
218                         }
219                         goto def;
220
221 def:
222                 default:
223                         putchar(c);
224                         break;
225                 }
226         }
227 out:
228         if (ferror(stdout))
229                 warn("x.c"), onintr(0);
230 }
231
232 off_t
233 yankstr(char **cpp)
234 {
235         char *cp = *cpp;
236         int c, ch;
237         char dbuf[BUFSIZ];
238         char *dp = dbuf;
239         char *tp;
240         static char tmp[] = "b\bt\tr\rn\nf\f\\\\\"\"";
241
242         while ((c = *cp++)) {
243                 if (dp == dbuf + sizeof(dbuf) - 3)
244                         errx(1, "message too long");
245                 switch (c) {
246
247                 case '"':
248                         cp++;
249                         goto out;
250
251                 case '\\':
252                         c = *cp++;
253                         if (c == 0)
254                                 break;
255                         if (c == '\n') {
256                                 if (fgets(linebuf, sizeof linebuf, stdin)
257                                     == NULL) {
258                                         if (ferror(stdin))
259                                                 err(3, "x.c");
260                                         return(-1);
261                                 }
262                                 cp = linebuf;
263                                 continue;
264                         }
265                         for (tp = tmp; (ch = *tp++); tp++)
266                                 if (c == ch) {
267                                         c = *tp;
268                                         goto gotc;
269                                 }
270                         if (!octdigit(c)) {
271                                 *dp++ = '\\';
272                                 break;
273                         }
274                         c -= '0';
275                         if (!octdigit(*cp))
276                                 break;
277                         c <<= 3, c += *cp++ - '0';
278                         if (!octdigit(*cp))
279                                 break;
280                         c <<= 3, c += *cp++ - '0';
281                         break;
282                 }
283 gotc:
284                 *dp++ = c;
285         }
286 out:
287         *cpp = --cp;
288         *dp = 0;
289         return (hashit(dbuf, 1));
290 }
291
292 int
293 octdigit(char c)
294 {
295         return (isdigit(c) && c != '8' && c != '9');
296 }
297
298 void
299 inithash(void)
300 {
301         char buf[BUFSIZ];
302         FILE *mesgread = fopen(strings, "r");
303
304         if (mesgread == NULL)
305                 return;
306         for (;;) {
307                 mesgpt = tellpt;
308                 if (fgetNUL(buf, sizeof buf, mesgread) == 0)
309                         break;
310                 ignore(hashit(buf, 0));
311         }
312         ignore(fclose(mesgread));
313 }
314
315 int
316 fgetNUL(char *obuf, int rmdr, FILE *file)
317 {
318         int c;
319         char *buf = obuf;
320
321         while (--rmdr > 0 && (c = xgetc(file)) != 0 && c != EOF)
322                 *buf++ = c;
323         *buf++ = 0;
324         return ((feof(file) || ferror(file)) ? 0 : 1);
325 }
326
327 int
328 xgetc(FILE *file)
329 {
330
331         tellpt++;
332         return (getc(file));
333 }
334
335 #define BUCKETS 128
336
337 struct  hash {
338         off_t   hpt;
339         char    *hstr;
340         struct  hash *hnext;
341         short   hnew;
342 } bucket[BUCKETS];
343
344 off_t
345 hashit(char *str, int new)
346 {
347         int i;
348         struct hash *hp, *hp0;
349
350         hp = hp0 = &bucket[lastchr(str) & 0177];
351         while (hp->hnext) {
352                 hp = hp->hnext;
353                 i = istail(str, hp->hstr);
354                 if (i >= 0)
355                         return (hp->hpt + i);
356         }
357         if ((hp = (struct hash *) calloc(1, sizeof (*hp))) == NULL)
358                 errx(8, "calloc");
359         hp->hpt = mesgpt;
360         if (!(hp->hstr = strdup(str)))
361                 err(1, NULL);
362         mesgpt += strlen(hp->hstr) + 1;
363         hp->hnext = hp0->hnext;
364         hp->hnew = new;
365         hp0->hnext = hp;
366         return (hp->hpt);
367 }
368
369 void
370 flushsh(void)
371 {
372         int i;
373         struct hash *hp;
374         FILE *mesgwrit;
375         int old = 0, new = 0;
376
377         for (i = 0; i < BUCKETS; i++)
378                 for (hp = bucket[i].hnext; hp != NULL; hp = hp->hnext)
379                         if (hp->hnew)
380                                 new++;
381                         else
382                                 old++;
383         if (new == 0 && old != 0)
384                 return;
385         mesgwrit = fopen(strings, old ? "r+" : "w");
386         if (mesgwrit == NULL)
387                 err(4, "%s", strings);
388         for (i = 0; i < BUCKETS; i++)
389                 for (hp = bucket[i].hnext; hp != NULL; hp = hp->hnext) {
390                         found(hp->hnew, hp->hpt, hp->hstr);
391                         if (hp->hnew) {
392                                 fseek(mesgwrit, hp->hpt, 0);
393                                 ignore(fwrite(hp->hstr, strlen(hp->hstr) + 1, 1, mesgwrit));
394                                 if (ferror(mesgwrit))
395                                         err(4, "%s", strings);
396                         }
397                 }
398         if (fclose(mesgwrit) == EOF)
399                 err(4, "%s", strings);
400 }
401
402 void
403 found(int new, off_t off, char *str)
404 {
405         if (vflg == 0)
406                 return;
407         if (!new)
408                 fprintf(stderr, "found at %d:", (int) off);
409         else
410                 fprintf(stderr, "new at %d:", (int) off);
411         prstr(str);
412         fprintf(stderr, "\n");
413 }
414
415 void
416 prstr(char *cp)
417 {
418         int c;
419
420         while ((c = (*cp++ & 0377)))
421                 if (c < ' ')
422                         fprintf(stderr, "^%c", c + '`');
423                 else if (c == 0177)
424                         fprintf(stderr, "^?");
425                 else if (c > 0200)
426                         fprintf(stderr, "\\%03o", c);
427                 else
428                         fprintf(stderr, "%c", c);
429 }
430
431 void
432 xsdotc(void)
433 {
434         FILE *strf = fopen(strings, "r");
435         FILE *xdotcf;
436
437         if (strf == NULL)
438                 err(5, "%s", strings);
439         xdotcf = fopen("xs.c", "w");
440         if (xdotcf == NULL)
441                 err(6, "xs.c");
442         fprintf(xdotcf, "char\txstr[] = {\n");
443         for (;;) {
444                 int i, c;
445
446                 for (i = 0; i < 8; i++) {
447                         c = getc(strf);
448                         if (ferror(strf)) {
449                                 warn("%s", strings);
450                                 onintr(0);
451                         }
452                         if (feof(strf)) {
453                                 fprintf(xdotcf, "\n");
454                                 goto out;
455                         }
456                         fprintf(xdotcf, "0x%02x,", c);
457                 }
458                 fprintf(xdotcf, "\n");
459         }
460 out:
461         fprintf(xdotcf, "};\n");
462         ignore(fclose(xdotcf));
463         ignore(fclose(strf));
464 }
465
466 char
467 lastchr(char *cp)
468 {
469
470         while (cp[0] && cp[1])
471                 cp++;
472         return (*cp);
473 }
474
475 int
476 istail(char *str, char *of)
477 {
478         int d = strlen(of) - strlen(str);
479
480         if (d < 0 || strcmp(&of[d], str) != 0)
481                 return (-1);
482         return (d);
483 }
484
485 void
486 onintr(int dummy __unused)
487 {
488
489         ignore(signal(SIGINT, SIG_IGN));
490         if (strings[0] == '/')
491                 ignore(unlink(strings));
492         ignore(unlink("x.c"));
493         ignore(unlink("xs.c"));
494         exit(7);
495 }