3 * Copyright (c) 2011 James Gritton
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 * 2. Redistributions in binary form must reproduce the above copyright
12 * notice, this list of conditions and the following disclaimer in the
13 * documentation and/or other materials provided with the distribution.
15 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
28 #include <sys/cdefs.h>
29 __FBSDID("$FreeBSD$");
41 static ssize_t text2lval(size_t triml, size_t trimr, int tovar);
44 static int lineno = 1;
46 #define YY_DECL int yylex(void)
56 /* Whitespace or equivalent */
60 <_>\/\*([^*]|(\*+([^*\/])))*\*+\/ {
63 for (s = yytext; s < yytext + yyleng; s++)
83 /* Atomic (unquoted) strings */
84 <_,DQ>[A-Za-z0-9_!%&()\-.:<>?@\[\]^`|~]+ |
85 <_,DQ>\\(.|\n|[0-7]{1,3}|x[0-9A-Fa-f]{1,2}) |
87 (void)text2lval(0, 0, 0);
88 return instr ? STR1 : (instr = 1, STR);
91 /* Single and double quoted strings */
92 <_>'([^\'\\]|\\(.|\n))*' {
93 (void)text2lval(1, 1, 0);
94 return instr ? STR1 : (instr = 1, STR);
96 <_>\"([^"\\]|\\(.|\n))*\" |
97 <DQ>[^\"$\\]([^"\\]|\\(.|\n))*\" {
101 skip = yytext[0] == '"' ? 1 : 0;
102 atvar = text2lval(skip, 1, 1);
107 * The string has a variable inside it.
108 * Go into DQ mode to get the variable
109 * and then the rest of the string.
114 return instr ? STR1 : (instr = 1, STR);
118 /* Variables, single-word or bracketed */
119 <_,DQ>$[A-Za-z_][A-Za-z_0-9]* {
120 (void)text2lval(1, 0, 0);
121 return instr ? VAR1 : (instr = 1, VAR);
123 <_>$\{([^\n{}]|\\(.|\n))*\} |
124 <DQ>$\{([^\n\"{}]|\\(.|\n))*\} {
125 (void)text2lval(2, 1, 0);
126 return instr ? VAR1 : (instr = 1, VAR);
129 /* Partially formed bits worth complaining about */
130 <_>\/\*([^*]|(\*+([^*\/])))*\** {
131 warnx("%s line %d: unterminated comment",
135 <_>'([^\n'\\]|\\.)* |
136 <_>\"([^\n\"\\]|\\.)* {
137 warnx("%s line %d: unterminated string",
141 <_>$\{([^\n{}]|\\.)* |
142 <DQ>$\{([^\n\"{}]|\\.)* {
143 warnx("%s line %d: unterminated variable",
148 /* A hack because "<0>" rules aren't allowed */
149 <_>. return yytext[0];
/*
 * Parser error reporter: prints a diagnostic with warnx, prefixed by the
 * configuration file name (cfname).  Three message shapes are used:
 *   - file name, line number and the message s;
 *   - file name and a fixed "unexpected EOF" notice;
 *   - file name, line number, the current token text (yytext) and s.
 * NOTE(review): the conditions that choose between the three are not
 * visible in this excerpt -- confirm against the full function.
 */
158 yyerror(const char *s)
161 warnx("%s line %d: %s", cfname, lineno, s);
163 warnx("%s: unexpected EOF", cfname);
165 warnx("%s line %d: %s: %s", cfname, lineno, yytext, s);
169 * Copy string from yytext to yylval, handling backslash escapes,
170 * and optionally stopping at the beginning of a variable.
173 text2lval(size_t triml, size_t trimr, int tovar)
/*
 * triml/trimr are the number of bytes to drop from the front/back of the
 * token (e.g. surrounding quotes or "${" and "}"); tovar asks for the copy
 * to take note of a '$' that begins a variable.
 * The output buffer is sized to the trimmed token length plus one byte.
 */
178 yylval.cs = d = emalloc(yyleng - trimr - triml + 1);
179 se = yytext + (yyleng - trimr);
180 for (s = yytext + triml; s < se; s++, d++) {
/* With tovar set, a '$' marks where a variable begins. */
182 if (tovar && *s == '$') {
/*
 * Octal escape: one to three digits in 0-7.  Each look-ahead is bounded
 * by se so the scan never reads past the trimmed token.
 */
192 if (*s >= '0' && *s <= '7') {
194 if (s + 1 < se && s[1] >= '0' && s[1] <= '7') {
195 *d = 010 * *d + (*++s - '0');
196 if (s + 1 < se && s[1] >= '0' && s[1] <= '7')
197 *d = 010 * *d + (*++s - '0');
/*
 * Single-character escapes.  An escaped newline produces no output:
 * d is stepped back to cancel the loop's d++, and lineno is advanced.
 */
202 case 'a': *d = '\a'; break;
203 case 'b': *d = '\b'; break;
204 case 'f': *d = '\f'; break;
205 case 'n': *d = '\n'; break;
206 case 'r': *d = '\r'; break;
207 case 't': *d = '\t'; break;
208 case 'v': *d = '\v'; break;
209 case '\n': d--; lineno++; break;
210 default: *d = *s; break;
/*
 * Hex escape, first digit.  The scanner rule accepts [0-9A-Fa-f], so the
 * lower-case range must run 'a'..'f' just like the upper-case 'A'..'F'
 * branch; testing only 'a' mis-decoded \xb through \xf.
 */
215 if (s[1] >= '0' && s[1] <= '9')
217 else if (s[1] >= 'A' && s[1] <= 'F')
218 *d = *++s + (0xA - 'A');
219 else if (s[1] >= 'a' && s[1] <= 'f')
220 *d = *++s + (0xa - 'a');
/*
 * Optional second hex digit: shift the first nibble up and add this one.
 * Same 'a'..'f' range as above so values such as \x1f decode fully.
 */
225 if (s[1] >= '0' && s[1] <= '9')
226 *d = *d * 0x10 + (*++s - '0');
227 else if (s[1] >= 'A' && s[1] <= 'F')
228 *d = *d * 0x10 + (*++s + (0xA - 'A'));
229 else if (s[1] >= 'a' && s[1] <= 'f')
230 *d = *d * 0x10 + (*++s + (0xa - 'a'));