comparison src/tokenizer.cpp @ 0:0aa1171aebd2 stable-1-0-0

initial version
author Carl Byington <carl@five-ten-sg.com>
date Wed, 15 May 2013 13:15:59 -0700
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:0aa1171aebd2
1 /*
2
3 Copyright (c) 2007 Carl Byington - 510 Software Group, released under
4 the GPL version 3 or any later version at your choice available at
5 http://www.gnu.org/licenses/gpl-3.0.txt
6
7 */
8
9 // This version of the tokenizer does not force the config to lower
10 // case, to avoid lowercasing the iptables commands, which need some
11 // uppercase arguments. It also considers / to be a separate token
12 // since that is needed for the cidr style ignore statement.
13
14 #include "includes.h"
15
16 const int maxlen = 1000; // used for snprintf buffers
17
18 enum state {s_init,
19 s_token,
20 s_string,
21 s_ignore, // whitespace
22 s_eol, // ignore to eol
23 end_state,
24
25 s_term, // token terminator
26 s_single,
27 s_string1, // first " of string
28 s_string2, // last " of string
29 s_slash // possible start of ignore to eol
30 };
31
32 typedef state PARSE[end_state];
33
34 static PARSE parse_table[256] = {
35 // s_init s_token s_string s_ignore s_eol
36 { s_single, s_term, s_string, s_single, s_eol, }, // 0x00
37 { s_single, s_term, s_string, s_single, s_eol, }, // 0x01
38 { s_single, s_term, s_string, s_single, s_eol, }, // 0x02
39 { s_single, s_term, s_string, s_single, s_eol, }, // 0x03
40 { s_single, s_term, s_string, s_single, s_eol, }, // 0x04
41 { s_single, s_term, s_string, s_single, s_eol, }, // 0x05
42 { s_single, s_term, s_string, s_single, s_eol, }, // 0x06
43 { s_single, s_term, s_string, s_single, s_eol, }, // 0x07
44 { s_single, s_term, s_string, s_single, s_eol, }, // 0x08
45 { s_ignore, s_term, s_string, s_ignore, s_eol, }, // 0x09 <tab>
46 { s_ignore, s_term, s_string2, s_ignore, s_ignore, }, // 0x0a <lf>
47 { s_single, s_term, s_string, s_single, s_eol, }, // 0x0b
48 { s_single, s_term, s_string, s_single, s_eol, }, // 0x0c
49 { s_ignore, s_term, s_string2, s_ignore, s_eol, }, // 0x0d <cr>
50 { s_single, s_term, s_string, s_single, s_eol, }, // 0x0e
51 { s_single, s_term, s_string, s_single, s_eol, }, // 0x0f
52 { s_single, s_term, s_string, s_single, s_eol, }, // 0x10
53 { s_single, s_term, s_string, s_single, s_eol, }, // 0x11 xon char
54 { s_single, s_term, s_string, s_single, s_eol, }, // 0x12
55 { s_single, s_term, s_string, s_single, s_eol, }, // 0x13 xoff char
56 { s_single, s_term, s_string, s_single, s_eol, }, // 0x14
57 { s_single, s_term, s_string, s_single, s_eol, }, // 0x15
58 { s_single, s_term, s_string, s_single, s_eol, }, // 0x16
59 { s_single, s_term, s_string, s_single, s_eol, }, // 0x17
60 { s_single, s_term, s_string, s_single, s_eol, }, // 0x18
61 { s_single, s_term, s_string, s_single, s_eol, }, // 0x19
62 { s_single, s_term, s_string, s_single, s_eol, }, // 0x1a
63 { s_single, s_term, s_string, s_single, s_eol, }, // 0x1b
64 { s_single, s_term, s_string, s_single, s_eol, }, // 0x1c
65 { s_single, s_term, s_string, s_single, s_eol, }, // 0x1d
66 { s_single, s_term, s_string, s_single, s_eol, }, // 0x1e
67 { s_single, s_term, s_string, s_single, s_eol, }, // 0x1f
68 { s_ignore, s_term, s_string, s_ignore, s_eol, }, // 0x20 space
69 { s_single, s_term, s_string, s_single, s_eol, }, // 0x21 !
70 { s_string1, s_term, s_string2, s_string1, s_eol, }, // 0x22 "
71 { s_eol, s_term, s_string, s_eol, s_eol, }, // 0x23 #
72 { s_single, s_term, s_string, s_single, s_eol, }, // 0x24 $
73 { s_single, s_term, s_string, s_single, s_eol, }, // 0x25 %
74 { s_single, s_term, s_string, s_single, s_eol, }, // 0x26 &
75 { s_single, s_term, s_string, s_single, s_eol, }, // 0x27 '
76 { s_single, s_term, s_string, s_single, s_eol, }, // 0x28 (
77 { s_single, s_term, s_string, s_single, s_eol, }, // 0x29 )
78 { s_single, s_term, s_string, s_single, s_eol, }, // 0x2A *
79 { s_single, s_token, s_string, s_single, s_eol, }, // 0x2B +
80 { s_single, s_term, s_string, s_single, s_eol, }, // 0x2C ,
81 { s_single, s_token, s_string, s_single, s_eol, }, // 0x2D -
82 { s_single, s_token, s_string, s_single, s_eol, }, // 0x2E .
83 { s_slash, s_term, s_string, s_slash, s_eol, }, // 0x2F /
84 { s_token, s_token, s_string, s_token, s_eol, }, // 0x30 0
85 { s_token, s_token, s_string, s_token, s_eol, }, // 0x31 1
86 { s_token, s_token, s_string, s_token, s_eol, }, // 0x32 2
87 { s_token, s_token, s_string, s_token, s_eol, }, // 0x33 3
88 { s_token, s_token, s_string, s_token, s_eol, }, // 0x34 4
89 { s_token, s_token, s_string, s_token, s_eol, }, // 0x35 5
90 { s_token, s_token, s_string, s_token, s_eol, }, // 0x36 6
91 { s_token, s_token, s_string, s_token, s_eol, }, // 0x37 7
92 { s_token, s_token, s_string, s_token, s_eol, }, // 0x38 8
93 { s_token, s_token, s_string, s_token, s_eol, }, // 0x39 9
94 { s_single, s_term, s_string, s_single, s_eol, }, // 0x3A :
95 { s_single, s_term, s_string, s_single, s_eol, }, // 0x3B ;
96 { s_single, s_term, s_string, s_single, s_eol, }, // 0x3C <
97 { s_single, s_token, s_string, s_single, s_eol, }, // 0x3D =
98 { s_single, s_term, s_string, s_single, s_eol, }, // 0x3E >
99 { s_single, s_term, s_string, s_single, s_eol, }, // 0x3F ?
100 { s_single, s_token, s_string, s_single, s_eol, }, // 0x40 @
101 { s_token, s_token, s_string, s_token, s_eol, }, // 0x41 A
102 { s_token, s_token, s_string, s_token, s_eol, }, // 0x42 B
103 { s_token, s_token, s_string, s_token, s_eol, }, // 0x43 C
104 { s_token, s_token, s_string, s_token, s_eol, }, // 0x44 D
105 { s_token, s_token, s_string, s_token, s_eol, }, // 0x45 E
106 { s_token, s_token, s_string, s_token, s_eol, }, // 0x46 F
107 { s_token, s_token, s_string, s_token, s_eol, }, // 0x47 G
108 { s_token, s_token, s_string, s_token, s_eol, }, // 0x48 H
109 { s_token, s_token, s_string, s_token, s_eol, }, // 0x49 I
110 { s_token, s_token, s_string, s_token, s_eol, }, // 0x4A J
111 { s_token, s_token, s_string, s_token, s_eol, }, // 0x4B K
112 { s_token, s_token, s_string, s_token, s_eol, }, // 0x4C L
113 { s_token, s_token, s_string, s_token, s_eol, }, // 0x4D M
114 { s_token, s_token, s_string, s_token, s_eol, }, // 0x4E N
115 { s_token, s_token, s_string, s_token, s_eol, }, // 0x4F O
116 { s_token, s_token, s_string, s_token, s_eol, }, // 0x50 P
117 { s_token, s_token, s_string, s_token, s_eol, }, // 0x51 Q
118 { s_token, s_token, s_string, s_token, s_eol, }, // 0x52 R
119 { s_token, s_token, s_string, s_token, s_eol, }, // 0x53 S
120 { s_token, s_token, s_string, s_token, s_eol, }, // 0x54 T
121 { s_token, s_token, s_string, s_token, s_eol, }, // 0x55 U
122 { s_token, s_token, s_string, s_token, s_eol, }, // 0x56 V
123 { s_token, s_token, s_string, s_token, s_eol, }, // 0x57 W
124 { s_token, s_token, s_string, s_token, s_eol, }, // 0x58 X
125 { s_token, s_token, s_string, s_token, s_eol, }, // 0x59 Y
126 { s_token, s_token, s_string, s_token, s_eol, }, // 0x5A Z
127 { s_single, s_term, s_string, s_single, s_eol, }, // 0x5B [
128 { s_single, s_term, s_string, s_single, s_eol, }, // 0x5C backslash
129 { s_single, s_term, s_string, s_single, s_eol, }, // 0x5D ]
130 { s_single, s_term, s_string, s_single, s_eol, }, // 0x5E ^
131 { s_single, s_token, s_string, s_single, s_eol, }, // 0x5F _
132 { s_single, s_term, s_string, s_single, s_eol, }, // 0x60 `
133 { s_token, s_token, s_string, s_token, s_eol, }, // 0x61 a
134 { s_token, s_token, s_string, s_token, s_eol, }, // 0x62 b
135 { s_token, s_token, s_string, s_token, s_eol, }, // 0x63 c
136 { s_token, s_token, s_string, s_token, s_eol, }, // 0x64 d
137 { s_token, s_token, s_string, s_token, s_eol, }, // 0x65 e
138 { s_token, s_token, s_string, s_token, s_eol, }, // 0x66 f
139 { s_token, s_token, s_string, s_token, s_eol, }, // 0x67 g
140 { s_token, s_token, s_string, s_token, s_eol, }, // 0x68 h
141 { s_token, s_token, s_string, s_token, s_eol, }, // 0x69 i
142 { s_token, s_token, s_string, s_token, s_eol, }, // 0x6A j
143 { s_token, s_token, s_string, s_token, s_eol, }, // 0x6B k
144 { s_token, s_token, s_string, s_token, s_eol, }, // 0x6C l
145 { s_token, s_token, s_string, s_token, s_eol, }, // 0x6D m
146 { s_token, s_token, s_string, s_token, s_eol, }, // 0x6E n
147 { s_token, s_token, s_string, s_token, s_eol, }, // 0x6F o
148 { s_token, s_token, s_string, s_token, s_eol, }, // 0x70 p
149 { s_token, s_token, s_string, s_token, s_eol, }, // 0x71 q
150 { s_token, s_token, s_string, s_token, s_eol, }, // 0x72 r
151 { s_token, s_token, s_string, s_token, s_eol, }, // 0x73 s
152 { s_token, s_token, s_string, s_token, s_eol, }, // 0x74 t
153 { s_token, s_token, s_string, s_token, s_eol, }, // 0x75 u
154 { s_token, s_token, s_string, s_token, s_eol, }, // 0x76 v
155 { s_token, s_token, s_string, s_token, s_eol, }, // 0x77 w
156 { s_token, s_token, s_string, s_token, s_eol, }, // 0x78 x
157 { s_token, s_token, s_string, s_token, s_eol, }, // 0x79 y
158 { s_token, s_token, s_string, s_token, s_eol, }, // 0x7A z
159 { s_single, s_term, s_string, s_single, s_eol, }, // 0x7B {
160 { s_single, s_term, s_string, s_single, s_eol, }, // 0x7C |
161 { s_single, s_term, s_string, s_single, s_eol, }, // 0x7D }
162 { s_single, s_term, s_string, s_single, s_eol, }, // 0x7E ~
163 { s_single, s_term, s_string, s_single, s_eol, }, // 0x7f
164 { s_single, s_term, s_string, s_single, s_eol, }, // 0x80
165 { s_single, s_term, s_string, s_single, s_eol, }, // 0x81
166 { s_single, s_term, s_string, s_single, s_eol, }, // 0x82
167 { s_single, s_term, s_string, s_single, s_eol, }, // 0x83
168 { s_single, s_term, s_string, s_single, s_eol, }, // 0x84
169 { s_single, s_term, s_string, s_single, s_eol, }, // 0x85
170 { s_single, s_term, s_string, s_single, s_eol, }, // 0x86
171 { s_single, s_term, s_string, s_single, s_eol, }, // 0x87
172 { s_single, s_term, s_string, s_single, s_eol, }, // 0x88
173 { s_single, s_term, s_string, s_single, s_eol, }, // 0x89
174 { s_single, s_term, s_string, s_single, s_eol, }, // 0x8a
175 { s_single, s_term, s_string, s_single, s_eol, }, // 0x8b
176 { s_single, s_term, s_string, s_single, s_eol, }, // 0x8c
177 { s_single, s_term, s_string, s_single, s_eol, }, // 0x8d
178 { s_single, s_term, s_string, s_single, s_eol, }, // 0x8e
179 { s_single, s_term, s_string, s_single, s_eol, }, // 0x8f
180 { s_single, s_term, s_string, s_single, s_eol, }, // 0x90
181 { s_single, s_term, s_string, s_single, s_eol, }, // 0x91
182 { s_single, s_term, s_string, s_single, s_eol, }, // 0x92
183 { s_single, s_term, s_string, s_single, s_eol, }, // 0x93
184 { s_single, s_term, s_string, s_single, s_eol, }, // 0x94
185 { s_single, s_term, s_string, s_single, s_eol, }, // 0x95
186 { s_single, s_term, s_string, s_single, s_eol, }, // 0x96
187 { s_single, s_term, s_string, s_single, s_eol, }, // 0x97
188 { s_single, s_term, s_string, s_single, s_eol, }, // 0x98
189 { s_single, s_term, s_string, s_single, s_eol, }, // 0x99
190 { s_single, s_term, s_string, s_single, s_eol, }, // 0x9a
191 { s_single, s_term, s_string, s_single, s_eol, }, // 0x9b
192 { s_single, s_term, s_string, s_single, s_eol, }, // 0x9c
193 { s_single, s_term, s_string, s_single, s_eol, }, // 0x9d
194 { s_single, s_term, s_string, s_single, s_eol, }, // 0x9e
195 { s_single, s_term, s_string, s_single, s_eol, }, // 0x9f
196 { s_single, s_term, s_string, s_single, s_eol, }, // 0xa0
197 { s_single, s_term, s_string, s_single, s_eol, }, // 0xa1
198 { s_single, s_term, s_string, s_single, s_eol, }, // 0xa2
199 { s_single, s_term, s_string, s_single, s_eol, }, // 0xa3
200 { s_single, s_term, s_string, s_single, s_eol, }, // 0xa4
201 { s_single, s_term, s_string, s_single, s_eol, }, // 0xa5
202 { s_single, s_term, s_string, s_single, s_eol, }, // 0xa6
203 { s_single, s_term, s_string, s_single, s_eol, }, // 0xa7
204 { s_single, s_term, s_string, s_single, s_eol, }, // 0xa8
205 { s_single, s_term, s_string, s_single, s_eol, }, // 0xa9
206 { s_single, s_term, s_string, s_single, s_eol, }, // 0xaa
207 { s_single, s_term, s_string, s_single, s_eol, }, // 0xab
208 { s_single, s_term, s_string, s_single, s_eol, }, // 0xac
209 { s_single, s_term, s_string, s_single, s_eol, }, // 0xad
210 { s_single, s_term, s_string, s_single, s_eol, }, // 0xae
211 { s_single, s_term, s_string, s_single, s_eol, }, // 0xaf
212 { s_single, s_term, s_string, s_single, s_eol, }, // 0xb0
213 { s_single, s_term, s_string, s_single, s_eol, }, // 0xb1
214 { s_single, s_term, s_string, s_single, s_eol, }, // 0xb2
215 { s_single, s_term, s_string, s_single, s_eol, }, // 0xb3
216 { s_single, s_term, s_string, s_single, s_eol, }, // 0xb4
217 { s_single, s_term, s_string, s_single, s_eol, }, // 0xb5
218 { s_single, s_term, s_string, s_single, s_eol, }, // 0xb6
219 { s_single, s_term, s_string, s_single, s_eol, }, // 0xb7
220 { s_single, s_term, s_string, s_single, s_eol, }, // 0xb8
221 { s_single, s_term, s_string, s_single, s_eol, }, // 0xb9
222 { s_single, s_term, s_string, s_single, s_eol, }, // 0xba
223 { s_single, s_term, s_string, s_single, s_eol, }, // 0xbb
224 { s_single, s_term, s_string, s_single, s_eol, }, // 0xbc
225 { s_single, s_term, s_string, s_single, s_eol, }, // 0xbd
226 { s_single, s_term, s_string, s_single, s_eol, }, // 0xbe
227 { s_single, s_term, s_string, s_single, s_eol, }, // 0xbf
228 { s_single, s_term, s_string, s_single, s_eol, }, // 0xc0
229 { s_single, s_term, s_string, s_single, s_eol, }, // 0xc1
230 { s_single, s_term, s_string, s_single, s_eol, }, // 0xc2
231 { s_single, s_term, s_string, s_single, s_eol, }, // 0xc3
232 { s_single, s_term, s_string, s_single, s_eol, }, // 0xc4
233 { s_single, s_term, s_string, s_single, s_eol, }, // 0xc5
234 { s_single, s_term, s_string, s_single, s_eol, }, // 0xc6
235 { s_single, s_term, s_string, s_single, s_eol, }, // 0xc7
236 { s_single, s_term, s_string, s_single, s_eol, }, // 0xc8
237 { s_single, s_term, s_string, s_single, s_eol, }, // 0xc9
238 { s_single, s_term, s_string, s_single, s_eol, }, // 0xca
239 { s_single, s_term, s_string, s_single, s_eol, }, // 0xcb
240 { s_single, s_term, s_string, s_single, s_eol, }, // 0xcc
241 { s_single, s_term, s_string, s_single, s_eol, }, // 0xcd
242 { s_single, s_term, s_string, s_single, s_eol, }, // 0xce
243 { s_single, s_term, s_string, s_single, s_eol, }, // 0xcf
244 { s_single, s_term, s_string, s_single, s_eol, }, // 0xd0
245 { s_single, s_term, s_string, s_single, s_eol, }, // 0xd1
246 { s_single, s_term, s_string, s_single, s_eol, }, // 0xd2
247 { s_single, s_term, s_string, s_single, s_eol, }, // 0xd3
248 { s_single, s_term, s_string, s_single, s_eol, }, // 0xd4
249 { s_single, s_term, s_string, s_single, s_eol, }, // 0xd5
250 { s_single, s_term, s_string, s_single, s_eol, }, // 0xd6
251 { s_single, s_term, s_string, s_single, s_eol, }, // 0xd7
252 { s_single, s_term, s_string, s_single, s_eol, }, // 0xd8
253 { s_single, s_term, s_string, s_single, s_eol, }, // 0xd9
254 { s_single, s_term, s_string, s_single, s_eol, }, // 0xda
255 { s_single, s_term, s_string, s_single, s_eol, }, // 0xdb
256 { s_single, s_term, s_string, s_single, s_eol, }, // 0xdc
257 { s_single, s_term, s_string, s_single, s_eol, }, // 0xdd
258 { s_single, s_term, s_string, s_single, s_eol, }, // 0xde
259 { s_single, s_term, s_string, s_single, s_eol, }, // 0xdf
260 { s_single, s_term, s_string, s_single, s_eol, }, // 0xe0
261 { s_single, s_term, s_string, s_single, s_eol, }, // 0xe1
262 { s_single, s_term, s_string, s_single, s_eol, }, // 0xe2
263 { s_single, s_term, s_string, s_single, s_eol, }, // 0xe3
264 { s_single, s_term, s_string, s_single, s_eol, }, // 0xe4
265 { s_single, s_term, s_string, s_single, s_eol, }, // 0xe5
266 { s_single, s_term, s_string, s_single, s_eol, }, // 0xe6
267 { s_single, s_term, s_string, s_single, s_eol, }, // 0xe7
268 { s_single, s_term, s_string, s_single, s_eol, }, // 0xe8
269 { s_single, s_term, s_string, s_single, s_eol, }, // 0xe9
270 { s_single, s_term, s_string, s_single, s_eol, }, // 0xea
271 { s_single, s_term, s_string, s_single, s_eol, }, // 0xeb
272 { s_single, s_term, s_string, s_single, s_eol, }, // 0xec
273 { s_single, s_term, s_string, s_single, s_eol, }, // 0xed
274 { s_single, s_term, s_string, s_single, s_eol, }, // 0xee
275 { s_single, s_term, s_string, s_single, s_eol, }, // 0xef
276 { s_single, s_term, s_string, s_single, s_eol, }, // 0xf0
277 { s_single, s_term, s_string, s_single, s_eol, }, // 0xf1
278 { s_single, s_term, s_string, s_single, s_eol, }, // 0xf2
279 { s_single, s_term, s_string, s_single, s_eol, }, // 0xf3
280 { s_single, s_term, s_string, s_single, s_eol, }, // 0xf4
281 { s_single, s_term, s_string, s_single, s_eol, }, // 0xf5
282 { s_single, s_term, s_string, s_single, s_eol, }, // 0xf6
283 { s_single, s_term, s_string, s_single, s_eol, }, // 0xf7
284 { s_single, s_term, s_string, s_single, s_eol, }, // 0xf8
285 { s_single, s_term, s_string, s_single, s_eol, }, // 0xf9
286 { s_single, s_term, s_string, s_single, s_eol, }, // 0xfa
287 { s_single, s_term, s_string, s_single, s_eol, }, // 0xfb
288 { s_single, s_term, s_string, s_single, s_eol, }, // 0xfc
289 { s_single, s_term, s_string, s_single, s_eol, }, // 0xfd
290 { s_single, s_term, s_string, s_single, s_eol, }, // 0xfe
291 { s_single, s_term, s_string, s_single, s_eol, }, // 0xff
292 };
293
294
295 TOKEN::TOKEN(const char *fn, string_set *includes) {
296 pushed = false;
297 include_files = includes;
298 include(fn);
299 }
300
301
302 TOKEN::~TOKEN() {
303 while (!streams.empty()) pop();
304 }
305
306
307 void TOKEN::pop() {
308 ifstream *is = streams.front();
309 const char *fn = filenames.front();
310 streams.pop_front();
311 filenamess.erase(fn);
312 if (filenames.size() > 1) filenames.pop_front();
313 if (linenumbers.size() > 1) linenumbers.pop_front();
314 is->close();
315 delete is;
316 }
317
318
319 void TOKEN::push_char(u_char c) {
320 pushed = true;
321 pushed_char = c;
322 }
323
324
325 bool TOKEN::next_char(u_char &uc) {
326 if (pushed) {
327 uc = pushed_char;
328 pushed = false;
329 return true;
330 }
331 while (!streams.empty() && streams.front()->eof()) {
332 pop();
333 }
334 if (streams.empty()) return false;
335 ifstream *is = streams.front();
336 uc = (u_char)is->get();
337 if (is->eof()) return next_char(uc);
338 if (uc == (u_char)'\n') {
339 int &line = linenumbers.front();
340 line++;
341 }
342 return true;
343 }
344
345
346 bool TOKEN::include(const char *fn) {
347 string_set::iterator i = filenamess.find(fn);
348 if (i != filenamess.end()) {
349 token_error("redundant or recursive include file detected");
350 return false;
351 }
352 ifstream *is = new ifstream;
353 is->open(fn);
354 if (is->fail()) {
355 char buf[maxlen];
356 snprintf(buf, sizeof(buf), "include file %s not found", fn);
357 token_error(buf);
358 return false;
359 }
360 string_set &inc = *include_files;
361 inc.insert(fn);
362 streams.push_front(is);
363 filenames.push_front(fn);
364 filenamess.insert(fn);
365 linenumbers.push_front(1);
366 return true;
367 }
368
369
370 const char *TOKEN::next() {
371 if (!pending_tokens.empty()) {
372 const char *t = pending_tokens.front();
373 pending_tokens.pop_front();
374 return t;
375 }
376 if (streams.empty()) return NULL;
377 const int PENDING_LIMIT = 1000;
378 u_char buffer[PENDING_LIMIT];
379 int count = 0;
380 state st = s_init;
381 while (true) {
382 if (count == (PENDING_LIMIT-1)) {
383 token_error("token too long");
384 break;
385 }
386 if (st >= end_state) {
387 token_error("finite state machine error");
388 break;
389 }
390 u_char c;
391 if (!next_char(c)) break;
392 st = parse_table[c][st];
393 switch (st) {
394 case s_string:
395 case s_token: {
396 buffer[count++] = c;
397 } break;
398
399 case s_term: {
400 push_char(c);
401 st = s_init;
402 } break;
403
404 case s_string1: {
405 st = s_string;
406 } break;
407
408 case s_string2: {
409 st = s_init;
410 } break;
411
412 case s_single: {
413 buffer[count++] = c;
414 st = s_init;
415 } break;
416
417 case s_ignore:
418 case s_eol: {
419 } break;
420
421
422 case s_slash: {
423 buffer[count++] = c;
424 if (next_char(c)) {
425 if (c == (u_char)'/') {
426 // start of ignore to eol on //
427 count--;
428 st = s_eol;
429 }
430 else {
431 // not a // token, just return this single /
432 push_char(c);
433 st = s_init;
434 }
435 }
436 else {
437 // cannot get another char
438 st = s_init;
439 }
440 } break;
441
442 default: {
443 token_error();
444 token_error("unknown state %d %s", st, " ");
445 } break;
446 }
447 if (st == s_init) break;
448 }
449
450 buffer[count] = '\0';
451 if (count == 0) return NULL;
452 const char *t = register_string((char*)buffer);
453 if (t == token_include) {
454 const char *f = next(); // should be file name
455 const char *s = next(); // should be semicolon
456 if (s == token_semi) {
457 include(f);
458 return next();
459 }
460 else {
461 push(s);
462 push(f);
463 return t;
464 }
465 }
466 return t;
467 }
468
469
470 int TOKEN::nextint() {
471 const char *t = next();
472 char *e;
473 long i = strtol(t, &e, 10);
474 if (*e != '\0') {
475 token_error("integer", t);
476 return 0;
477 }
478 return (int)i;
479 }
480
481
482 void TOKEN::skipeol() {
483 while (true) {
484 u_char c;
485 if (!next_char(c)) break;
486 if (c == (u_char)'\n') break;
487 }
488 }
489
490
491 void TOKEN::token_error(const char *err) {
492 token_error();
493 char buf[maxlen];
494 snprintf(buf, sizeof(buf), "%s \n", err);
495 my_syslog(buf);
496 }
497
498
499 void TOKEN::token_error(const char *fmt, int d, const char *s) {
500 char buf[maxlen];
501 snprintf(buf, sizeof(buf), fmt, d, s);
502 my_syslog(buf);
503 }
504
505
506 void TOKEN::token_error(const char *fmt, const char *t, const char *h) {
507 if (!h) h = "null";
508 char buf[maxlen];
509 snprintf(buf, sizeof(buf), fmt, t, h);
510 my_syslog(buf);
511 }
512
513
514 void TOKEN::token_error(const char *want, const char *have) {
515 token_error();
516 token_error("expecting %s, found %s", want, have);
517 }
518
519
520 void TOKEN::token_error() {
521 token_error("syntax error at line %d in file %s -- ", cur_line(), cur_fn());
522 line_list::iterator j = linenumbers.begin();
523 string_list::const_iterator i = filenames.begin();
524 for (; i!=filenames.end(); i++,j++) {
525 if (i != filenames.begin()) {
526 const char *fn = (*i);
527 int li = (*j);
528 token_error(" included from line %d in file %s -- ", li, fn);
529 }
530 }
531 }
532