3 %option outfile="dtd_parse.c"
4 %option prefix="Dtd_Parse_"
5 %option never-interactive
10 * an XML dissector for ethereal
11 * lexical analyzer for DTDs
13 * Copyright 2004, Luis E. Garcia Ontanon <luis.ontanon@gmail.com>
17 * Ethereal - Network traffic analyzer
18 * By Gerald Combs <gerald@ethereal.com>
19 * Copyright 1998 Gerald Combs
21 * This program is free software; you can redistribute it and/or
22 * modify it under the terms of the GNU General Public License
23 * as published by the Free Software Foundation; either version 2
24 * of the License, or (at your option) any later version.
26 * This program is distributed in the hope that it will be useful,
27 * but WITHOUT ANY WARRANTY; without even the implied warranty of
28 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
29 * GNU General Public License for more details.
31 * You should have received a copy of the GNU General Public License
32 * along with this program; if not, write to the Free Software
33 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
40 #include "dtd_grammar.h"
41 #include "dtd_parse.h"
43 struct _proto_xmlpi_attr {
49 GString* input_string;
55 static int my_yyinput(char* buff,guint size);
57 static dtd_token_data_t* new_token(gchar*);
59 static dtd_build_data_t* build_data;
61 static void set_proto_name (gchar* val) { if(build_data->proto_name) g_free(build_data->proto_name); build_data->proto_name = g_strdup(val); }
62 static void set_media_type (gchar* val) { if(build_data->media_type) g_free(build_data->media_type); build_data->media_type = g_strdup(val); }
63 static void set_proto_root (gchar* val) { if(build_data->proto_root) g_free(build_data->proto_root); build_data->proto_root = g_strdup(val); }
64 static void set_description (gchar* val) { if(build_data->description) g_free(build_data->description); build_data->description = g_strdup(val); }
65 static void set_recursive (gchar* val) { build_data->recursion = ( g_strcasecmp(val,"yes") == 0 ) ? TRUE : FALSE; }
67 struct _proto_xmlpi_attr proto_attrs[] =
69 { "proto_name", set_proto_name },
70 { "media", set_media_type },
71 { "root", set_proto_root },
72 { "description", set_description },
73 { "hierarchy", set_recursive },
77 #ifdef DEBUG_DTD_PARSER
78 #define DEBUG_DTD_TOKEN fprintf(stderr,"->%s (%i)%s\n",location,token_type,yytext)
80 #define DEBUG_DTD_TOKEN
83 #define DTD_PARSE(token_type) \
85 build_data->location = location; \
86 DtdParse(pParser, (token_type), new_token(yytext), build_data); \
87 if(build_data->error->len > 0) yyterminate(); \
/*
 * Override of the scanner's input macro: hands the scanner's buffer and
 * its capacity to my_yyinput() and stores that function's return value
 * in bytes_read.
 */
#define YY_INPUT(buf,bytes_read,capacity) \
	( (bytes_read) = my_yyinput((buf),(capacity)) )
100 location_xmlpi "ethereal:location"
101 protocol_xmlpi "ethereal:protocol"
/*
 * An equals sign, optional blanks, then the opening double quote of an
 * attribute value.  The POSIX class name has to sit inside a bracket
 * expression; written bare, [:blank:] is an ordinary character set that
 * matches only the literal characters : b l a n k, so blanks after the
 * equals sign were never accepted.
 */
get_attr_quote =[[:blank:]]*["]
106 get_location_xmlpi [^[:blank:]]+
112 whitespace [[:blank:]\r\n]+
149 name [a-z][-a-zA-Z0-9_]*
153 %START DTD XMLPI LOCATION DONE PROTOCOL GET_ATTR_QUOTE GET_ATTR_VAL GET_ATTR_CLOSE_QUOTE IN_COMMENT
159 <DTD>{comment_start} { BEGIN IN_COMMENT; }
162 <IN_COMMENT>{comment_stop} { BEGIN DTD; }
168 <XMLPI>{location_xmlpi} {
169 if(location) g_free(location);
173 <XMLPI>{protocol_xmlpi} {
178 <XMLPI>{stop_xmlpi} BEGIN DTD;
180 <LOCATION>{get_location_xmlpi} {
181 location = g_strdup(yytext);
185 <DONE>{stop_xmlpi} BEGIN DTD;
188 attr_name = g_strdup(yytext);
189 g_strdown(attr_name);
190 BEGIN GET_ATTR_QUOTE;
193 <GET_ATTR_QUOTE>{get_attr_quote} { BEGIN GET_ATTR_VAL; }
196 g_string_sprintfa(build_data->error,
197 "error in ethereal:protocol xmpli at %s : could not find attribute value!",
202 <GET_ATTR_VAL>[^"]+ {
204 struct _proto_xmlpi_attr* pa;
205 gboolean got_it = FALSE;
207 for(pa = proto_attrs; pa->name; pa++) {
208 if (g_strcasecmp(attr_name,pa->name) == 0) {
216 g_string_sprintfa(build_data->error,
217 "error in ethereal:protocol xmpli at %s : no such parameter %s!",
218 location, attr_name);
225 BEGIN GET_ATTR_CLOSE_QUOTE;
228 <GET_ATTR_CLOSE_QUOTE>{dquote} { BEGIN PROTOCOL;}
230 <PROTOCOL>{stop_xmlpi} BEGIN DTD;
<DTD>{special_start}	{ DTD_PARSE(TOKEN_TAG_START); }
<DTD>{special_stop}	{ DTD_PARSE(TOKEN_TAG_STOP); }

	/* Declaration keywords. */
<DTD>{attlist_kw}	{ DTD_PARSE(TOKEN_ATTLIST_KW); }
<DTD>{element_kw}	{ DTD_PARSE(TOKEN_ELEMENT_KW); }
<DTD>{doctype_kw}	{ DTD_PARSE(TOKEN_DOCTYPE_KW); }

	/* Element content keywords; the first three share one token. */
<DTD>{pcdata}		|
<DTD>{any}		|
<DTD>{cdata}		{ DTD_PARSE(TOKEN_ELEM_DATA); }
<DTD>{empty}		{ DTD_PARSE(TOKEN_EMPTY_KW); }

	/* Attribute types all collapse into TOKEN_ATT_TYPE. */
<DTD>{iD}		|
<DTD>{idref}		|
<DTD>{idrefs}		|
<DTD>{nmtoken}		|
<DTD>{nmtokens}		|
<DTD>{entity}		|
<DTD>{entities}		|
<DTD>{notation}		|
<DTD>{cdata_t}		{ DTD_PARSE(TOKEN_ATT_TYPE); }

	/* Attribute default declarations. */
<DTD>{defaulT}		|
<DTD>{fixed}		{ DTD_PARSE(TOKEN_ATT_DEF_WITH_VALUE); }
<DTD>{required}		|
<DTD>{implied}		{ DTD_PARSE(TOKEN_ATT_DEF); }

	/* Punctuation and occurrence indicators. */
<DTD>{star}		{ DTD_PARSE(TOKEN_STAR); }
<DTD>{question}		{ DTD_PARSE(TOKEN_QUESTION); }
<DTD>{plus}		{ DTD_PARSE(TOKEN_PLUS); }
<DTD>{comma}		{ DTD_PARSE(TOKEN_COMMA); }
<DTD>{open_parens}	{ DTD_PARSE(TOKEN_OPEN_PARENS); }
<DTD>{close_parens}	{ DTD_PARSE(TOKEN_CLOSE_PARENS); }
<DTD>{open_bracket}	{ DTD_PARSE(TOKEN_OPEN_BRACKET); }
<DTD>{close_bracket}	{ DTD_PARSE(TOKEN_CLOSE_BRACKET); }
<DTD>{pipe}		{ DTD_PARSE(TOKEN_PIPE); }

	/* Quoted strings and plain names come last. */
<DTD>{squoted}		{ DTD_PARSE(TOKEN_QUOTED); }
<DTD>{name}		{ DTD_PARSE(TOKEN_NAME); }
274 static dtd_token_data_t* new_token(gchar* text) {
275 dtd_token_data_t* t = g_malloc(sizeof(dtd_token_data_t));
277 t->text = g_strdup(text);
278 t->location = g_strdup(location);
285 static int my_yyinput(char* buff, guint size) {
287 if (offset >= len ) {
289 } else if ( offset + size <= len ) {
290 memcpy(buff, input_string->str + offset,size);
295 memcpy(buff, input_string->str + offset,size);
301 extern dtd_build_data_t* dtd_parse(GString* s) {
305 len = input_string->len;
307 pParser = DtdParseAlloc(g_malloc);
309 #ifdef DEBUG_DTD_PARSER
310 DtdParseTrace(stderr, ">>");
313 build_data = g_malloc(sizeof(dtd_build_data_t));
315 build_data->proto_name = NULL;
316 build_data->media_type = NULL;
317 build_data->description = NULL;
318 build_data->proto_root = NULL;
319 build_data->recursion = FALSE;
321 build_data->elements = g_ptr_array_new();
322 build_data->attributes = g_ptr_array_new();
324 build_data->location = NULL;
325 build_data->error = g_string_new("");
333 DtdParse(pParser, 0, NULL,build_data);
339 DtdParseFree(pParser, g_free );