2 * We don't use unput, so don't generate code for it.
7 * We don't read from the terminal.
9 %option never-interactive
12 * The language we're scanning is case-insensitive.
17 * Prefix scanner routines with "Dtd_PreParse_" rather than "yy", so this
18 * scanner can coexist with other scanners.
20 %option prefix="Dtd_PreParse_"
22 %option outfile="dtd_preparse.c"
28 * an XML dissector for wireshark
30 * DTD Preparser - import a dtd file into a GString
31 * including files, removing comments
32 * and resolving %entities;
34 * Copyright 2004, Luis E. Garcia Ontanon <luis@ontanon.org>
38 * Wireshark - Network traffic analyzer
39 * By Gerald Combs <gerald@wireshark.org>
40 * Copyright 1998 Gerald Combs
42 * This program is free software; you can redistribute it and/or
43 * modify it under the terms of the GNU General Public License
44 * as published by the Free Software Foundation; either version 2
45 * of the License, or (at your option) any later version.
47 * This program is distributed in the hope that it will be useful,
48 * but WITHOUT ANY WARRANTY; without even the implied warranty of
49 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
50 * GNU General Public License for more details.
52 * You should have received a copy of the GNU General Public License
53 * along with this program; if not, write to the Free Software
54 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
62 #include "dtd_preparse_lex.h"
63 #include <wsutil/file_util.h>
65 #define ECHO g_string_append(current,yytext);
67 static GString* current;
68 static GString* output;
69 static GHashTable* entities;
70 static gchar* entity_name;
71 static GString* error;
73 static const gchar* dtd_dirname;
74 static const gchar* filename;
77 static gchar* replace_entity(gchar* s);
78 static const gchar* location(void);
81 * Flex (v 2.5.35) uses this symbol to "exclude" unistd.h
84 #define YY_NO_UNISTD_H
88 /* disable Windows VC compiler warning "signed/unsigned mismatch" associated */
89 /* with YY_INPUT code generated by flex versions such as 2.5.35. */
90 #pragma warning (disable:4018)
103 entity_start "<!"[[:blank:]\n]*entity[[:blank:]\n]*"%"
108 name [A-Za-z][-:A-Za-z0-9_\.]*
117 entity [%&][A-Za-z][-A-Za-z0-9_]*;
119 whitespace [[blank:]]+
121 %START OUTSIDE IN_COMMENT IN_ENTITY NAMED_ENTITY IN_QUOTE ENTITY_DONE XMLPI
125 {entity} if (current) g_string_append_printf(current,"%s\n%s\n",replace_entity(yytext),location());
127 {whitespace} if (current) g_string_append(current," ");
129 <OUTSIDE>{xmlpi_start} { g_string_append(current,yytext); BEGIN XMLPI; }
130 <XMLPI>{xmlpi_chars} { g_string_append(current,yytext); }
131 <XMLPI>{newline} { g_string_append(current,yytext); }
132 <XMLPI>{xmlpi_stop} { g_string_append(current,yytext); BEGIN OUTSIDE; }
134 <OUTSIDE>{comment_start} { current = NULL; BEGIN IN_COMMENT; }
137 <IN_COMMENT>{comment_stop} { current = output; BEGIN OUTSIDE; }
141 if (current) g_string_append_printf(current,"%s\n",location());
145 <OUTSIDE>{entity_start} { BEGIN IN_ENTITY; }
146 <IN_ENTITY>{name} { entity_name = g_strdup_printf("%%%s;",yytext); BEGIN NAMED_ENTITY; }
147 <NAMED_ENTITY>{quote} { current = g_string_new(location()); BEGIN IN_QUOTE; }
148 <IN_QUOTE>{quote} { g_hash_table_insert(entities,entity_name,current); BEGIN ENTITY_DONE; }
149 <IN_QUOTE>{percent} |
150 <IN_QUOTE>{non_quote} |
151 <IN_QUOTE>{escaped_quote} g_string_append(current,yytext);
152 <NAMED_ENTITY>{system} {
153 g_string_append_printf(error,"at %s:%u: file inclusion is not supported!", filename, linenum);
156 <ENTITY_DONE>{special_stop} { current = output; g_string_append(current,"\n"); BEGIN OUTSIDE; }
160 static gchar* replace_entity(gchar* entity) {
161 GString* replacement;
165 replacement = g_hash_table_lookup(entities,entity);
168 return replacement->str;
170 g_string_append_printf(error,"dtd_preparse: in file '%s': entity %s does not exists\n", filename, entity);
176 static const gchar* location(void) {
177 static gchar* loc = NULL;
179 if (loc) g_free(loc);
181 loc = g_strdup_printf("<? wireshark:location %s:%u ?>", filename, linenum);
186 static gboolean free_gstring_hash_items(gpointer k,gpointer v,gpointer p _U_) {
188 g_string_free(v,TRUE);
192 extern GString* dtd_preparse(const gchar* dname,const gchar* fname, GString* err) {
193 gchar* fullname = g_strdup_printf("%s%c%s",dname,G_DIR_SEPARATOR,fname);
199 yyin = ws_fopen(fullname,"r");
203 g_string_append_printf(err, "Could not open file: '%s', error: %s",fullname,g_strerror(errno));
210 entities = g_hash_table_new(g_str_hash,g_str_equal);
211 current = output = g_string_new(location());
221 g_hash_table_foreach_remove(entities,free_gstring_hash_items,NULL);
222 g_hash_table_destroy(entities);
230 * We want to stop processing when we get to the end of the input.
231 * (%option noyywrap is not used because if used then
232 * some flex versions (eg: 2.5.35) generate code which causes
233 * warnings by the Windows VC compiler).