2 * ethereal's xml dissector .
4 * (C) 2005, Luis E. Garcia Ontanon.
8 * Refer to the AUTHORS file or the AUTHORS section in the man page
9 * for contacting the author(s) of this file.
11 * Ethereal - Network traffic analyzer
12 * By Gerald Combs <gerald@ethereal.com>
13 * Copyright 1998 Gerald Combs
15 * This program is free software; you can redistribute it and/or
16 * modify it under the terms of the GNU General Public License
17 * as published by the Free Software Foundation; either version 2
18 * of the License, or (at your option) any later version.
20 * This program is distributed in the hope that it will be useful,
21 * but WITHOUT ANY WARRANTY; without even the implied warranty of
22 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
23 * GNU General Public License for more details.
25 * You should have received a copy of the GNU General Public License
26 * along with this program; if not, write to the Free Software
27 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
47 #include <epan/emem.h>
48 #include <epan/packet.h>
49 #include <epan/strutil.h>
50 #include <epan/tvbparse.h>
52 #include <epan/report_err.h>
53 #include <epan/filesystem.h>
55 typedef struct _xml_ns_t {
56 /* the name of this namespace */
59 /* its fully qualified name */
62 /* the contents of the whole element from <> to </> */
65 /* chunks of cdata from <> to </> excluding sub tags */
68 /* the subtree for its sub items */
71 GHashTable* attributes;
72 /* key: the attribute name
73 value: hf_id of what's between quotes */
75 /* the namespace's namespaces */
77 /* key: the element name
78 value: the child namespace */
80 GPtrArray* element_names;
81 /* imported directly from the parser and used while building the namespace */
88 proto_item* last_item;
93 struct _attr_reg_data {
99 static gint ett_dtd = -1;
100 static gint ett_xmpli = -1;
102 static int hf_unknowwn_attrib = -1;
103 static int hf_comment = -1;
104 static int hf_xmlpi = -1;
105 static int hf_dtd_tag = -1;
106 static int hf_doctype = -1;
108 /* dissector handles */
109 static dissector_handle_t xml_handle;
111 /* parser definitions */
112 static tvbparse_wanted_t* want;
113 static tvbparse_wanted_t* want_ignore;
115 static GHashTable* xmpli_names;
116 static GHashTable* media_types;
118 static xml_ns_t xml_ns = {"xml","/",-1,-1,-1,NULL,NULL,NULL};
119 static xml_ns_t unknown_ns = {"unknown","?",-1,-1,-1,NULL,NULL,NULL};
120 static xml_ns_t* root_ns;
122 #define XML_CDATA -1000
123 #define XML_SCOPED_NAME -1001
129 static const gchar* default_media_types[] = {
132 "application/soap+xml",
133 "application/xml-dtd",
139 "application/vnd.wv.csp+xml",
140 "application/xcap-el+xml",
141 "application/xcap-att+xml",
142 "application/xcap-error+xml",
143 "application/xcap-caps+xml",
144 "application/auth-policy+xml",
146 "application/cpim-pidf+xml",
147 "application/rdf+xml",
148 "application/xslt+xml",
149 "application/mathml+xml",
151 "application/vnd.wv.csp.xml",
152 "application/resource-lists+xml",
157 dissect_xml(tvbuff_t *tvb, packet_info *pinfo, proto_tree *tree)
160 tvbparse_elem_t* tok = NULL;
161 static GPtrArray* stack = NULL;
162 xml_frame_t* current_frame;
167 g_ptr_array_free(stack,TRUE);
169 stack = g_ptr_array_new();
170 current_frame = ep_alloc(sizeof(xml_frame_t));
171 g_ptr_array_add(stack,current_frame);
173 tt = tvbparse_init(tvb,0,-1,stack,want_ignore);
174 current_frame->start_offset = 0;
178 if (pinfo->match_string)
179 root_ns = g_hash_table_lookup(media_types,pinfo->match_string);
185 current_frame->ns = root_ns;
187 current_frame->item = proto_tree_add_item(tree,current_frame->ns->hf_tag,tvb,0,-1,FALSE);
188 current_frame->tree = proto_item_add_subtree(current_frame->item,current_frame->ns->ett);
189 current_frame->last_item = current_frame->item;
191 while(( tok = tvbparse_get(tt, want) )) ;
195 static void after_token(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok) {
196 GPtrArray* stack = tvbparse_data;
197 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
201 if (tok->id == XML_CDATA) {
202 hfid = current_frame->ns ? current_frame->ns->hf_cdata : xml_ns.hf_cdata;
203 } else if ( tok->id > 0) {
206 hfid = xml_ns.hf_cdata;
209 pi = proto_tree_add_item(current_frame->tree, hfid, tok->tvb, tok->offset, tok->len, FALSE);
211 proto_item_set_text(pi, "%s",
212 tvb_format_text(tok->tvb,tok->offset,tok->len));
215 static void before_xmpli(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok) {
216 GPtrArray* stack = tvbparse_data;
217 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
220 tvbparse_elem_t* name_tok = tok->sub->next;
221 gchar* name = tvb_get_ephemeral_string(name_tok->tvb,name_tok->offset,name_tok->len);
222 xml_ns_t* ns = g_hash_table_lookup(xmpli_names,name);
236 pi = proto_tree_add_item(current_frame->tree,hf_tag,tok->tvb,tok->offset,tok->len,FALSE);
238 proto_item_set_text(pi,tvb_format_text(tok->tvb,tok->offset,(name_tok->offset - tok->offset) + name_tok->len));
240 pt = proto_item_add_subtree(pi,ett);
242 current_frame = ep_alloc(sizeof(xml_frame_t));
243 current_frame->item = pi;
244 current_frame->last_item = pi;
245 current_frame->tree = pt;
246 current_frame->start_offset = tok->offset;
247 current_frame->ns = ns;
249 g_ptr_array_add(stack,current_frame);
253 static void after_xmlpi(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok) {
254 GPtrArray* stack = tvbparse_data;
255 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
257 proto_tree_add_text(current_frame->tree,
258 tok->tvb, tok->offset, tok->len,
259 tvb_format_text(tok->tvb,tok->offset,tok->len));
261 if (stack->len > 1) {
262 g_ptr_array_remove_index_fast(stack,stack->len - 1);
264 proto_tree_add_text(current_frame->tree,tok->tvb,tok->offset,tok->len,"[ ERROR: Closing an unopened xmpli tag ]");
268 static void before_tag(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok) {
269 GPtrArray* stack = tvbparse_data;
270 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
271 tvbparse_elem_t* name_tok = tok->sub->next;
275 xml_frame_t* new_frame;
279 if (name_tok->sub->id == XML_SCOPED_NAME) {
280 tvbparse_elem_t* root_tok = name_tok->sub->sub;
281 tvbparse_elem_t* leaf_tok = name_tok->sub->sub->next->next;
282 xml_ns_t* nameroot_ns;
284 root_name = tvb_get_ephemeral_string(root_tok->tvb,root_tok->offset,root_tok->len);
285 name = tvb_get_ephemeral_string(leaf_tok->tvb,leaf_tok->offset,leaf_tok->len);
287 nameroot_ns = g_hash_table_lookup(xml_ns.elements,root_name);
290 ns = g_hash_table_lookup(nameroot_ns->elements,name);
299 name = tvb_get_ephemeral_string(name_tok->tvb,name_tok->offset,name_tok->len);
302 if(current_frame->ns) {
303 ns = g_hash_table_lookup(current_frame->ns->elements,name);
306 if (! ( ns = g_hash_table_lookup(root_ns->elements,name) ) ) {
315 pi = proto_tree_add_item(current_frame->tree,ns->hf_tag,tok->tvb,tok->offset,tok->len,FALSE);
316 proto_item_set_text(pi,tvb_format_text(tok->tvb,tok->offset,(name_tok->offset - tok->offset) + name_tok->len));
318 pt = proto_item_add_subtree(pi,ns->ett);
320 new_frame = ep_alloc(sizeof(xml_frame_t));
321 new_frame->item = pi;
322 new_frame->last_item = pi;
323 new_frame->tree = pt;
324 new_frame->start_offset = tok->offset;
327 g_ptr_array_add(stack,new_frame);
331 static void after_open_tag(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok _U_) {
332 GPtrArray* stack = tvbparse_data;
333 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
335 proto_item_append_text(current_frame->last_item,">");
338 static void after_closed_tag(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok) {
339 GPtrArray* stack = tvbparse_data;
340 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
342 proto_item_append_text(current_frame->last_item,"/>");
344 if (stack->len > 1) {
345 g_ptr_array_remove_index_fast(stack,stack->len - 1);
347 proto_tree_add_text(current_frame->tree,tok->tvb,tok->offset,tok->len,"[ ERROR: Closing an unopened tag ]");
351 void after_untag(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok){
352 GPtrArray* stack = tvbparse_data;
353 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
355 proto_item_set_len(current_frame->item, (tok->offset - current_frame->start_offset) + tok->len);
357 proto_tree_add_text(current_frame->tree,tok->tvb,tok->offset,tok->len,"%s",
358 tvb_format_text(tok->tvb,tok->offset,tok->len));
360 if (stack->len > 1) {
361 g_ptr_array_remove_index_fast(stack,stack->len - 1);
363 proto_tree_add_text(current_frame->tree,tok->tvb,tok->offset,tok->len,
364 "[ ERROR: Closing an unopened tag ]");
368 static void before_dtd_doctype(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok){
369 GPtrArray* stack = tvbparse_data;
370 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
371 tvbparse_elem_t* name_tok = tok->sub->next->next->next->sub->sub;
372 proto_tree* dtd_item = proto_tree_add_item(current_frame->tree, hf_doctype,
373 name_tok->tvb, name_tok->offset, name_tok->len, FALSE);
375 proto_item_set_text(dtd_item,"%s",tvb_format_text(tok->tvb,tok->offset,tok->len));
377 current_frame = ep_alloc(sizeof(xml_frame_t));
378 current_frame->item = dtd_item;
379 current_frame->last_item = dtd_item;
380 current_frame->tree = proto_item_add_subtree(dtd_item,ett_dtd);
381 current_frame->start_offset = tok->offset;
382 current_frame->ns = NULL;
384 g_ptr_array_add(stack,current_frame);
387 static void pop_stack(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok _U_) {
388 GPtrArray* stack = tvbparse_data;
389 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
391 if (stack->len > 1) {
392 g_ptr_array_remove_index_fast(stack,stack->len - 1);
394 proto_tree_add_text(current_frame->tree,tok->tvb,tok->offset,tok->len,
395 "[ ERROR: Closing an unopened tag ]");
399 static void after_dtd_close(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok){
400 GPtrArray* stack = tvbparse_data;
401 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
403 proto_tree_add_text(current_frame->tree,tok->tvb,tok->offset,tok->len,"%s",
404 tvb_format_text(tok->tvb,tok->offset,tok->len));
405 if (stack->len > 1) {
406 g_ptr_array_remove_index_fast(stack,stack->len - 1);
408 proto_tree_add_text(current_frame->tree,tok->tvb,tok->offset,tok->len,"[ ERROR: Closing an unopened tag ]");
412 static void get_attrib_value(void* tvbparse_data _U_, const void* wanted_data _U_, tvbparse_elem_t* tok) {
413 tok->data = tok->sub;
416 static void after_attrib(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok) {
417 GPtrArray* stack = tvbparse_data;
418 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
419 gchar* name = tvb_get_ephemeral_string(tok->sub->tvb,tok->sub->offset,tok->sub->len);
420 tvbparse_elem_t* value = tok->sub->next->next->data;
425 if(current_frame->ns && (hfidp = g_hash_table_lookup(current_frame->ns->attributes,name) )) {
428 hfid = hf_unknowwn_attrib;
432 current_frame->last_item = proto_tree_add_item(current_frame->tree,hfid,value->tvb,value->offset,value->len,FALSE);
433 proto_item_set_text(current_frame->last_item, "%s", tvb_format_text(tok->tvb,tok->offset,tok->len));
437 static void unrecognized_token(void* tvbparse_data, const void* wanted_data _U_, tvbparse_elem_t* tok _U_){
438 GPtrArray* stack = tvbparse_data;
439 xml_frame_t* current_frame = g_ptr_array_index(stack,stack->len - 1);
441 proto_tree_add_text(current_frame->tree,tok->tvb,tok->offset,tok->len,"[ ERROR: Unrecognized text ]");
447 void init_xml_parser(void) {
448 tvbparse_wanted_t* want_name = tvbparse_chars(-1,1,0,"abcdefghijklmnopqrstuvwxyz-_ABCDEFGHIJKLMNOPQRSTUVWXYZ",NULL,NULL,NULL);
449 tvbparse_wanted_t* want_attr_name = tvbparse_chars(-1,1,0,"abcdefghijklmnopqrstuvwxyz-_ABCDEFGHIJKLMNOPQRSTUVWXYZ:",NULL,NULL,NULL);
451 tvbparse_wanted_t* want_scoped_name = tvbparse_set_seq(XML_SCOPED_NAME, NULL, NULL, NULL,
453 tvbparse_char(-1,":",NULL,NULL,NULL),
457 tvbparse_wanted_t* want_tag_name = tvbparse_set_oneof(0, NULL, NULL, NULL,
462 tvbparse_wanted_t* want_attrib_value = tvbparse_set_oneof(0, NULL, NULL, get_attrib_value,
463 tvbparse_quoted(-1, NULL, NULL, tvbparse_shrink_token_cb,'\"','\\'),
464 tvbparse_quoted(-1, NULL, NULL, tvbparse_shrink_token_cb,'\'','\\'),
465 tvbparse_chars(-1,1,0,"0123456789",NULL,NULL,NULL),
469 tvbparse_wanted_t* want_attributes = tvbparse_one_or_more(-1, NULL, NULL, NULL,
470 tvbparse_set_seq(-1, NULL, NULL, after_attrib,
472 tvbparse_char(-1,"=",NULL,NULL,NULL),
476 tvbparse_wanted_t* want_stoptag = tvbparse_set_oneof(-1,NULL,NULL,NULL,
477 tvbparse_char(-1, ">", NULL, NULL, after_open_tag),
478 tvbparse_string(-1, "/>", NULL, NULL, after_closed_tag),
481 tvbparse_wanted_t* want_stopxmlpi = tvbparse_string(-1,"?>",NULL,NULL,after_xmlpi);
483 tvbparse_wanted_t* want_comment = tvbparse_set_seq(hf_comment,NULL,NULL,after_token,
484 tvbparse_string(-1,"<!--",NULL,NULL,NULL),
485 tvbparse_until(-1,NULL,NULL,NULL,
486 tvbparse_string(-1,"-->",NULL,NULL,NULL),
490 tvbparse_wanted_t* want_xmlpi = tvbparse_set_seq(hf_xmlpi,NULL,before_xmpli,NULL,
491 tvbparse_string(-1,"<?",NULL,NULL,NULL),
493 tvbparse_set_oneof(-1,NULL,NULL,NULL,
495 tvbparse_set_seq(-1,NULL,NULL,NULL,
502 tvbparse_wanted_t* want_closing_tag = tvbparse_set_seq(0,NULL,NULL,after_untag,
503 tvbparse_char(-1, "<", NULL, NULL, NULL),
504 tvbparse_char(-1, "/", NULL, NULL, NULL),
506 tvbparse_char(-1, ">", NULL, NULL, NULL),
509 tvbparse_wanted_t* want_doctype_start = tvbparse_set_seq(-1,NULL,before_dtd_doctype,NULL,
510 tvbparse_char(-1,"<",NULL,NULL,NULL),
511 tvbparse_char(-1,"!",NULL,NULL,NULL),
512 tvbparse_casestring(-1,"DOCTYPE",NULL,NULL,NULL),
513 tvbparse_set_oneof(-1,NULL,NULL,NULL,
514 tvbparse_set_seq(-1,NULL,NULL,NULL,
516 tvbparse_char(-1,"[",NULL,NULL,NULL),
518 tvbparse_set_seq(-1,NULL,NULL,pop_stack,
520 tvbparse_set_oneof(-1,NULL,NULL,NULL,
521 tvbparse_casestring(-1,"PUBLIC",NULL,NULL,NULL),
522 tvbparse_casestring(-1,"SYSTEM",NULL,NULL,NULL),
524 tvbparse_until(-1,NULL,NULL,NULL,
525 tvbparse_char(-1,">",NULL,NULL,NULL),
531 tvbparse_wanted_t* want_dtd_tag = tvbparse_set_seq(hf_dtd_tag,NULL,NULL,after_token,
532 tvbparse_char(-1,"<",NULL,NULL,NULL),
533 tvbparse_char(-1,"!",NULL,NULL,NULL),
534 tvbparse_until(-1,NULL,NULL,NULL,
535 tvbparse_char(-1, ">", NULL, NULL, NULL),
539 tvbparse_wanted_t* want_tag = tvbparse_set_seq(-1, NULL, before_tag, NULL,
540 tvbparse_char(-1,"<",NULL,NULL,NULL),
542 tvbparse_set_oneof(-1,NULL,NULL,NULL,
543 tvbparse_set_seq(-1,NULL,NULL,NULL,
551 tvbparse_wanted_t* want_dtd_close = tvbparse_set_seq(-1,NULL,NULL,after_dtd_close,
552 tvbparse_char(-1,"]",NULL,NULL,NULL),
553 tvbparse_char(-1,">",NULL,NULL,NULL),
556 want_ignore = tvbparse_chars(-1,1,0," \t\r\n",NULL,NULL,NULL);
559 want = tvbparse_set_oneof(-1, NULL, NULL, NULL,
567 tvbparse_not_chars(XML_CDATA,1,0,"<",NULL,NULL,after_token),
568 tvbparse_not_chars(-1,1,0," \t\r\n",NULL,NULL,unrecognized_token),
575 xml_ns_t* xml_new_namespace(GHashTable* hash, gchar* name, ...) {
576 xml_ns_t* ns = g_malloc(sizeof(xml_ns_t));
580 ns->name = g_strdup(name);
584 ns->attributes = g_hash_table_new(g_str_hash,g_str_equal);
585 ns->elements = g_hash_table_new(g_str_hash,g_str_equal);
589 while(( attr_name = va_arg(ap,gchar*) )) {
590 int* hfp = g_malloc(sizeof(int));
592 g_hash_table_insert(ns->attributes,g_strdup(attr_name),hfp);
597 g_hash_table_insert(hash,ns->name,ns);
603 void add_xml_field(GArray* hfs, int* p_id, gchar* name, gchar* fqn) {
604 hf_register_info hfri;
607 hfri.hfinfo.name = name;
608 hfri.hfinfo.abbrev = fqn;
609 hfri.hfinfo.type = FT_STRING;
610 hfri.hfinfo.display = BASE_NONE;
611 hfri.hfinfo.strings = NULL;
612 hfri.hfinfo.bitmask = 0x0;
613 hfri.hfinfo.blurb = "";
615 hfri.hfinfo.parent = 0;
616 hfri.hfinfo.ref_count = 0;
617 hfri.hfinfo.bitshift = 0;
618 hfri.hfinfo.same_name_next = NULL;
619 hfri.hfinfo.same_name_prev = NULL;
621 g_array_append_val(hfs,hfri);
624 void add_xml_attribute_names(gpointer k, gpointer v, gpointer p) {
625 struct _attr_reg_data* d = p;
626 gchar* basename = g_strdup_printf("%s.%s",d->basename,(gchar*)k);
627 add_xml_field(d->hf, (int*) v, (gchar*)k, basename);
631 void add_xmlpi_namespace(gpointer k _U_, gpointer v, gpointer p) {
633 gchar* basename = g_strdup_printf("%s.%s",(gchar*)p,ns->name);
634 gint* ett_p = &(ns->ett);
635 struct _attr_reg_data d;
637 add_xml_field(hf_arr, &(ns->hf_tag), basename, basename);
639 g_array_append_val(ett_arr,ett_p);
641 d.basename = basename;
644 g_hash_table_foreach(ns->attributes,add_xml_attribute_names,&d);
648 static void destroy_dtd_data(dtd_build_data_t* dtd_data) {
650 if(dtd_data->proto_name) g_free(dtd_data->proto_name);
651 if(dtd_data->media_type) g_free(dtd_data->media_type);
652 if(dtd_data->description) g_free(dtd_data->description);
653 if(dtd_data->proto_root) g_free(dtd_data->proto_root);
655 g_string_free(dtd_data->error,TRUE);
658 while(dtd_data->elements->len) {
659 dtd_named_list_t* nl = g_ptr_array_remove_index_fast(dtd_data->elements,0);
660 g_ptr_array_free(nl->list,TRUE);
664 g_ptr_array_free(dtd_data->elements,TRUE);
666 while(dtd_data->attributes->len) {
667 dtd_named_list_t* nl = g_ptr_array_remove_index_fast(dtd_data->elements,0);
668 g_ptr_array_free(nl->list,TRUE);
672 g_ptr_array_free(dtd_data->attributes,TRUE);
679 static void copy_attrib_item(gpointer k, gpointer v _U_, gpointer p) {
680 gchar* key = g_strdup(k);
681 int* value = g_malloc(sizeof(int));
685 g_hash_table_insert(dst,key,value);
689 static GHashTable* copy_attributes_hash(GHashTable* src) {
690 GHashTable* dst = g_hash_table_new(g_str_hash,g_str_equal);
692 g_hash_table_foreach(src,copy_attrib_item,dst);
697 static xml_ns_t* duplicate_element(xml_ns_t* orig) {
698 xml_ns_t* new_item = g_malloc(sizeof(xml_ns_t));
701 new_item->name = g_strdup(orig->name);
702 new_item->hf_tag = -1;
703 new_item->hf_cdata = -1;
705 new_item->attributes = copy_attributes_hash(orig->attributes);
706 new_item->elements = g_hash_table_new(g_str_hash,g_str_equal);
707 new_item->element_names = g_ptr_array_new();
709 for(i=0; i < orig->element_names->len; i++) {
710 g_ptr_array_add(new_item->element_names,
711 g_ptr_array_index(orig->element_names,i));
717 static gchar* fully_qualified_name(GPtrArray* hier, gchar* name) {
719 GString* s = g_string_new("");
722 for (i = 0; i < hier->len; i++) {
723 g_string_sprintfa(s, "%s.",(gchar*)g_ptr_array_index(hier,i));
726 g_string_append(s,name);
728 g_string_free(s,FALSE);
734 static xml_ns_t* make_xml_hier(gchar* elem_name,
736 GHashTable* elements,
745 struct _attr_reg_data d;
746 gboolean recurred = FALSE;
749 if ( g_str_equal(elem_name,root->name) ) {
753 if (! ( orig = g_hash_table_lookup(elements,elem_name) )) {
754 g_string_sprintfa(error,"element '%s' is not defined\n", elem_name);
758 for (i = 0; i < hier->len; i++) {
759 if( strcmp(elem_name,(gchar*) g_ptr_array_index(hier,i) ) == 0 ) {
768 fqn = fully_qualified_name(hier,elem_name);
770 new = duplicate_element(orig);
773 add_xml_field(hfs, &(new->hf_tag), g_strdup(elem_name), fqn);
774 add_xml_field(hfs, &(new->hf_cdata), g_strdup(elem_name), fqn);
777 g_array_append_val(etts,ett_p);
782 g_hash_table_foreach(new->attributes,add_xml_attribute_names,&d);
784 while(new->element_names->len) {
785 gchar* child_name = g_ptr_array_remove_index(new->element_names,0);
786 xml_ns_t* child_element = NULL;
788 g_ptr_array_add(hier,elem_name);
789 child_element = make_xml_hier(child_name, root, elements, hier,error,hfs,etts);
790 g_ptr_array_remove_index_fast(hier,hier->len - 1);
793 g_hash_table_insert(new->elements,child_element->name,child_element);
797 g_ptr_array_free(new->element_names,TRUE);
798 new->element_names = NULL;
802 static gboolean free_both(gpointer k, gpointer v, gpointer p _U_) {
808 static gboolean free_elements(gpointer k _U_, gpointer v, gpointer p _U_) {
811 g_hash_table_foreach_remove(e->attributes,free_both,NULL);
812 g_hash_table_destroy(e->attributes);
813 g_hash_table_destroy(e->elements);
815 while (e->element_names->len) {
816 g_free(g_ptr_array_remove_index(e->element_names,0));
819 g_ptr_array_free(e->element_names,TRUE);
825 static void register_dtd(dtd_build_data_t* dtd_data, GString* errors) {
826 GHashTable* elements = g_hash_table_new(g_str_hash,g_str_equal);
827 gchar* root_name = NULL;
828 xml_ns_t* root_element = NULL;
833 GPtrArray* element_names = g_ptr_array_new();
835 /* we first populate elements with the those coming from the parser */
836 while(dtd_data->elements->len) {
837 dtd_named_list_t* nl = g_ptr_array_remove_index(dtd_data->elements,0);
838 xml_ns_t* element = g_malloc(sizeof(xml_ns_t));
840 /* we will use the first element found as root in case no other one was given. */
841 if (root_name == NULL)
842 root_name = g_strdup(nl->name);
844 element->name = nl->name;
845 element->element_names = nl->list;
846 element->hf_tag = -1;
847 element->hf_cdata = -1;
849 element->attributes = g_hash_table_new(g_str_hash,g_str_equal);
850 element->elements = g_hash_table_new(g_str_hash,g_str_equal);
852 if( g_hash_table_lookup(elements,element->name) ) {
853 g_string_sprintfa(errors,"element %s defined more than once\n", element->name);
854 free_elements(NULL,element,NULL);
856 g_hash_table_insert(elements,element->name,element);
857 g_ptr_array_add(element_names,g_strdup(element->name));
863 /* then we add the attributes to its relative elements */
864 while(dtd_data->attributes->len) {
865 dtd_named_list_t* nl = g_ptr_array_remove_index(dtd_data->attributes,0);
866 xml_ns_t* element = g_hash_table_lookup(elements,nl->name);
869 g_string_sprintfa(errors,"element %s is not defined\n", nl->name);
874 while(nl->list->len) {
875 gchar* name = g_ptr_array_remove_index(nl->list,0);
876 int* id_p = g_malloc(sizeof(int));
879 g_hash_table_insert(element->attributes,name,id_p);
884 g_ptr_array_free(nl->list,TRUE);
888 /* if a proto_root is defined in the dtd we'll use that as root */
889 if( dtd_data->proto_root ) {
892 root_name = g_strdup(dtd_data->proto_root);
895 /* we use a stack with the names to avoid recurring infinitelly */
896 hier = g_ptr_array_new();
899 * if a proto name was given in the dtd the dtd will be used as a protocol
900 * or else the dtd will be loaded as a branch of the xml namespace
902 if( ! dtd_data->proto_name ) {
905 g_ptr_array_add(hier,g_strdup("xml"));
906 root_element = &xml_ns;
909 * if we were given a proto_name the namespace will be registered
910 * as an indipendent protocol with its own hf and ett arrays.
912 hfs = g_array_new(FALSE,FALSE,sizeof(hf_register_info));
913 etts = g_array_new(FALSE,FALSE,sizeof(gint*));
916 /* the root element of the dtd's namespace */
917 root_element = g_malloc(sizeof(xml_ns_t));
918 root_element->name = g_strdup(root_name);
919 root_element->fqn = root_element->name;
920 root_element->hf_tag = -1;
921 root_element->hf_cdata = -1;
922 root_element->ett = -1;
923 root_element->elements = g_hash_table_new(g_str_hash,g_str_equal);
924 root_element->element_names = element_names;
927 * we can either create a namespace as a flat namespace
928 * in which all the elements are at the root level
929 * or we can create a recursive namespace
931 if (dtd_data->recursion) {
934 make_xml_hier(root_name, root_element, elements,hier,errors,hfs,etts);
936 g_hash_table_insert(root_element->elements,root_element->name,root_element);
938 orig_root = g_hash_table_lookup(elements,root_name);
940 /* if the root element was defined copy its attrlist to the child */
942 struct _attr_reg_data d;
944 d.basename = root_name;
947 root_element->attributes = copy_attributes_hash(orig_root->attributes);
948 g_hash_table_foreach(root_element->attributes,add_xml_attribute_names,&d);
950 root_element->attributes = g_hash_table_new(g_str_hash,g_str_equal);
953 /* we then create all the sub hierachies to catch the recurred cases */
954 g_ptr_array_add(hier,root_name);
956 while(root_element->element_names->len) {
957 curr_name = g_ptr_array_remove_index(root_element->element_names,0);
959 if( ! g_hash_table_lookup(root_element->elements,curr_name) ) {
960 xml_ns_t* new = make_xml_hier(curr_name, root_element, elements,hier,errors,hfs,etts);
961 g_hash_table_insert(root_element->elements,new->name,new);
968 /* a flat namespace */
969 g_ptr_array_add(hier,root_name);
971 root_element->attributes = g_hash_table_new(g_str_hash,g_str_equal);
973 while(root_element->element_names->len) {
976 struct _attr_reg_data d;
978 curr_name = g_ptr_array_remove_index(root_element->element_names,0);
979 new = duplicate_element(g_hash_table_lookup(elements,curr_name));
980 new->fqn = fully_qualified_name(hier, curr_name);
982 add_xml_field(hfs, &(new->hf_tag), curr_name, new->fqn);
983 add_xml_field(hfs, &(new->hf_cdata), curr_name, new->fqn);
985 d.basename = new->fqn;
988 g_hash_table_foreach(new->attributes,add_xml_attribute_names,&d);
991 g_array_append_val(etts,ett_p);
993 g_ptr_array_free(new->element_names,TRUE);
995 g_hash_table_insert(root_element->elements,new->name,new);
999 g_ptr_array_free(element_names,TRUE);
1001 g_ptr_array_free(hier,TRUE);
1004 * if we were given a proto_name the namespace will be registered
1005 * as an indipendent protocol.
1007 if( dtd_data->proto_name ) {
1010 if ( ! dtd_data->description) {
1011 dtd_data->description = g_strdup(root_name);
1014 ett_p = &root_element->ett;
1015 g_array_append_val(etts,ett_p);
1017 add_xml_field(hfs, &root_element->hf_cdata, root_element->name, root_element->fqn);
1019 root_element->hf_tag = proto_register_protocol(dtd_data->description, dtd_data->proto_name, root_element->name);
1020 proto_register_field_array(root_element->hf_tag, (hf_register_info*)hfs->data, hfs->len);
1021 proto_register_subtree_array((gint**)etts->data, etts->len);
1023 if (dtd_data->media_type) {
1024 g_hash_table_insert(media_types,dtd_data->media_type,root_element);
1025 dtd_data->media_type = NULL;
1028 dtd_data->description = NULL;
1029 dtd_data->proto_name = NULL;
1030 g_array_free(hfs,FALSE);
1031 g_array_free(etts,TRUE);
1034 g_hash_table_insert(xml_ns.elements,root_element->name,root_element);
1036 g_hash_table_foreach_remove(elements,free_elements,NULL);
1037 g_hash_table_destroy(elements);
1039 destroy_dtd_data(dtd_data);
1045 #if GLIB_MAJOR_VERSION < 2
1046 # define DIRECTORY_T DIR
1047 # define FILE_T struct dirent
1048 # define OPENDIR_OP(name) opendir(name)
1049 # define DIRGETNEXT_OP(dir) readdir(dir)
1050 # define GETFNAME_OP(file) (gchar *)file->d_name
1051 # define CLOSEDIR_OP(dir) closedir(dir)
1053 # define DIRECTORY_T GDir
1054 # define FILE_T gchar
1055 # define OPENDIR_OP(name) g_dir_open(name, 0, dummy)
1056 # define DIRGETNEXT_OP(dir) g_dir_read_name(dir)
1057 # define GETFNAME_OP(file) (file);
1058 # define CLOSEDIR_OP(dir) g_dir_close(dir)
1061 void init_xml_names(void) {
1062 xml_ns_t* xmlpi_xml_ns;
1066 const gchar* filename;
1069 #if GLIB_MAJOR_VERSION >= 2
1070 GError** dummy = g_malloc(sizeof(GError *));
1074 xmpli_names = g_hash_table_new(g_str_hash,g_str_equal);
1075 media_types = g_hash_table_new(g_str_hash,g_str_equal);
1077 unknown_ns.elements = xml_ns.elements = g_hash_table_new(g_str_hash,g_str_equal);
1078 unknown_ns.attributes = xml_ns.attributes = g_hash_table_new(g_str_hash,g_str_equal);
1080 xmlpi_xml_ns = xml_new_namespace(xmpli_names,"xml","version","encoding","standalone",NULL);
1082 g_hash_table_destroy(xmlpi_xml_ns->elements);
1083 xmlpi_xml_ns->elements = NULL;
1086 dirname = get_persconffile_path("dtds", FALSE);
1088 if (test_for_directory(dirname) != EISDIR) {
1089 dirname = get_datafile_path("dtds");
1092 if (test_for_directory(dirname) == EISDIR) {
1094 if ((dir = OPENDIR_OP(dirname)) != NULL) {
1095 while ((file = DIRGETNEXT_OP(dir)) != NULL) {
1097 filename = GETFNAME_OP(file);
1099 namelen = strlen(filename);
1100 if ( namelen > 4 && ( g_strcasecmp(filename+(namelen-4),".dtd") == 0 ) ) {
1101 GString* errors = g_string_new("");
1102 GString* preparsed = dtd_preparse(dirname, filename, errors);
1103 dtd_build_data_t* dtd_data;
1106 report_failure("Dtd Preparser in file %s%c%s: %s",dirname,G_DIR_SEPARATOR,filename,errors->str);
1110 dtd_data = dtd_parse(preparsed);
1112 g_string_free(preparsed,TRUE);
1114 if (dtd_data->error->len) {
1115 report_failure("Dtd Parser in file %s%c%s: %s",dirname,G_DIR_SEPARATOR,filename,dtd_data->error->str);
1116 destroy_dtd_data(dtd_data);
1120 register_dtd(dtd_data,errors);
1123 report_failure("Dtd Registration in file: %s%c%s: %s",dirname,G_DIR_SEPARATOR,filename,errors->str);
1124 g_string_free(errors,TRUE);
1134 for(i=0;i<array_length(default_media_types);i++) {
1135 if( ! g_hash_table_lookup(media_types,default_media_types[i]) ) {
1136 g_hash_table_insert(media_types,(gpointer)default_media_types[i],&xml_ns);
1140 g_hash_table_foreach(xmpli_names,add_xmlpi_namespace,"xml.xmlpi");
1142 #if GLIB_MAJOR_VERSION >= 2
1148 proto_register_xml(void) {
1150 static gint *ett_base[] = {
1157 static hf_register_info hf_base[] = {
1158 { &hf_xmlpi, {"XMLPI", "xml.xmlpi", FT_STRING, BASE_NONE, NULL, 0, "", HFILL }},
1159 { &hf_comment, {"Comment", "xml.comment", FT_STRING, BASE_NONE, NULL, 0, "", HFILL }},
1160 { &hf_unknowwn_attrib, {"Attribute", "xml.attribute", FT_STRING, BASE_NONE, NULL, 0, "", HFILL }},
1161 { &hf_doctype, {"Doctype", "xml.doctype", FT_STRING, BASE_NONE, NULL, 0, "", HFILL }},
1162 { &hf_dtd_tag, {"DTD Tag", "xml.dtdtag", FT_STRING, BASE_NONE, NULL, 0, "", HFILL }},
1163 { &unknown_ns.hf_cdata, {"CDATA", "xml.cdata", FT_STRING, BASE_NONE, NULL, 0, "", HFILL }},
1164 { &unknown_ns.hf_tag, {"Tag", "xml.tag", FT_STRING, BASE_NONE, NULL, 0, "", HFILL }},
1165 { &xml_ns.hf_cdata, {"Unknown", "xml.unknown", FT_STRING, BASE_NONE, NULL, 0, "", HFILL }}
1168 hf_arr = g_array_new(FALSE,FALSE,sizeof(hf_register_info));
1169 ett_arr = g_array_new(FALSE,FALSE,sizeof(gint*));
1171 g_array_append_vals(hf_arr,hf_base,array_length(hf_base));
1172 g_array_append_vals(ett_arr,ett_base,array_length(ett_base));
1176 xml_ns.hf_tag = proto_register_protocol("eXtensible Markup Language", "XML", xml_ns.name);
1178 proto_register_field_array(xml_ns.hf_tag, (hf_register_info*)hf_arr->data, hf_arr->len);
1179 proto_register_subtree_array((gint**)ett_arr->data, ett_arr->len);
1181 g_array_free(hf_arr,FALSE);
1182 g_array_free(ett_arr,TRUE);
1184 register_dissector("xml", dissect_xml, xml_ns.hf_tag);
1190 void add_dissector_media(gpointer k, gpointer v _U_, gpointer p _U_) {
1191 dissector_add_string("media_type", (gchar*)k, xml_handle);
1195 proto_reg_handoff_xml(void)
1198 xml_handle = find_dissector("xml");
1200 g_hash_table_foreach(media_types,add_dissector_media,NULL);