1 /**-*-C-*-**********************************************************************
5 * Utility to convert an ASCII hexdump into a libpcap-format capture file
7 * (c) Copyright 2001 Ashok Narayanan <ashokn@cisco.com>
11 * Wireshark - Network traffic analyzer
12 * By Gerald Combs <gerald@wireshark.org>
13 * Copyright 1998 Gerald Combs
15 * This program is free software; you can redistribute it and/or
16 * modify it under the terms of the GNU General Public License
17 * as published by the Free Software Foundation; either version 2
18 * of the License, or (at your option) any later version.
20 * This program is distributed in the hope that it will be useful,
21 * but WITHOUT ANY WARRANTY; without even the implied warranty of
22 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
23 * GNU General Public License for more details.
25 * You should have received a copy of the GNU General Public License
26 * along with this program; if not, write to the Free Software
27 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
29 *******************************************************************************/
31 /*******************************************************************************
33 * This utility reads in an ASCII hexdump of this common format:
35 * 00000000 00 E0 1E A7 05 6F 00 10 5A A0 B9 12 08 00 46 00 .....o..Z.....F.
36 * 00000010 03 68 00 00 00 00 0A 2E EE 33 0F 19 08 7F 0F 19 .h.......3......
37 * 00000020 03 80 94 04 00 00 10 01 16 A2 0A 00 03 50 00 0C .............P..
38 * 00000030 01 01 0F 19 03 80 11 01 1E 61 00 0C 03 01 0F 19 .........a......
40 * Each bytestring line consists of an offset, one or more bytes, and
41 * text at the end. An offset is defined as a hex string of more than
42 * two characters. A byte is defined as a hex string of exactly two
43 * characters. The text at the end is ignored, as is any text before
44 * the offset. Bytes read from a bytestring line are added to the
45 * current packet only if all the following conditions are satisfied:
47 * - No text appears between the offset and the bytes (any bytes appearing after
48 * such text would be ignored)
50 * - The offset must be arithmetically correct, i.e. if the offset is 00000020, then
51 * exactly 32 bytes must have been read into this packet before this. If the offset
52 * is wrong, the packet is immediately terminated
54 * A packet start is signaled by a zero offset.
56 * Lines starting with #TEXT2PCAP are directives. These allow the user
57 * to embed instructions in the input file that tell text2pcap
58 * to take some action (e.g. specifying the encapsulation).
59 * Currently no directives are implemented.
61 * Lines beginning with # which are not directives are ignored as
62 * comments. Currently all non-hexdump text is ignored by text2pcap;
63 * in the future, text processing may be added, but lines prefixed
64 * with '#' will still be ignored.
66 * The output is a libpcap packet containing Ethernet frames by
67 * default. This program takes options which allow the user to add
68 * dummy Ethernet, IP and UDP or TCP headers to the packets in order
69 * to allow dumps of L3 or higher protocols to be decoded.
71 * Considerable flexibility is built into this code to read hexdumps
72 * of slightly different formats. For example, any text prefixing the
73 * hexdump line is dropped (including mail forwarding '>'). The offset
74 * can be any hex number of four digits or greater.
76 * This converter cannot read a single packet greater than 64K. Packet
77 * snaplength is automatically set to 64K.
85 * Just make sure we include the prototype for strptime as well
86 * (needed for glibc 2.2) but make sure we do this only if not
94 # define _XOPEN_SOURCE 600
99 * Defining _XOPEN_SOURCE is needed on some platforms, e.g. platforms
100 * using glibc, to expand the set of things system header files define.
102 * Unfortunately, on other platforms, such as some versions of Solaris
103 * (including Solaris 10), it *reduces* that set as well, causing
104 * strptime() not to be declared, presumably because the version of the
105 * X/Open spec that _XOPEN_SOURCE implies doesn't include strptime() and
106 * blah blah blah namespace pollution blah blah blah.
108 * So we define __EXTENSIONS__ so that "strptime()" is declared.
110 #ifndef __EXTENSIONS__
111 # define __EXTENSIONS__
118 #include <wsutil/file_util.h>
131 #include "wsutil/wsgetopt.h"
134 #ifdef NEED_STRPTIME_H
135 # include "wsutil/strptime.h"
138 #include "text2pcap.h"
139 #include "svnversion.h"
142 #include <wsutil/unicode-utils.h>
145 /*--- Options --------------------------------------------------------------------*/
148 static int debug = 0;
150 static int quiet = FALSE;
152 /* Dummy Ethernet header */
153 static int hdr_ethernet = FALSE;
154 static unsigned long hdr_ethernet_proto = 0;
156 /* Dummy IP header */
157 static int hdr_ip = FALSE;
158 static long hdr_ip_proto = 0;
160 /* Dummy UDP header */
161 static int hdr_udp = FALSE;
162 static unsigned long hdr_dest_port = 0;
163 static unsigned long hdr_src_port = 0;
165 /* Dummy TCP header */
166 static int hdr_tcp = FALSE;
168 /* Dummy SCTP header */
169 static int hdr_sctp = FALSE;
170 static unsigned long hdr_sctp_src = 0;
171 static unsigned long hdr_sctp_dest = 0;
172 static unsigned long hdr_sctp_tag = 0;
174 /* Dummy DATA chunk header */
175 static int hdr_data_chunk = FALSE;
176 static unsigned char hdr_data_chunk_type = 0;
177 static unsigned char hdr_data_chunk_bits = 3;
178 static unsigned long hdr_data_chunk_tsn = 0;
179 static unsigned short hdr_data_chunk_sid = 0;
180 static unsigned short hdr_data_chunk_ssn = 0;
181 static unsigned long hdr_data_chunk_ppid = 0;
183 /* ASCII text dump identification */
184 static int identify_ascii = FALSE;
186 /*--- Local data -----------------------------------------------------------------*/
188 /* This is where we store the packet currently being built */
189 #define MAX_PACKET 64000
190 static unsigned char packet_buf[MAX_PACKET];
191 static unsigned long curr_offset = 0;
192 static unsigned long max_offset = MAX_PACKET;
193 static unsigned long packet_start = 0;
194 static void start_new_packet (void);
196 /* This buffer contains strings present before the packet offset 0 */
197 #define PACKET_PREAMBLE_MAX_LEN 2048
198 static unsigned char packet_preamble[PACKET_PREAMBLE_MAX_LEN+1];
199 static int packet_preamble_len = 0;
201 /* Number of packets read and written */
202 static unsigned long num_packets_read = 0;
203 static unsigned long num_packets_written = 0;
205 /* Time code of packet, derived from packet_preamble */
206 static time_t ts_sec = 0;
207 static guint32 ts_usec = 0;
208 static char *ts_fmt = NULL;
209 static struct tm timecode_default;
211 static char new_date_fmt = 0;
212 static unsigned char* pkt_lnstart;
215 static const char *input_filename;
216 static FILE *input_file = NULL;
218 static const char *output_filename;
219 static FILE *output_file = NULL;
221 /* Offset base to parse */
222 static unsigned long offset_base = 16;
226 /* ----- State machine -----------------------------------------------------------*/
228 /* Current state of parser */
230 INIT, /* Waiting for start of new packet */
231 START_OF_LINE, /* Starting from beginning of line */
232 READ_OFFSET, /* Just read the offset */
233 READ_BYTE, /* Just read a byte */
234 READ_TEXT /* Just read text - ignore until EOL */
236 static parser_state_t state = INIT;
238 static const char *state_str[] = {"Init",
245 static const char *token_str[] = {"",
253 /* ----- Skeleton Packet Headers --------------------------------------------------*/
261 static hdr_ethernet_t HDR_ETHERNET = {
262 {0x0a, 0x02, 0x02, 0x02, 0x02, 0x02},
263 {0x0a, 0x01, 0x01, 0x01, 0x01, 0x01},
269 guint16 packet_length;
270 guint16 identification;
275 guint16 hdr_checksum;
280 static hdr_ip_t HDR_IP = {0x45, 0, 0, 0x3412, 0, 0, 0xff, 0, 0,
281 #ifdef WORDS_BIGENDIAN
282 0x0a010101, 0x0a020202
284 0x0101010a, 0x0202020a
288 static struct { /* pseudo header for checksum calculation */
303 static hdr_udp_t HDR_UDP = {0, 0, 0, 0};
317 static hdr_tcp_t HDR_TCP = {0, 0, 0, 0, 0x50, 0, 0, 0, 0};
326 static hdr_sctp_t HDR_SCTP = {0, 0, 0, 0};
338 static hdr_data_chunk_t HDR_DATA_CHUNK = {0, 0, 0, 0, 0, 0, 0};
340 static char tempbuf[64];
342 /*----------------------------------------------------------------------
343 * Stuff for writing a PCap file
345 #define PCAP_MAGIC 0xa1b2c3d4
347 /* "libpcap" file header (including the magic number). */
349 guint32 magic; /* magic */
350 guint16 version_major; /* major version number */
351 guint16 version_minor; /* minor version number */
352 guint32 thiszone; /* GMT to local correction */
353 guint32 sigfigs; /* accuracy of timestamps */
354 guint32 snaplen; /* max length of captured packets, in octets */
355 guint32 network; /* data link type */
358 /* "libpcap" record header. */
360 guint32 ts_sec; /* timestamp seconds */
361 guint32 ts_usec; /* timestamp microseconds */
362 guint32 incl_len; /* number of octets of packet saved in file */
363 guint32 orig_len; /* actual length of packet */
366 /* Link-layer type; see net/bpf.h for details */
367 static unsigned long pcap_link_type = 1; /* Default is DLT_EN10MB (Ethernet) */
369 /*----------------------------------------------------------------------
370 * Parse a single number (offsets use offset_base; everything else is hex)
371 * Will abort the program if it can't parse the number
372 * Pass in TRUE if this is an offset, FALSE if not
375 parse_num (const char *str, int offset)
380 num = strtoul(str, &c, offset ? offset_base : 16);
382 fprintf(stderr, "FATAL ERROR: Bad hex number? [%s]\n", str);
388 /*----------------------------------------------------------------------
389 * Write this byte into current packet
392 write_byte (const char *str)
396 num = parse_num(str, FALSE);
397 packet_buf[curr_offset] = (unsigned char) num;
399 if (curr_offset >= max_offset) /* packet full */
403 /*----------------------------------------------------------------------
404 * Remove bytes from the current packet
407 unwrite_bytes (unsigned long nbytes)
409 curr_offset -= nbytes;
412 /*----------------------------------------------------------------------
413 * Compute one's complement checksum (from RFC1071)
416 in_checksum (void *buf, unsigned long count)
418 unsigned long sum = 0;
422 /* This is the inner loop */
423 sum += g_ntohs(* (guint16 *) addr);
428 /* Add left-over byte, if any: it is the high-order byte of a zero-padded 16-bit network-order word */
430 sum += (unsigned long) (* (guint8 *) addr) << 8;
432 /* Fold 32-bit sum to 16 bits */
434 sum = (sum & 0xffff) + (sum >> 16);
440 /* The CRC32C code is taken from draft-ietf-tsvwg-sctpcsum-01.txt.
441 * That code is copyrighted by D. Otis and has been modified.
444 #define CRC32C(c,d) (c=(c>>8)^crc_c[(c^(d))&0xFF])
445 static guint32 crc_c[256] =
447 0x00000000L, 0xF26B8303L, 0xE13B70F7L, 0x1350F3F4L,
448 0xC79A971FL, 0x35F1141CL, 0x26A1E7E8L, 0xD4CA64EBL,
449 0x8AD958CFL, 0x78B2DBCCL, 0x6BE22838L, 0x9989AB3BL,
450 0x4D43CFD0L, 0xBF284CD3L, 0xAC78BF27L, 0x5E133C24L,
451 0x105EC76FL, 0xE235446CL, 0xF165B798L, 0x030E349BL,
452 0xD7C45070L, 0x25AFD373L, 0x36FF2087L, 0xC494A384L,
453 0x9A879FA0L, 0x68EC1CA3L, 0x7BBCEF57L, 0x89D76C54L,
454 0x5D1D08BFL, 0xAF768BBCL, 0xBC267848L, 0x4E4DFB4BL,
455 0x20BD8EDEL, 0xD2D60DDDL, 0xC186FE29L, 0x33ED7D2AL,
456 0xE72719C1L, 0x154C9AC2L, 0x061C6936L, 0xF477EA35L,
457 0xAA64D611L, 0x580F5512L, 0x4B5FA6E6L, 0xB93425E5L,
458 0x6DFE410EL, 0x9F95C20DL, 0x8CC531F9L, 0x7EAEB2FAL,
459 0x30E349B1L, 0xC288CAB2L, 0xD1D83946L, 0x23B3BA45L,
460 0xF779DEAEL, 0x05125DADL, 0x1642AE59L, 0xE4292D5AL,
461 0xBA3A117EL, 0x4851927DL, 0x5B016189L, 0xA96AE28AL,
462 0x7DA08661L, 0x8FCB0562L, 0x9C9BF696L, 0x6EF07595L,
463 0x417B1DBCL, 0xB3109EBFL, 0xA0406D4BL, 0x522BEE48L,
464 0x86E18AA3L, 0x748A09A0L, 0x67DAFA54L, 0x95B17957L,
465 0xCBA24573L, 0x39C9C670L, 0x2A993584L, 0xD8F2B687L,
466 0x0C38D26CL, 0xFE53516FL, 0xED03A29BL, 0x1F682198L,
467 0x5125DAD3L, 0xA34E59D0L, 0xB01EAA24L, 0x42752927L,
468 0x96BF4DCCL, 0x64D4CECFL, 0x77843D3BL, 0x85EFBE38L,
469 0xDBFC821CL, 0x2997011FL, 0x3AC7F2EBL, 0xC8AC71E8L,
470 0x1C661503L, 0xEE0D9600L, 0xFD5D65F4L, 0x0F36E6F7L,
471 0x61C69362L, 0x93AD1061L, 0x80FDE395L, 0x72966096L,
472 0xA65C047DL, 0x5437877EL, 0x4767748AL, 0xB50CF789L,
473 0xEB1FCBADL, 0x197448AEL, 0x0A24BB5AL, 0xF84F3859L,
474 0x2C855CB2L, 0xDEEEDFB1L, 0xCDBE2C45L, 0x3FD5AF46L,
475 0x7198540DL, 0x83F3D70EL, 0x90A324FAL, 0x62C8A7F9L,
476 0xB602C312L, 0x44694011L, 0x5739B3E5L, 0xA55230E6L,
477 0xFB410CC2L, 0x092A8FC1L, 0x1A7A7C35L, 0xE811FF36L,
478 0x3CDB9BDDL, 0xCEB018DEL, 0xDDE0EB2AL, 0x2F8B6829L,
479 0x82F63B78L, 0x709DB87BL, 0x63CD4B8FL, 0x91A6C88CL,
480 0x456CAC67L, 0xB7072F64L, 0xA457DC90L, 0x563C5F93L,
481 0x082F63B7L, 0xFA44E0B4L, 0xE9141340L, 0x1B7F9043L,
482 0xCFB5F4A8L, 0x3DDE77ABL, 0x2E8E845FL, 0xDCE5075CL,
483 0x92A8FC17L, 0x60C37F14L, 0x73938CE0L, 0x81F80FE3L,
484 0x55326B08L, 0xA759E80BL, 0xB4091BFFL, 0x466298FCL,
485 0x1871A4D8L, 0xEA1A27DBL, 0xF94AD42FL, 0x0B21572CL,
486 0xDFEB33C7L, 0x2D80B0C4L, 0x3ED04330L, 0xCCBBC033L,
487 0xA24BB5A6L, 0x502036A5L, 0x4370C551L, 0xB11B4652L,
488 0x65D122B9L, 0x97BAA1BAL, 0x84EA524EL, 0x7681D14DL,
489 0x2892ED69L, 0xDAF96E6AL, 0xC9A99D9EL, 0x3BC21E9DL,
490 0xEF087A76L, 0x1D63F975L, 0x0E330A81L, 0xFC588982L,
491 0xB21572C9L, 0x407EF1CAL, 0x532E023EL, 0xA145813DL,
492 0x758FE5D6L, 0x87E466D5L, 0x94B49521L, 0x66DF1622L,
493 0x38CC2A06L, 0xCAA7A905L, 0xD9F75AF1L, 0x2B9CD9F2L,
494 0xFF56BD19L, 0x0D3D3E1AL, 0x1E6DCDEEL, 0xEC064EEDL,
495 0xC38D26C4L, 0x31E6A5C7L, 0x22B65633L, 0xD0DDD530L,
496 0x0417B1DBL, 0xF67C32D8L, 0xE52CC12CL, 0x1747422FL,
497 0x49547E0BL, 0xBB3FFD08L, 0xA86F0EFCL, 0x5A048DFFL,
498 0x8ECEE914L, 0x7CA56A17L, 0x6FF599E3L, 0x9D9E1AE0L,
499 0xD3D3E1ABL, 0x21B862A8L, 0x32E8915CL, 0xC083125FL,
500 0x144976B4L, 0xE622F5B7L, 0xF5720643L, 0x07198540L,
501 0x590AB964L, 0xAB613A67L, 0xB831C993L, 0x4A5A4A90L,
502 0x9E902E7BL, 0x6CFBAD78L, 0x7FAB5E8CL, 0x8DC0DD8FL,
503 0xE330A81AL, 0x115B2B19L, 0x020BD8EDL, 0xF0605BEEL,
504 0x24AA3F05L, 0xD6C1BC06L, 0xC5914FF2L, 0x37FACCF1L,
505 0x69E9F0D5L, 0x9B8273D6L, 0x88D28022L, 0x7AB90321L,
506 0xAE7367CAL, 0x5C18E4C9L, 0x4F48173DL, 0xBD23943EL,
507 0xF36E6F75L, 0x0105EC76L, 0x12551F82L, 0xE03E9C81L,
508 0x34F4F86AL, 0xC69F7B69L, 0xD5CF889DL, 0x27A40B9EL,
509 0x79B737BAL, 0x8BDCB4B9L, 0x988C474DL, 0x6AE7C44EL,
510 0xBE2DA0A5L, 0x4C4623A6L, 0x5F16D052L, 0xAD7D5351L,
514 crc32c(const guint8* buf, unsigned int len, guint32 crc32_init)
520 for (i = 0; i < len; i++)
521 CRC32C(crc32, buf[i]);
527 finalize_crc32c(guint32 crc32)
530 guint8 byte0,byte1,byte2,byte3;
533 byte0 = result & 0xff;
534 byte1 = (result>>8) & 0xff;
535 byte2 = (result>>16) & 0xff;
536 byte3 = (result>>24) & 0xff;
537 result = (((guint32) byte0 << 24) | ((guint32) byte1 << 16) | ((guint32) byte2 << 8) | byte3); /* widen before shifting so no bit is shifted into the sign bit of int */
542 number_of_padding_bytes (unsigned long length)
544 unsigned long remainder;
546 remainder = length % 4;
551 return 4 - remainder;
554 /*----------------------------------------------------------------------
555 * Write current packet out
558 write_current_packet (void)
561 int proto_length = 0;
563 int eth_trailer_length = 0;
564 int i, padding_length;
566 struct pcaprec_hdr ph;
568 if (curr_offset > 0) {
569 /* Write the packet */
571 /* Compute packet length */
572 length = curr_offset;
573 if (hdr_data_chunk) { length += sizeof(HDR_DATA_CHUNK) + number_of_padding_bytes(curr_offset); }
574 if (hdr_sctp) { length += sizeof(HDR_SCTP); }
575 if (hdr_udp) { length += sizeof(HDR_UDP); proto_length = length; }
576 if (hdr_tcp) { length += sizeof(HDR_TCP); proto_length = length; }
577 if (hdr_ip) { length += sizeof(HDR_IP); ip_length = length; }
579 length += sizeof(HDR_ETHERNET);
582 eth_trailer_length = 60 - length;
587 /* Write PCAP header */
588 ph.ts_sec = (guint32)ts_sec;
589 ph.ts_usec = ts_usec;
590 if (ts_fmt == NULL) { ts_usec++; } /* fake packet counter */
591 ph.incl_len = length;
592 ph.orig_len = length;
593 if (fwrite(&ph, sizeof(ph), 1, output_file) != 1)
594 goto write_current_packet_err;
596 /* Write Ethernet header */
598 HDR_ETHERNET.l3pid = g_htons(hdr_ethernet_proto);
599 if (fwrite(&HDR_ETHERNET, sizeof(HDR_ETHERNET), 1, output_file) != 1)
600 goto write_current_packet_err;
603 /* Write IP header */
605 HDR_IP.packet_length = g_htons(ip_length);
606 HDR_IP.protocol = (guint8) hdr_ip_proto;
607 HDR_IP.hdr_checksum = 0;
608 HDR_IP.hdr_checksum = in_checksum(&HDR_IP, sizeof(HDR_IP));
609 if (fwrite(&HDR_IP, sizeof(HDR_IP), 1, output_file) != 1)
610 goto write_current_packet_err;
613 /* initialize pseudo header for checksum calculation */
614 pseudoh.src_addr = HDR_IP.src_addr;
615 pseudoh.dest_addr = HDR_IP.dest_addr;
617 pseudoh.protocol = (guint8) hdr_ip_proto;
618 pseudoh.length = g_htons(proto_length);
620 /* Write UDP header */
623 HDR_UDP.source_port = g_htons(hdr_src_port);
624 HDR_UDP.dest_port = g_htons(hdr_dest_port);
625 HDR_UDP.length = g_htons(proto_length);
627 /* Note: g_ntohs()/g_htons() macro arg may be eval'd twice so calc value before invoking macro */
628 HDR_UDP.checksum = 0;
629 x16 = in_checksum(&pseudoh, sizeof(pseudoh));
631 x16 = in_checksum(&HDR_UDP, sizeof(HDR_UDP));
633 x16 = in_checksum(packet_buf, curr_offset);
635 x16 = (u & 0xffff) + (u>>16);
636 HDR_UDP.checksum = g_htons(x16);
637 if (HDR_UDP.checksum == 0) /* differentiate between 'none' and 0 */
638 HDR_UDP.checksum = g_htons(1);
640 if (fwrite(&HDR_UDP, sizeof(HDR_UDP), 1, output_file) != 1)
641 goto write_current_packet_err;
644 /* Write TCP header */
647 HDR_TCP.source_port = g_htons(hdr_src_port);
648 HDR_TCP.dest_port = g_htons(hdr_dest_port);
649 /* HDR_TCP.seq_num already correct */
650 HDR_TCP.window = g_htons(0x2000);
652 /* Note: g_ntohs()/g_htons() macro arg may be eval'd twice so calc value before invoking macro */
653 HDR_TCP.checksum = 0;
654 x16 = in_checksum(&pseudoh, sizeof(pseudoh));
656 x16 = in_checksum(&HDR_TCP, sizeof(HDR_TCP));
658 x16 = in_checksum(packet_buf, curr_offset);
660 x16 = (u & 0xffff) + (u>>16);
661 HDR_TCP.checksum = g_htons(x16);
662 if (HDR_TCP.checksum == 0) /* differentiate between 'none' and 0 */
663 HDR_TCP.checksum = g_htons(1);
665 if (fwrite(&HDR_TCP, sizeof(HDR_TCP), 1, output_file) != 1)
666 goto write_current_packet_err;
669 /* Compute DATA chunk header and append padding */
670 if (hdr_data_chunk) {
671 HDR_DATA_CHUNK.type = hdr_data_chunk_type;
672 HDR_DATA_CHUNK.bits = hdr_data_chunk_bits;
673 HDR_DATA_CHUNK.length = g_htons(curr_offset + sizeof(HDR_DATA_CHUNK));
674 HDR_DATA_CHUNK.tsn = g_htonl(hdr_data_chunk_tsn);
675 HDR_DATA_CHUNK.sid = g_htons(hdr_data_chunk_sid);
676 HDR_DATA_CHUNK.ssn = g_htons(hdr_data_chunk_ssn);
677 HDR_DATA_CHUNK.ppid = g_htonl(hdr_data_chunk_ppid);
679 padding_length = number_of_padding_bytes(curr_offset);
680 for (i=0; i<padding_length; i++)
684 /* Write SCTP header */
687 HDR_SCTP.src_port = g_htons(hdr_sctp_src);
688 HDR_SCTP.dest_port = g_htons(hdr_sctp_dest);
689 HDR_SCTP.tag = g_htonl(hdr_sctp_tag);
690 HDR_SCTP.checksum = g_htonl(0);
691 HDR_SCTP.checksum = crc32c((guint8 *)&HDR_SCTP, sizeof(HDR_SCTP), ~0L);
693 HDR_SCTP.checksum = crc32c((guint8 *)&HDR_DATA_CHUNK, sizeof(HDR_DATA_CHUNK), HDR_SCTP.checksum);
694 /* Note: g_ntohl() macro arg may be eval'd twice so calc value before invoking macro */
695 x32 = finalize_crc32c(crc32c(packet_buf, curr_offset, HDR_SCTP.checksum));
696 HDR_SCTP.checksum = g_htonl(x32);
698 if (fwrite(&HDR_SCTP, sizeof(HDR_SCTP), 1, output_file) != 1)
699 goto write_current_packet_err;
702 /* Write DATA chunk header */
703 if (hdr_data_chunk) {
704 if (fwrite(&HDR_DATA_CHUNK, sizeof(HDR_DATA_CHUNK), 1, output_file) != 1)
705 goto write_current_packet_err;
708 if (fwrite(packet_buf, curr_offset, 1, output_file) != 1)
709 goto write_current_packet_err;
711 /* Write Ethernet trailer */
712 if (hdr_ethernet && eth_trailer_length > 0) {
713 memset(tempbuf, 0, eth_trailer_length);
714 if (fwrite(tempbuf, eth_trailer_length, 1, output_file) != 1)
715 goto write_current_packet_err;
719 fprintf(stderr, "Wrote packet of %lu bytes at %u\n", curr_offset, g_ntohl(HDR_TCP.seq_num));
720 num_packets_written ++;
722 HDR_TCP.seq_num = g_ntohl(HDR_TCP.seq_num) + curr_offset;
723 HDR_TCP.seq_num = g_htonl(HDR_TCP.seq_num);
725 packet_start += curr_offset;
729 write_current_packet_err:
730 fprintf(stderr, "File write error [%s] : %s\n",
731 output_filename, g_strerror(errno));
735 /*----------------------------------------------------------------------
736 * Write the PCap file header
739 write_file_header (void)
743 fh.magic = PCAP_MAGIC;
744 fh.version_major = 2;
745 fh.version_minor = 4;
749 fh.network = pcap_link_type;
751 if (fwrite(&fh, sizeof(fh), 1, output_file) != 1) {
752 fprintf(stderr, "File write error [%s] : %s\n",
753 output_filename, g_strerror(errno));
758 /*----------------------------------------------------------------------
759 * Append a token to the packet preamble.
762 append_to_preamble(char *str)
766 if (packet_preamble_len != 0) {
767 if (packet_preamble_len == PACKET_PREAMBLE_MAX_LEN)
768 return; /* no room to add more preamble */
769 /* Add a blank separator between the previous token and this token. */
770 packet_preamble[packet_preamble_len++] = ' ';
772 toklen = strlen(str);
774 if (packet_preamble_len + toklen > PACKET_PREAMBLE_MAX_LEN)
775 return; /* no room to add the token to the preamble */
776 g_strlcpy(&packet_preamble[packet_preamble_len], str, PACKET_PREAMBLE_MAX_LEN);
777 packet_preamble_len += (int) toklen;
780 char xs[PACKET_PREAMBLE_MAX_LEN];
781 g_strlcpy(xs, packet_preamble, PACKET_PREAMBLE_MAX_LEN);
782 while ((c = strchr(xs, '\r')) != NULL) *c=' ';
783 fprintf (stderr, "[[append_to_preamble: \"%s\"]]", xs);
788 /*----------------------------------------------------------------------
789 * Parse the preamble to get the timecode.
793 parse_preamble (void)
802 * If no "-t" flag was specified, don't attempt to parse a packet
803 * preamble to extract a time stamp.
809 * Initialize to today localtime, just in case not all fields
810 * of the date and time are specified.
813 timecode = timecode_default;
817 * Null-terminate the preamble.
819 packet_preamble[packet_preamble_len] = '\0';
821 /* Ensure preamble has more than two chars before attempting to parse.
822 * This should cover line breaks etc that get counted.
824 if ( strlen(packet_preamble) > 2 ) {
825 /* Get Time leaving subseconds */
826 subsecs = strptime( packet_preamble, ts_fmt, &timecode );
827 if (subsecs != NULL) {
828 /* Get the long time from the tm structure */
829 /* (will return -1 if failure) */
830 ts_sec = mktime( &timecode );
832 ts_sec = -1; /* we failed to parse it */
834 /* This will ensure incorrectly parsed dates get set to zero */
837 /* Sanitize - remove all '\r' */
839 while ((c = strchr(packet_preamble, '\r')) != NULL) *c=' ';
840 fprintf (stderr, "Failure processing time \"%s\" using time format \"%s\"\n (defaulting to Jan 1,1970 00:00:00 GMT)\n",
841 packet_preamble, ts_fmt);
843 fprintf(stderr, "timecode: %02d/%02d/%d %02d:%02d:%02d %d\n",
844 timecode.tm_mday, timecode.tm_mon, timecode.tm_year,
845 timecode.tm_hour, timecode.tm_min, timecode.tm_sec, timecode.tm_isdst);
847 ts_sec = 0; /* Jan 1,1970: 00:00 GMT; tshark/wireshark will display date/time as adjusted by timezone */
852 /* Parse subseconds */
853 ts_usec = strtol(subsecs, &p, 10);
859 * Convert that number to a number
860 * of microseconds; if it's N digits
861 * long, it's in units of 10^(-N) seconds,
862 * so, to convert it to units of
863 * 10^-6 seconds, we multiply by
866 subseclen = (int) (p - subsecs);
869 * *More* than 6 digits; 6-N is
870 * negative, so we divide by
873 for (i = subseclen - 6; i != 0; i--)
875 } else if (subseclen < 6) {
876 for (i = 6 - subseclen; i != 0; i--)
884 while ((c = strchr(packet_preamble, '\r')) != NULL) *c=' ';
885 fprintf(stderr, "[[parse_preamble: \"%s\"]]\n", packet_preamble);
886 fprintf(stderr, "Format(%s), time(%u), subsecs(%u)\n", ts_fmt, (guint32)ts_sec, ts_usec);
891 packet_preamble_len = 0;
894 /*----------------------------------------------------------------------
898 start_new_packet (void)
901 fprintf(stderr, "Start new packet\n");
903 /* Write out the current packet, if required */
904 write_current_packet();
907 /* Ensure we parse the packet preamble as it may contain the time */
911 /*----------------------------------------------------------------------
912 * Process a directive
915 process_directive (char *str)
917 fprintf(stderr, "\n--- Directive [%s] currently unsupported ---\n", str+10);
921 /*----------------------------------------------------------------------
922 * Parse a single token (called from the scanner)
925 parse_token (token_t token, char *str)
936 * This is implemented as a simple state machine of five states.
937 * State transitions are caused by tokens being received from the
938 * scanner. The code should be self_documenting.
942 /* Sanitize - remove all '\r' */
944 if (str!=NULL) { while ((c = strchr(str, '\r')) != NULL) *c=' '; }
946 fprintf(stderr, "(%s, %s \"%s\") -> (",
947 state_str[state], token_str[token], str ? str : "");
950 /* First token must be treated as a timestamp if time strip format is
952 if (state == INIT || state == START_OF_LINE) {
953 if (ts_fmt != NULL && new_date_fmt) {
960 /* ----- Waiting for new packet -------------------------------------------*/
964 append_to_preamble(str);
967 process_directive(str);
970 num = parse_num(str, TRUE);
972 /* New packet starts here */
975 pkt_lnstart = packet_buf + num;
979 /* Some describing text may be parsed as offset, but the invalid
980 offset will be checked in the state of START_OF_LINE, so
981 we add this transition to gain flexibility */
982 state = START_OF_LINE;
989 /* ----- Processing packet, start of new line -----------------------------*/
993 append_to_preamble(str);
996 process_directive(str);
999 num = parse_num(str, TRUE);
1001 /* New packet starts here */
1004 state = READ_OFFSET;
1005 } else if ((num - packet_start) != curr_offset) {
1007 * The offset we read isn't the one we expected.
1008 * This may only mean that we mistakenly interpreted
1009 * some text as byte values (e.g., if the text dump
1010 * of packet data included a number with spaces around
1011 * it). If the offset is less than what we expected,
1012 * assume that's the problem, and throw away the putative
1013 * extra byte values.
1015 if (num < curr_offset) {
1016 unwrite_bytes(curr_offset - num);
1017 state = READ_OFFSET;
1019 /* Bad offset; switch to INIT state */
1021 fprintf(stderr, "Inconsistent offset. Expecting %0lX, got %0lX. Ignoring rest of packet\n",
1023 write_current_packet();
1027 state = READ_OFFSET;
1028 pkt_lnstart = packet_buf + num;
1031 state = START_OF_LINE;
1038 /* ----- Processing packet, read offset -----------------------------------*/
1042 /* Record the byte */
1052 state = START_OF_LINE;
1059 /* ----- Processing packet, read byte -------------------------------------*/
1063 /* Record the byte */
1072 if (token == T_EOL) {
1074 state = START_OF_LINE;
1076 if (identify_ascii) {
1077 /* A complete line of packet bytes has now been read.
1078 Compare the ASCII and hex to handle situations such as
1079 "61 62 20 ab ": when "ab" is part of the ASCII dump, it should
1080 not be treated as a byte */
1082 /* s2 is the ASCII string, s1 is the HEX string, e.g. when
1083 s2 = "ab ", s1 = "616220".
1084 Find the longest tail of s1 that matches the head of s2:
1085 that matching tail is the ASCII dump of the leading bytes,
1086 so those bytes should be rolled back. */
1087 line_size = curr_offset-(int)(pkt_lnstart-packet_buf);
1088 s2 = (char*)g_malloc((line_size+1)/4+1);
1089 /* gather the possible pattern */
1090 for(i=0; i<(line_size+1)/4; i++) {
1091 tmp_str[0] = pkt_lnstart[i*3];
1092 tmp_str[1] = pkt_lnstart[i*3+1];
1094 /* both characters must be hex digits to form a convertible byte string */
1095 if (!isxdigit((unsigned char) tmp_str[0]) || !isxdigit((unsigned char) tmp_str[1])) {
1098 s2[i] = (char)strtoul(tmp_str, (char **)NULL, 16);
1100 /* the 3rd entry is not a delimiter, so the possible byte pattern will not shown */
1101 if (!(pkt_lnstart[i*3+2] == ' ')) {
1107 /* If the start of the packet line contains a possible byte pattern,
1108 the end of the line should contain the matching pattern when the
1109 user has enabled the -a flag. The packet is possibly invalid if
1110 no match for the byte pattern is found in this line of the packet buffer. */
1112 if (strncmp(pkt_lnstart+line_size-rollback, s2, rollback) == 0) {
1113 unwrite_bytes(rollback);
1115 /* Not matched. This line contains invalid packet bytes, so
1116 discard the whole line */
1118 unwrite_bytes(line_size);
1129 /* ----- Processing packet, read text -------------------------------------*/
1133 state = START_OF_LINE;
1141 fprintf(stderr, "FATAL ERROR: Bad state (%d)", state);
1146 fprintf(stderr, ", %s)\n", state_str[state]);
1150 /*----------------------------------------------------------------------
1151 * Print usage string and exit
1159 " (" SVNVERSION " from " SVNPATH ")"
1162 "Generate a capture file from an ASCII hexdump of packets.\n"
1163 "See http://www.wireshark.org for more information.\n"
1165 "Usage: text2pcap [options] <infile> <outfile>\n"
1167 "where <infile> specifies input filename (use - for standard input)\n"
1168 " <outfile> specifies output filename (use - for standard output)\n"
1171 " -o hex|oct|dec parse offsets as (h)ex, (o)ctal or (d)ecimal;\n"
1172 " default is hex.\n"
1173 " -t <timefmt> treat the text before the packet as a date/time code;\n"
1174 " the specified argument is a format string of the sort\n"
1175 " supported by strptime.\n"
1176 " Example: The time \"10:15:14.5476\" has the format code\n"
1177 " \"%%H:%%M:%%S.\"\n"
1178 " NOTE: The subsecond component delimiter, '.', must be\n"
1179 " given, but no pattern is required; the remaining\n"
1180 " number is assumed to be fractions of a second.\n"
1181 " NOTE: Date/time fields from the current date/time are\n"
1182 " used as the default for unspecified fields.\n"
1183 " -a enable ASCII text dump identification.\n"
1184 " It allows to identify the start of the ASCII text\n"
1185 " dump and not include it in the packet even if it\n"
1186 " looks like HEX dump.\n"
1187 " NOTE: Do not enable it if the input file does not\n"
1188 " contain the ASCII text dump.\n"
1191 " -l <typenum> link-layer type number; default is 1 (Ethernet).\n"
1192 " See the file net/bpf.h for list of numbers.\n"
1193 " Use this option if your dump is a complete hex dump\n"
1194 " of an encapsulated packet and you wish to specify\n"
1195 " the exact type of encapsulation.\n"
1196 " Example: -l 7 for ARCNet packets.\n"
1197 " -m <max-packet> max packet length in output; default is %d\n"
1199 "Prepend dummy header:\n"
1200 " -e <l3pid> prepend dummy Ethernet II header with specified L3PID\n"
1202 " Example: -e 0x806 to specify an ARP packet.\n"
1203 " -i <proto> prepend dummy IP header with specified IP protocol\n"
1205 " Automatically prepends Ethernet header as well.\n"
1207 " -u <srcp>,<destp> prepend dummy UDP header with specified\n"
1208 " dest and source ports (in DECIMAL).\n"
1209 " Automatically prepends Ethernet & IP headers as well.\n"
1210 " Example: -u 1000,69 to make the packets look like\n"
1211 " TFTP/UDP packets.\n"
1212 " -T <srcp>,<destp> prepend dummy TCP header with specified\n"
1213 " dest and source ports (in DECIMAL).\n"
1214 " Automatically prepends Ethernet & IP headers as well.\n"
1215 " Example: -T 50,60\n"
1216 " -s <srcp>,<dstp>,<tag> prepend dummy SCTP header with specified\n"
1217 " dest/source ports and verification tag (in DECIMAL).\n"
1218 " Automatically prepends Ethernet & IP headers as well.\n"
1219 " Example: -s 30,40,34\n"
1220 " -S <srcp>,<dstp>,<ppi> prepend dummy SCTP header with specified\n"
1221 " dest/source ports and verification tag 0.\n"
1222 " Automatically prepends a dummy SCTP DATA\n"
1223 " chunk header with payload protocol identifier ppi.\n"
1224 " Example: -S 30,40,34\n"
1227 " -h display this help and exit.\n"
1228 " -d show detailed debug of parser states.\n"
1229 " -q generate no output at all (automatically turns off -d).\n"
1231 VERSION, MAX_PACKET);
1236 /*----------------------------------------------------------------------
/*
 * parse_options: interpret the command line and set up the global
 * conversion state used by the rest of the program.
 *
 *   argc, argv - the program arguments exactly as received by main().
 *
 * Options are scanned with getopt().  After the options, two positional
 * arguments are required: the input file name and the output file name.
 * A name of "-" is not opened as a file; the "Standard input" /
 * "Standard output" labels are used for it instead.
 *
 * Every dummy-header option visible here also sets hdr_ethernet and
 * forces hdr_ethernet_proto to 0x800, which is why such options are
 * rejected further down when the link type is not 1 (Ethernet, per the
 * -l help text).
 *
 * Diagnostics are written to stderr.  Unless the summary is suppressed,
 * the resulting configuration is also printed to stderr.
 */
1240 parse_options (int argc, char *argv[])
1246 arg_list_utf_16to8(argc, argv);
1249 /* Scan CLI parameters */
1250 while ((c = getopt(argc, argv, "Ddhqe:i:l:m:o:u:s:S:t:T:a")) != -1) {
1252 case '?': usage(); break;
1253 case 'h': usage(); break;
1254 case 'D': new_date_fmt = 1; break;
1255 case 'd': if (!quiet) debug++; break;
1256 case 'q': quiet = TRUE; debug = FALSE; break;
/* -l and -m use base 0, so decimal, octal (0...) and hex (0x...) are all
 * accepted.  NOTE(review): no end-pointer or range check is visible for
 * these two values. */
1257 case 'l': pcap_link_type = strtol(optarg, NULL, 0); break;
1258 case 'm': max_offset = strtol(optarg, NULL, 0); break;
/* -o: only the first character of the argument is examined; it selects
 * the radix of the offsets in the dump (o = 8, h = 16, d = 10). */
1260 if (optarg[0]!='h' && optarg[0] != 'o' && optarg[0] != 'd') {
1261 fprintf(stderr, "Bad argument for '-o': %s\n", optarg);
1265 case 'o': offset_base = 8; break;
1266 case 'h': offset_base = 16; break;
1267 case 'd': offset_base = 10; break;
/* -e: the L3 protocol id is read as hexadecimal. */
1271 hdr_ethernet = TRUE;
1272 if (sscanf(optarg, "%lx", &hdr_ethernet_proto) < 1) {
1273 fprintf(stderr, "Bad argument for '-e': %s\n", optarg);
/* -i: decimal IP protocol number; the whole argument must be consumed
 * and the value must fit in 0..255. */
1280 hdr_ip_proto = strtol(optarg, &p, 10);
1281 if (p == optarg || *p != '\0' || hdr_ip_proto < 0 ||
1282 hdr_ip_proto > 255) {
1283 fprintf(stderr, "Bad argument for '-i': %s\n", optarg);
1286 hdr_ethernet = TRUE;
1287 hdr_ethernet_proto = 0x800;
/* SCTP header: source port, destination port and verification tag as a
 * comma-separated decimal list.  After each strtol() p must sit on a
 * ',' (more fields follow) or on the terminating NUL.
 * NOTE(review): no range check on the port values is visible here. */
1292 hdr_sctp_src = strtol(optarg, &p, 10);
1293 if (p == optarg || (*p != ',' && *p != '\0')) {
1294 fprintf(stderr, "Bad src port for '-%c'\n", c);
1298 fprintf(stderr, "No dest port specified for '-%c'\n", c);
1303 hdr_sctp_dest = strtol(optarg, &p, 10);
1304 if (p == optarg || (*p != ',' && *p != '\0')) {
/* Name the option from c, like the neighbouring messages do. */
1305 fprintf(stderr, "Bad dest port for '-%c'\n", c);
1309 fprintf(stderr, "No tag specified for '-%c'\n", c);
1314 hdr_sctp_tag = strtol(optarg, &p, 10);
1315 if (p == optarg || *p != '\0') {
1316 fprintf(stderr, "Bad tag for '-%c'\n", c);
1322 hdr_ethernet = TRUE;
1323 hdr_ethernet_proto = 0x800;
/* SCTP header plus DATA chunk header: source port, destination port and
 * payload protocol identifier, parsed the same way as above. */
1327 hdr_data_chunk = TRUE;
1328 hdr_sctp_src = strtol(optarg, &p, 10);
1329 if (p == optarg || (*p != ',' && *p != '\0')) {
1330 fprintf(stderr, "Bad src port for '-%c'\n", c);
1334 fprintf(stderr, "No dest port specified for '-%c'\n", c);
1339 hdr_sctp_dest = strtol(optarg, &p, 10);
1340 if (p == optarg || (*p != ',' && *p != '\0')) {
/* Use c so the message names the option actually being parsed. */
1341 fprintf(stderr, "Bad dest port for '-%c'\n", c);
1345 fprintf(stderr, "No ppi specified for '-%c'\n", c);
1350 hdr_data_chunk_ppid = strtoul(optarg, &p, 10);
1351 if (p == optarg || *p != '\0') {
1352 fprintf(stderr, "Bad ppi for '-%c'\n", c);
1358 hdr_ethernet = TRUE;
1359 hdr_ethernet_proto = 0x800;
/* -u: UDP source and destination port as "<src>,<dest>" in decimal. */
1369 hdr_src_port = strtol(optarg, &p, 10);
1370 if (p == optarg || (*p != ',' && *p != '\0')) {
1371 fprintf(stderr, "Bad src port for '-u'\n");
1375 fprintf(stderr, "No dest port specified for '-u'\n");
1380 hdr_dest_port = strtol(optarg, &p, 10);
1381 if (p == optarg || *p != '\0') {
1382 fprintf(stderr, "Bad dest port for '-u'\n");
1387 hdr_ethernet = TRUE;
1388 hdr_ethernet_proto = 0x800;
/* -T: TCP source and destination port as "<src>,<dest>" in decimal.
 * The ports are stored in the same variables as for -u. */
1394 hdr_src_port = strtol(optarg, &p, 10);
1395 if (p == optarg || (*p != ',' && *p != '\0')) {
1396 fprintf(stderr, "Bad src port for '-T'\n");
1400 fprintf(stderr, "No dest port specified for '-T'\n");
1405 hdr_dest_port = strtol(optarg, &p, 10);
1406 if (p == optarg || *p != '\0') {
1407 fprintf(stderr, "Bad dest port for '-T'\n");
1412 hdr_ethernet = TRUE;
1413 hdr_ethernet_proto = 0x800;
1417 identify_ascii = TRUE;
/* Two positional arguments (input and output file name) must remain
 * once getopt() has consumed the options. */
1425 if (optind >= argc || argc-optind < 2) {
1426 fprintf(stderr, "Must specify input and output filename\n");
/* strcmp() is non-zero when the name is not "-", i.e. a real file. */
1430 if (strcmp(argv[optind], "-")) {
1431 input_filename = g_strdup(argv[optind]);
1432 input_file = ws_fopen(input_filename, "rb");
1434 fprintf(stderr, "Cannot open file [%s] for reading: %s\n",
1435 input_filename, g_strerror(errno));
1439 input_filename = "Standard input";
1443 if (strcmp(argv[optind+1], "-")) {
1444 output_filename = g_strdup(argv[optind+1]);
1445 output_file = ws_fopen(output_filename, "wb");
1447 fprintf(stderr, "Cannot open file [%s] for writing: %s\n",
1448 output_filename, g_strerror(errno));
1452 output_filename = "Standard output";
1453 output_file = stdout;
1456 /* Some validation: every dummy header option sets hdr_ethernet, so a
 * link type other than 1 (Ethernet) cannot be combined with them. */
1457 if (pcap_link_type != 1 && hdr_ethernet) {
1458 fprintf(stderr, "Dummy headers (-e, -i, -u, -s, -S -T) cannot be specified with link type override (-l)\n");
1462 /* Set up our variables */
1465 input_filename = "Standard input";
1468 output_file = stdout;
1469 output_filename = "Standard output";
1472 ts_sec = time(0); /* initialize to current time */
1473 timecode_default = *localtime(&ts_sec);
1474 timecode_default.tm_isdst = -1; /* Unknown for now, depends on time given to the strptime() function */
1476 /* Display summary of our state */
1478 fprintf(stderr, "Input from: %s\n", input_filename);
1479 fprintf(stderr, "Output to: %s\n", output_filename);
1481 if (hdr_ethernet) fprintf(stderr, "Generate dummy Ethernet header: Protocol: 0x%0lX\n",
1482 hdr_ethernet_proto);
1483 if (hdr_ip) fprintf(stderr, "Generate dummy IP header: Protocol: %ld\n",
1485 if (hdr_udp) fprintf(stderr, "Generate dummy UDP header: Source port: %ld. Dest port: %ld\n",
1486 hdr_src_port, hdr_dest_port);
1487 if (hdr_tcp) fprintf(stderr, "Generate dummy TCP header: Source port: %ld. Dest port: %ld\n",
1488 hdr_src_port, hdr_dest_port);
1489 if (hdr_sctp) fprintf(stderr, "Generate dummy SCTP header: Source port: %ld. Dest port: %ld. Tag: %ld\n",
1490 hdr_sctp_src, hdr_sctp_dest, hdr_sctp_tag);
1491 if (hdr_data_chunk) fprintf(stderr, "Generate dummy DATA chunk header: TSN: %lu. SID: %d. SSN: %d. PPID: %lu\n",
1492 hdr_data_chunk_tsn, hdr_data_chunk_sid, hdr_data_chunk_ssn, hdr_data_chunk_ppid);
1497 main(int argc, char *argv[])
1499 parse_options(argc, argv);
1501 assert(input_file != NULL);
1502 assert(output_file != NULL);
1504 write_file_header();
1509 write_current_packet();
1511 fclose(output_file);
1513 fprintf(stderr, "\n-------------------------\n");
1515 fprintf(stderr, "Read %ld potential packet%s, wrote %ld packet%s\n",
1516 num_packets_read, (num_packets_read==1) ?"":"s",
1517 num_packets_written, (num_packets_written==1)?"":"s");