Replace tabs in files with editor modeline "expandtab"
[metze/wireshark/wip.git] / epan / ftypes / ftype-pcre.c
index d5f58aa681d9fed582e4b6e6e0b61ea998801747..959215ac08976b89e6d6ff7b902b43d96ee99c3a 100644 (file)
@@ -1,6 +1,4 @@
 /*
- * $Id$
- *
  * Wireshark - Network traffic analyzer
  * By Gerald Combs <gerald@wireshark.org>
  * Copyright 2001 Gerald Combs
  *
  * You should have received a copy of the GNU General Public License
  * along with this program; if not, write to the Free Software
- * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
  */
 
 /* Perl-Compatible Regular Expression (PCRE) internal field type.
  * Used with the "matches" dfilter operator, allowing efficient
  * compilation and studying of a PCRE pattern in dfilters.
- *
- * PCRE is provided with libpcre (http://www.pcre.org/).
  */
 
-#ifdef HAVE_CONFIG_H
 #include "config.h"
-#endif
 
 #include <ftypes-int.h>
 
-#ifdef HAVE_LIBPCRE
-
+#include <glib.h>
 #include <string.h>
 
-#include <pcre.h>
-
-/* Create a pcre_tuple_t object based on the given string pattern */ 
-static pcre_tuple_t *
-pcre_tuple_new(const char *value)
-{
-       pcre_tuple_t *tuple;
-       const char *pcre_error_text;
-       int pcre_error_offset;
-
-       tuple = g_malloc(sizeof(pcre_tuple_t));
-       tuple->string = g_strdup(value); /* The RE as string */
-       tuple->ex = NULL;
-       /* Compile the RE */
-       tuple->re = pcre_compile(
-                       value,                          /* pattern */
-                       0,                                      /* PCRE options */
-                       &pcre_error_text,       /* PCRE constant error string */
-                       &pcre_error_offset,     /* Start offset of error in pattern */
-                       NULL                            /* Default char tables (C locale) */
-                       );
-       if (pcre_error_text) {
-               tuple->error = g_strdup_printf("In regular expression \"%s\":\n"
-                               "%s (character position %d)",
-                               value, pcre_error_text, pcre_error_offset);
-               return tuple;
-       } else {
-               tuple->error = NULL;
-       }
-       /* Study the RE */
-       tuple->ex = pcre_study(tuple->re, 0, &pcre_error_text);
-       if (pcre_error_text) {
-               if (tuple->error) {
-                       tuple->error = g_strdup_printf("In regular expression \"%s\":\n"
-                                       "%s. %s",
-                                       value, tuple->error, pcre_error_text);
-               } else {
-                       tuple->error = g_strdup_printf("In regular expression \"%s\":\n"
-                                       "%s",
-                                       value, pcre_error_text);
-               }
-       }
-       return tuple;
-}
-
 static void
-pcre_tuple_free(pcre_tuple_t *tuple)
+gregex_fvalue_new(fvalue_t *fv)
 {
-       if (tuple) {
-               if (tuple->string) g_free(tuple->string);
-               if (tuple->re) g_free(tuple->re);
-               if (tuple->ex) g_free(tuple->ex);
-               if (tuple->error) g_free(tuple->error);
-               g_free(tuple);
-       }
+    fv->value.re = NULL;
 }
 
 static void
-pcre_fvalue_new(fvalue_t *fv)
+gregex_fvalue_free(fvalue_t *fv)
 {
-       fv->value.re = NULL;
+    if (fv->value.re) {
+        g_regex_unref(fv->value.re);
+        fv->value.re = NULL;
+    }
 }
 
-static void
-pcre_fvalue_free(fvalue_t *fv)
+/* Determines whether pattern needs to match raw byte sequences */
+static gboolean
+raw_flag_needed(const gchar *pattern)
 {
-       if (fv->value.re) {
-               pcre_tuple_free(fv->value.re);
-       }
+    gboolean found = FALSE;
+    const gchar *s = pattern;
+    size_t i, len;
+
+    /* find any character whose hex value is two letters */
+    len = strlen(s);
+    for (i = 0; i < len; i++) {
+        /* Upper and lower-nibble must be >= 0xA */
+        if ((guchar)(s[i] & 0xF0) >= 0xA0 &&
+            (guchar)(s[i] & 0x0F) >= 0x0A)
+        {
+            found = TRUE;
+            break;
+        }
+    }
+    return found;
 }
 
 /* Generate a FT_PCRE from a parsed string pattern.
- * Uses the specified logfunc() to report errors. */
+ * On failure, if err_msg is non-null, set *err_msg to point to a
+ * g_malloc()ed error message. */
 static gboolean
-val_from_string(fvalue_t *fv, char *pattern, LogFunc logfunc)
+val_from_string(fvalue_t *fv, const char *pattern, gchar **err_msg)
 {
-       /* Free up the old value, if we have one */
-       pcre_fvalue_free(fv);
-
-       fv->value.re = pcre_tuple_new(pattern);
-       if (fv->value.re->error) {
-               logfunc(fv->value.re->error);
-               return FALSE;
-       }
-       return TRUE;
+    GError *regex_error = NULL;
+    GRegexCompileFlags cflags = G_REGEX_OPTIMIZE;
+
+    /* Set RAW flag only if pattern requires matching raw byte
+       sequences. Otherwise, omit it so that GRegex treats its
+       input as UTF8-encoded string. */
+    if (raw_flag_needed(pattern)) {
+        cflags = (GRegexCompileFlags)(G_REGEX_OPTIMIZE | G_REGEX_RAW);
+    }
+
+    /* Free up the old value, if we have one */
+    gregex_fvalue_free(fv);
+
+    fv->value.re = g_regex_new(
+            pattern,            /* pattern */
+            cflags,             /* Compile options */
+            (GRegexMatchFlags)0,                  /* Match options */
+            &regex_error        /* Compile / study errors */
+            );
+
+    if (regex_error) {
+        if (err_msg) {
+            *err_msg = g_strdup(regex_error->message);
+        }
+        g_error_free(regex_error);
+        if (fv->value.re) {
+            g_regex_unref(fv->value.re);
+        }
+        return FALSE;
+    }
+    return TRUE;
 }
 
 /* Generate a FT_PCRE from an unparsed string pattern.
- * Uses the specified logfunc() to report errors. */
+ * On failure, if err_msg is non-null, set *err_msg to point to a
+ * g_malloc()ed error message. */
 static gboolean
-val_from_unparsed(fvalue_t *fv, char *pattern, gboolean allow_partial_value _U_, LogFunc logfunc)
+val_from_unparsed(fvalue_t *fv, const char *pattern, gboolean allow_partial_value _U_, gchar **err_msg)
 {
-       /* Free up the old value, if we have one */
-       pcre_fvalue_free(fv);
-       g_assert(! allow_partial_value);
+    g_assert(! allow_partial_value);
 
-       fv->value.re = pcre_tuple_new(pattern);
-       if (fv->value.re->error) {
-               logfunc(fv->value.re->error);
-               return FALSE;
-       }
-       return TRUE;
+    return val_from_string(fv, pattern, err_msg);
 }
 
 static int
-pcre_repr_len(fvalue_t *fv, ftrepr_t rtype)
+gregex_repr_len(fvalue_t *fv, ftrepr_t rtype, int field_display _U_)
 {
-       g_assert(rtype == FTREPR_DFILTER);
-       return strlen(fv->value.re->string);
+    g_assert(rtype == FTREPR_DFILTER);
+    return (int)strlen(g_regex_get_pattern(fv->value.re));
 }
 
 static void
-pcre_to_repr(fvalue_t *fv, ftrepr_t rtype, char *buf)
+gregex_to_repr(fvalue_t *fv, ftrepr_t rtype, int field_display _U_, char *buf)
 {
-       g_assert(rtype == FTREPR_DFILTER);
-       strcpy(buf, fv->value.re->string);
+    g_assert(rtype == FTREPR_DFILTER);
+    strcpy(buf, g_regex_get_pattern(fv->value.re));
 }
 
 /* BEHOLD - value contains the string representation of the regular expression,
  * and we want to store the compiled PCRE RE object into the value. */
 static void
-pcre_fvalue_set(fvalue_t *fv, gpointer value, gboolean already_copied)
+gregex_fvalue_set(fvalue_t *fv, const char *value)
 {
-       g_assert(value != NULL);
-       /* Free up the old value, if we have one */
-       pcre_fvalue_free(fv);
-       g_assert(! already_copied);
-       fv->value.re = pcre_tuple_new(value);
+    g_assert(value != NULL);
+    /* Free up the old value, if we have one */
+    gregex_fvalue_free(fv);
+    val_from_unparsed(fv, value, FALSE, NULL);
 }
 
 static gpointer
-pcre_fvalue_get(fvalue_t *fv)
+gregex_fvalue_get(fvalue_t *fv)
 {
-       return fv->value.re;
+    return fv->value.re;
 }
 
 void
 ftype_register_pcre(void)
 {
-       static ftype_t pcre_type = {
-               FT_PCRE,                /* ftype */
-               "FT_PCRE",              /* name */
-               "Compiled Perl-Compatible Regular Expression object", /* pretty_name */
-               0,                      /* wire_size */
-               pcre_fvalue_new,        /* new_value */
-               pcre_fvalue_free,       /* free_value */
-               val_from_unparsed,      /* val_from_unparsed */
-               val_from_string,        /* val_from_string */
-               pcre_to_repr,           /* val_to_string_repr */
-               pcre_repr_len,          /* len_string_repr */
-
-               pcre_fvalue_set,        /* set_value */
-               NULL,                   /* set_value_integer */
-               NULL,                   /* set_value_integer64 */
-               NULL,                   /* set_value_floating */
-
-               pcre_fvalue_get,        /* get_value */
-               NULL,                   /* get_value_integer */
-               NULL,                   /* get_value_integer64 */
-               NULL,                   /* get_value_floating */
-
-               NULL,                   /* cmp_eq */
-               NULL,                   /* cmp_ne */
-               NULL,                   /* cmp_gt */
-               NULL,                   /* cmp_ge */
-               NULL,                   /* cmp_lt */
-               NULL,                   /* cmp_le */
-               NULL,                   /* cmp_bitwise_and */
-               NULL,                   /* cmp_contains */
-               NULL,                   /* cmp_matches */
-
-               NULL,                   /* len */
-               NULL,                   /* slice */
-       };
-       ftype_register(FT_PCRE, &pcre_type);
+    static ftype_t pcre_type = {
+        FT_PCRE,            /* ftype */
+        "FT_PCRE",          /* name */
+        "Compiled Perl-Compatible Regular Expression (GRegex) object", /* pretty_name */
+        0,                  /* wire_size */
+        gregex_fvalue_new,  /* new_value */
+        gregex_fvalue_free, /* free_value */
+        val_from_unparsed,  /* val_from_unparsed */
+        val_from_string,    /* val_from_string */
+        gregex_to_repr,     /* val_to_string_repr */
+        gregex_repr_len,    /* len_string_repr */
+
+        NULL,               /* set_value_byte_array */
+        NULL,               /* set_value_bytes */
+        NULL,               /* set_value_guid */
+        NULL,               /* set_value_time */
+        gregex_fvalue_set,  /* set_value_string */
+        NULL,               /* set_value_tvbuff */
+        NULL,               /* set_value_uinteger */
+        NULL,               /* set_value_sinteger */
+        NULL,               /* set_value_uinteger64 */
+        NULL,               /* set_value_sinteger64 */
+        NULL,               /* set_value_floating */
+
+        gregex_fvalue_get,  /* get_value */
+        NULL,               /* get_value_uinteger */
+        NULL,               /* get_value_sinteger */
+        NULL,               /* get_value_uinteger64 */
+        NULL,               /* get_value_sinteger64 */
+        NULL,               /* get_value_floating */
+
+        NULL,               /* cmp_eq */
+        NULL,               /* cmp_ne */
+        NULL,               /* cmp_gt */
+        NULL,               /* cmp_ge */
+        NULL,               /* cmp_lt */
+        NULL,               /* cmp_le */
+        NULL,               /* cmp_bitwise_and */
+        NULL,               /* cmp_contains */
+        NULL,               /* cmp_matches */
+
+        NULL,               /* len */
+        NULL,               /* slice */
+    };
+    ftype_register(FT_PCRE, &pcre_type);
 }
 
-#else /* HAVE_LIBPCRE */
-
-void
-ftype_register_pcre(void)
-{
-       static ftype_t pcre_type = {
-               FT_PCRE,                /* ftype */
-               "FT_PCRE",                      /* name */
-               "Compiled Perl-Compatible Regular Expression object", /* pretty_name */
-               0,                              /* wire_size */
-               NULL,                           /* new_value */
-               NULL,                           /* free_value */
-               NULL,                           /* val_from_unparsed */
-               NULL,                           /* val_from_string */
-               NULL,                           /* val_to_string_repr */
-               NULL,                           /* len_string_repr */
-
-               NULL,                           /* set_value */
-               NULL,                           /* set_value_uinteger */
-               NULL,                           /* set_value_sinteger */
-               NULL,                           /* set_value_integer64 */
-               NULL,                           /* set_value_floating */
-
-               NULL,                           /* get_value */
-               NULL,                           /* get_value_uinteger */
-               NULL,                           /* get_value_sinteger */
-               NULL,                           /* get_value_integer64 */
-               NULL,                           /* get_value_floating */ 
-
-               NULL,                           /* cmp_eq */
-               NULL,                           /* cmp_ne */
-               NULL,                           /* cmp_gt */
-               NULL,                           /* cmp_ge */
-               NULL,                           /* cmp_lt */
-               NULL,                           /* cmp_le */
-               NULL,                           /* cmp_bitwise_and */
-               NULL,                           /* cmp_contains */
-               NULL,                           /* cmp_matches */
-
-               NULL,                           /* len */
-               NULL,                           /* slice */
-       };
-       ftype_register(FT_PCRE, &pcre_type);
-}
-
-#endif /* HAVE_LIBPCRE */
+/*
+ * Editor modelines  -  http://www.wireshark.org/tools/modelines.html
+ *
+ * Local variables:
+ * c-basic-offset: 4
+ * tab-width: 8
+ * indent-tabs-mode: nil
+ * End:
+ *
+ * vi: set shiftwidth=4 tabstop=8 expandtab:
+ * :indentSize=4:tabSize=8:noTabs=true:
+ */