Split GRegex into GRegex and GMatchInfo. (#419368, Marco Barisione)

author Matthias Clasen <mclasen@redhat.com>

Mon, 30 Apr 2007 16:02:26 +0000 (16:02 +0000)

committer Matthias Clasen <matthiasc@src.gnome.org>

Mon, 30 Apr 2007 16:02:26 +0000 (16:02 +0000)
author Matthias Clasen <mclasen@redhat.com>
Mon, 30 Apr 2007 16:02:26 +0000 (16:02 +0000)
committer Matthias Clasen <matthiasc@src.gnome.org>
Mon, 30 Apr 2007 16:02:26 +0000 (16:02 +0000)
diff --git a/ChangeLog b/ChangeLog

index d4e32e7..36f9958 100644 (file)
--- a/ChangeLog
+++ b/ChangeLog
@@ -1,3 +1,11 @@
+2007-04-30  Matthias Clasen  <mclasen@redhat.com>
+
+       * glib/glib.symbols:
+       * glib/gregex.[hc]: Split GRegex into GRegex and GMatchInfo.
+       (#419368, Marco Barisione)
+
+       * tests/regex-test.c: Adapt.
+
  2007-04-30  Chris Wilson  <chris@chris-wilson.co.uk>
  
         * glib/gbookmarkfile.c (g_bookmark_file_get_app_info):
diff --git a/docs/reference/ChangeLog b/docs/reference/ChangeLog

index 643fe90..7633c90 100644 (file)
--- a/docs/reference/ChangeLog
+++ b/docs/reference/ChangeLog
@@ -1,3 +1,9 @@
+2007-04-30  Matthias Clasen  <mclasen@redhat.com>
+
+       * glib/glib-sections.txt: 
+       * glib/tmpl/gregex.sgml: Update for the GRegex/GMatchInfo
+       split.
+
  2007-04-24  Matthias Clasen  <mclasen@redhat.com>
  
         * glib/glib-sections.txt: Add g_option_context_get_help.
diff --git a/docs/reference/glib/glib-sections.txt b/docs/reference/glib/glib-sections.txt

index 8eb60dc..4aa8656 100644 (file)
--- a/docs/reference/glib/glib-sections.txt
+++ b/docs/reference/glib/glib-sections.txt
@@ -874,35 +874,31 @@ GRegex
  GRegexEvalCallback
  g_regex_new
  g_regex_free
-g_regex_optimize
-g_regex_copy
  g_regex_get_pattern
-g_regex_clear
+g_regex_get_string_number
+g_regex_escape_string
  g_regex_match_simple
  g_regex_match
  g_regex_match_full
-g_regex_match_next
-g_regex_match_next_full
  g_regex_match_all
  g_regex_match_all_full
-g_regex_get_match_count
-g_regex_is_partial_match
-g_regex_fetch
-g_regex_fetch_pos
-g_regex_fetch_named
-g_regex_fetch_named_pos
-g_regex_fetch_all
-g_regex_get_string_number
  g_regex_split_simple
  g_regex_split
  g_regex_split_full
-g_regex_split_next
-g_regex_split_next_full
-g_regex_expand_references
  g_regex_replace
  g_regex_replace_literal
  g_regex_replace_eval
-g_regex_escape_string
+GMatchInfo
+g_match_info_free
+g_match_info_next
+g_match_info_get_match_count
+g_match_info_is_partial_match
+g_match_info_expand_references
+g_match_info_fetch
+g_match_info_fetch_pos
+g_match_info_fetch_named
+g_match_info_fetch_named_pos
+g_match_info_fetch_all
  <SUBSECTION Private>
  g_regex_error_quark
  </SECTION>
diff --git a/docs/reference/glib/tmpl/gregex.sgml b/docs/reference/glib/tmpl/gregex.sgml

index e1577c2..54b6806 100644 (file)
--- a/docs/reference/glib/tmpl/gregex.sgml
+++ b/docs/reference/glib/tmpl/gregex.sgml
@@ -56,10 +56,10 @@ encountered. This indicates a comment that lasts until after the next
  newline.
  </para>
  <para>
-If you have two threads manipulating the same #GRegex, they must use a
-lock to synchronize their operation, as these functions are not threadsafe.
-Creating and manipulating different #GRegex structures from different
-threads is not a problem.
+Creating and manipulating the same #GRegex structure from different
+threads is not a problem as #GRegex does not modify its internal
+state between creation and destruction, on the other hand #GMatchInfo is
+not threadsafe.
  </para>
  <para>
  The regular expressions low level functionalities are obtained through
@@ -81,7 +81,7 @@ Error codes returned by regular expressions functions.
  </para>
  
  @G_REGEX_ERROR_COMPILE: Compilation of the regular expression in g_regex_new() failed.
-@G_REGEX_ERROR_OPTIMIZE: Optimization of the regular expression in g_regex_optimize() failed.
+@G_REGEX_ERROR_OPTIMIZE: Optimization of the regular expression failed.
  @G_REGEX_ERROR_REPLACE: Replacement failed due to an ill-formed replacement string.
  @G_REGEX_ERROR_MATCH: The match process failed.
  @Since: 2.14
@@ -139,6 +139,9 @@ flag they are considered as a raw sequence of bytes.
  parentheses in the pattern. Any opening parenthesis that is not followed
  by "?" behaves as if it were followed by "?:" but named parentheses can
  still be used for capturing (and they acquire numbers in the usual way).
+@G_REGEX_OPTIMIZE: Optimize the regular expression. If the pattern will
+be used many times, then it may be worth the effort to optimize it to
+improve the speed of matches.
  @G_REGEX_DUPNAMES: Names used to identify capturing subpatterns need not
  be unique. This can be helpful for certain types of pattern when it is known
  that only one instance of the named subpattern can ever be matched.
@@ -204,17 +207,12 @@ It is called for each occurance of the pattern @regex in @string, and it
  should append the replacement to @result.
  </para>
  
-<para>
-Do not call on @regex functions that modify its internal state, such as
-g_regex_match(); if you need it you can create a temporary copy of
-@regex using g_regex_copy().
-</para>
-
-@Param1: a #GRegex.
-@Param2: the string used to perform matches against.
-@Param3: a #GString containing the new string.
-@Param4: user data passed to g_regex_replace_eval().
-@Returns: %FALSE to continue the replacement process, %TRUE to stop it.
+@Param1: the #GRegex passed to g_regex_replace_eval()
+@Param2: the #GMatchInfo generated by the match
+@Param3: the string used to perform matches against
+@Param4: a #GString containing the new string
+@Param5: user data passed to g_regex_replace_eval()
+@Returns: %FALSE to continue the replacement process, %TRUE to stop it
  @Since: 2.14
  
  
@@ -238,42 +236,35 @@ g_regex_match(); if you need it you can create a temporary copy of
  @regex: 
  
  
-<!-- ##### FUNCTION g_regex_optimize ##### -->
+<!-- ##### FUNCTION g_regex_get_pattern ##### -->
  <para>
  
  </para>
  
  @regex: 
-@error: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_copy ##### -->
+<!-- ##### FUNCTION g_regex_get_string_number ##### -->
  <para>
  
  </para>
  
  @regex: 
+@name: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_get_pattern ##### -->
+<!-- ##### FUNCTION g_regex_escape_string ##### -->
  <para>
  
  </para>
  
-@regex: 
+@string: 
+@length: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_clear ##### -->
-<para>
-
-</para>
-
-@regex: 
-
-
  <!-- ##### FUNCTION g_regex_match_simple ##### -->
  <para>
  
@@ -294,6 +285,7 @@ g_regex_match(); if you need it you can create a temporary copy of
  @regex: 
  @string: 
  @match_options: 
+@match_info: 
  @Returns: 
  
  
@@ -307,11 +299,12 @@ g_regex_match(); if you need it you can create a temporary copy of
  @string_len: 
  @start_position: 
  @match_options: 
+@match_info: 
  @error: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_match_next ##### -->
+<!-- ##### FUNCTION g_regex_match_all ##### -->
  <para>
  
  </para>
@@ -319,10 +312,11 @@ g_regex_match(); if you need it you can create a temporary copy of
  @regex: 
  @string: 
  @match_options: 
+@match_info: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_match_next_full ##### -->
+<!-- ##### FUNCTION g_regex_match_all_full ##### -->
  <para>
  
  </para>
@@ -332,247 +326,201 @@ g_regex_match(); if you need it you can create a temporary copy of
  @string_len: 
  @start_position: 
  @match_options: 
+@match_info: 
  @error: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_match_all ##### -->
+<!-- ##### FUNCTION g_regex_split_simple ##### -->
  <para>
  
  </para>
  
-@regex: 
+@pattern: 
  @string: 
+@compile_options: 
  @match_options: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_match_all_full ##### -->
+<!-- ##### FUNCTION g_regex_split ##### -->
  <para>
  
  </para>
  
  @regex: 
  @string: 
-@string_len: 
-@start_position: 
  @match_options: 
-@error: 
-@Returns: 
-
-
-<!-- ##### FUNCTION g_regex_get_match_count ##### -->
-<para>
-
-</para>
-
-@regex: 
-@Returns: 
-
-
-<!-- ##### FUNCTION g_regex_is_partial_match ##### -->
-<para>
-
-</para>
-
-@regex: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_fetch ##### -->
+<!-- ##### FUNCTION g_regex_split_full ##### -->
  <para>
  
  </para>
  
  @regex: 
-@match_num: 
  @string: 
+@string_len: 
+@start_position: 
+@match_options: 
+@max_tokens: 
+@error: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_fetch_pos ##### -->
-<para>
-
-</para>
-
-@regex: 
-@match_num: 
-@start_pos: 
-@end_pos: 
-@Returns: 
-
-
-<!-- ##### FUNCTION g_regex_fetch_named ##### -->
+<!-- ##### FUNCTION g_regex_replace ##### -->
  <para>
  
  </para>
  
  @regex: 
-@name: 
  @string: 
+@string_len: 
+@start_position: 
+@replacement: 
+@match_options: 
+@error: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_fetch_named_pos ##### -->
+<!-- ##### FUNCTION g_regex_replace_literal ##### -->
  <para>
  
  </para>
  
  @regex: 
-@name: 
-@start_pos: 
-@end_pos: 
+@string: 
+@string_len: 
+@start_position: 
+@replacement: 
+@match_options: 
+@error: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_fetch_all ##### -->
+<!-- ##### FUNCTION g_regex_replace_eval ##### -->
  <para>
  
  </para>
  
  @regex: 
  @string: 
+@string_len: 
+@start_position: 
+@match_options: 
+@eval: 
+@user_data: 
+@error: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_get_string_number ##### -->
+<!-- ##### STRUCT GMatchInfo ##### -->
  <para>
-
+#GMatchInfo is used to retrieve information about the regular expression match
+which created it.
+This structure is opaque and its fields cannot be accessed directly.
  </para>
  
-@regex: 
-@name: 
-@Returns: 
-
+@Since: 2.14
  
-<!-- ##### FUNCTION g_regex_split_simple ##### -->
+<!-- ##### FUNCTION g_match_info_free ##### -->
  <para>
  
  </para>
  
-@pattern: 
-@string: 
-@compile_options: 
-@match_options: 
-@Returns: 
+@match_info: 
  
  
-<!-- ##### FUNCTION g_regex_split ##### -->
+<!-- ##### FUNCTION g_match_info_next ##### -->
  <para>
  
  </para>
  
-@regex: 
-@string: 
-@match_options: 
+@match_info: 
+@error: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_split_full ##### -->
+<!-- ##### FUNCTION g_match_info_get_match_count ##### -->
  <para>
  
  </para>
  
-@regex: 
-@string: 
-@string_len: 
-@start_position: 
-@match_options: 
-@max_tokens: 
-@error: 
+@match_info: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_split_next ##### -->
+<!-- ##### FUNCTION g_match_info_is_partial_match ##### -->
  <para>
  
  </para>
  
-@regex: 
-@string: 
-@match_options: 
+@match_info: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_split_next_full ##### -->
+<!-- ##### FUNCTION g_match_info_expand_references ##### -->
  <para>
  
  </para>
  
-@regex: 
-@string: 
-@string_len: 
-@start_position: 
-@match_options: 
+@match_info: 
+@string_to_expand: 
  @error: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_expand_references ##### -->
+<!-- ##### FUNCTION g_match_info_fetch ##### -->
  <para>
  
  </para>
  
-@regex: 
-@string: 
-@string_to_expand: 
-@error: 
+@match_info: 
+@match_num: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_replace ##### -->
+<!-- ##### FUNCTION g_match_info_fetch_pos ##### -->
  <para>
  
  </para>
  
-@regex: 
-@string: 
-@string_len: 
-@start_position: 
-@replacement: 
-@match_options: 
-@error: 
+@match_info: 
+@match_num: 
+@start_pos: 
+@end_pos: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_replace_literal ##### -->
+<!-- ##### FUNCTION g_match_info_fetch_named ##### -->
  <para>
  
  </para>
  
-@regex: 
-@string: 
-@string_len: 
-@start_position: 
-@replacement: 
-@match_options: 
-@error: 
+@match_info: 
+@name: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_replace_eval ##### -->
+<!-- ##### FUNCTION g_match_info_fetch_named_pos ##### -->
  <para>
  
  </para>
  
-@regex: 
-@string: 
-@string_len: 
-@start_position: 
-@match_options: 
-@eval: 
-@user_data: 
-@error: 
+@match_info: 
+@name: 
+@start_pos: 
+@end_pos: 
  @Returns: 
  
  
-<!-- ##### FUNCTION g_regex_escape_string ##### -->
+<!-- ##### FUNCTION g_match_info_fetch_all ##### -->
  <para>
  
  </para>
  
-@string: 
-@length: 
+@match_info: 
  @Returns: 
  
  
diff --git a/glib/glib.symbols b/glib/glib.symbols

index 57de381..89da36c 100644 (file)
--- a/glib/glib.symbols
+++ b/glib/glib.symbols
@@ -1424,35 +1424,31 @@ g_get_codeset
  g_regex_error_quark
  g_regex_new
  g_regex_free
-g_regex_optimize
-g_regex_copy
  g_regex_get_pattern
-g_regex_clear
+g_regex_get_string_number
+g_regex_escape_string
  g_regex_match_simple
  g_regex_match
  g_regex_match_full
-g_regex_match_next
-g_regex_match_next_full
  g_regex_match_all
  g_regex_match_all_full
-g_regex_get_match_count
-g_regex_is_partial_match
-g_regex_fetch
-g_regex_fetch_pos
-g_regex_fetch_named
-g_regex_fetch_named_pos
-g_regex_fetch_all
-g_regex_get_string_number
  g_regex_split_simple
  g_regex_split
  g_regex_split_full
-g_regex_split_next
-g_regex_split_next_full
-g_regex_expand_references
  g_regex_replace
  g_regex_replace_literal
  g_regex_replace_eval
-g_regex_escape_string
+g_match_info_free
+g_match_info_next
+g_match_info_matches
+g_match_info_get_match_count
+g_match_info_is_partial_match
+g_match_info_expand_references
+g_match_info_fetch
+g_match_info_fetch_pos
+g_match_info_fetch_named
+g_match_info_fetch_named_pos
+g_match_info_fetch_all
  #endif
  #endif
  
diff --git a/glib/gregex.c b/glib/gregex.c

index 043ec64..756c1a1 100644 (file)
--- a/glib/gregex.c
+++ b/glib/gregex.c
@@ -45,6 +45,7 @@
                               G_REGEX_UNGREEDY          | \
                               G_REGEX_RAW               | \
                               G_REGEX_NO_AUTO_CAPTURE   | \
+                             G_REGEX_OPTIMIZE          | \
                               G_REGEX_DUPNAMES          | \
                               G_REGEX_NEWLINE_CR        | \
                               G_REGEX_NEWLINE_LF        | \
@@ -63,54 +64,54 @@
  
  /* if the string is in UTF-8 use g_utf8_ functions, else use
   * use just +/- 1. */
-#define NEXT_CHAR(re, s) (((re)->pattern->compile_opts & PCRE_UTF8) ? \
+#define NEXT_CHAR(re, s) (((re)->compile_opts & PCRE_UTF8) ? \
                                 g_utf8_next_char (s) : \
                                 ((s) + 1))
-#define PREV_CHAR(re, s) (((re)->pattern->compile_opts & PCRE_UTF8) ? \
+#define PREV_CHAR(re, s) (((re)->compile_opts & PCRE_UTF8) ? \
                                 g_utf8_prev_char (s) : \
                                 ((s) - 1))
  
-#define WORKSPACE_INITIAL 1000
-#define OFFSETS_DFA_MIN_SIZE 21
-
-/* atomically returns the pcre_extra struct in the regex. */
-#define REGEX_GET_EXTRA(re) ((pcre_extra *)g_atomic_pointer_get (&(re)->pattern->extra))
-
-/* this struct can be shared by more regexes */
-typedef struct
+struct _GMatchInfo
  {
-  volatile guint ref_count;    /* the ref count for the immutable part */
-  gchar *pattern;              /* the pattern */
-  pcre *pcre_re;               /* compiled form of the pattern */
-  GRegexCompileFlags compile_opts;     /* options used at compile time on the pattern */
+  GRegex *regex;               /* the regex */
    GRegexMatchFlags match_opts; /* options used at match time on the regex */
-  pcre_extra *extra;           /* data stored when g_regex_optimize() is used */
-} GRegexPattern;
-
-/* this struct is used only by a single regex */
-typedef struct
-{
    gint matches;                        /* number of matching sub patterns */
    gint pos;                    /* position in the string where last match left off */
    gint *offsets;               /* array of offsets paired 0,1 ; 2,3 ; 3,4 etc */
    gint n_offsets;              /* number of offsets */
    gint *workspace;             /* workspace for pcre_dfa_exec() */
    gint n_workspace;            /* number of workspace elements */
-  gssize string_len;           /* length of the string last used against */
-  GSList *delims;              /* delimiter sub strings from split next */
-  gint last_separator_end;     /* position of the last separator for split_next_full() */
-  gboolean last_match_is_empty;        /* was the last match in split_next_full() 0 bytes long? */
-} GRegexMatch;
+  const gchar *string;         /* string passed to the match function */
+  gssize string_len;           /* length of string */
+};
  
  struct _GRegex
  {
-  GRegexPattern *pattern;      /* immutable part, shared */
-  GRegexMatch *match;          /* mutable part, not shared */
+  volatile guint ref_count;    /* the ref count for the immutable part */
+  gchar *pattern;              /* the pattern */
+  pcre *pcre_re;               /* compiled form of the pattern */
+  GRegexCompileFlags compile_opts;     /* options used at compile time on the pattern */
+  GRegexMatchFlags match_opts; /* options used at match time on the regex */
+  pcre_extra *extra;           /* data stored when G_REGEX_OPTIMIZE is used */
  };
  
  /* TRUE if ret is an error code, FALSE otherwise. */
  #define IS_PCRE_ERROR(ret) ((ret) < PCRE_ERROR_NOMATCH && (ret) != PCRE_ERROR_PARTIAL)
  
+static GRegex  *regex_ref      (GRegex *regex);
+static void     regex_unref    (GRegex *regex);
+
+typedef struct _InterpolationData InterpolationData;
+static gboolean         interpolate_replacement        (const GRegex *regex,
+                                                const GMatchInfo *match_info,
+                                                const gchar *string,
+                                                GString *result,
+                                                gpointer data);
+static GList   *split_replacement              (const gchar *replacement,
+                                                GError **error);
+static void     free_interpolation_data        (InterpolationData *data);
+
+
  static const gchar *
  match_error (gint errcode)
  {
@@ -159,7 +160,7 @@ match_error (gint errcode)
      case PCRE_ERROR_DFA_UCOND:
        return _("back references as conditions are not supported for partial matching");
      case PCRE_ERROR_DFA_UMLIMIT:
-      /* the match_field field is not udes in GRegex */
+      /* the match_field field is not used in GRegex */
        break;
      case PCRE_ERROR_DFA_WSSIZE:
        /* handled expanding the workspace */
@@ -177,1064 +178,1021 @@ match_error (gint errcode)
    return _("unknown error");
  }
  
-GQuark
-g_regex_error_quark (void)
-{
-  static GQuark error_quark = 0;
-
-  if (error_quark == 0)
-    error_quark = g_quark_from_static_string ("g-regex-error-quark");
  
-  return error_quark;
-}
+/* GMatchInfo */
  
-static GRegexPattern *
-regex_pattern_new (pcre              *re,
-                  const gchar       *pattern,
-                  GRegexCompileFlags compile_options,
-                  GRegexMatchFlags   match_options)
+static GMatchInfo *
+match_info_new (const GRegex *regex,
+               const gchar  *string,
+               gint          string_len,
+               gint          start_position,
+               gint          match_options,
+               gboolean      is_dfa)
  {
-  GRegexPattern *rp = g_new0 (GRegexPattern, 1);
-  rp->ref_count = 1;
-  rp->pcre_re = re;
-  rp->pattern = g_strdup (pattern);
-  rp->compile_opts = compile_options;
-  rp->match_opts = match_options;
-  return rp;
-}
+  GMatchInfo *match_info;
  
-static GRegexPattern *
-regex_pattern_ref (GRegexPattern *rp)
-{
-  /* increases the ref count of the immutable part of the GRegex */
-  g_atomic_int_inc ((gint*) &rp->ref_count);
-  return rp;
-}
+  if (string_len < 0)
+    string_len = strlen (string);
  
-static void
-regex_pattern_unref (GRegexPattern *rp)
-{
-  /* decreases the ref count of the immutable part of the GRegex
-   * and deletes it if the ref count went to 0 */
-  if (g_atomic_int_exchange_and_add ((gint *) &rp->ref_count, -1) - 1 == 0)
+  match_info = g_new0 (GMatchInfo, 1);
+  match_info->regex = regex_ref ((GRegex *)regex);
+  match_info->string = string;
+  match_info->string_len = string_len;
+  match_info->matches = PCRE_ERROR_NOMATCH;
+  match_info->pos = start_position;
+  match_info->match_opts = match_options;
+
+  if (is_dfa)
      {
-      g_free (rp->pattern);
-      if (rp->pcre_re != NULL)
-       pcre_free (rp->pcre_re);
-      if (rp->extra != NULL)
-       pcre_free (rp->extra);
-      g_free (rp);
+      /* These values should be enough for most cases, if they are not
+       * enough g_regex_match_all_full() will expand them. */
+      match_info->n_offsets = 24;
+      match_info->n_workspace = 100;
+      match_info->workspace = g_new (gint, match_info->n_workspace);
      }
-}
-
-static void
-regex_match_free (GRegexMatch *rm)
-{
-  if (rm == NULL)
-    return;
+  else
+    {
+      gint capture_count;
+      pcre_fullinfo (regex->pcre_re, regex->extra,
+                     PCRE_INFO_CAPTURECOUNT, &capture_count);
+      match_info->n_offsets = (capture_count + 1) * 3;
+    }
+  match_info->offsets = g_new0 (gint, match_info->n_offsets);
  
-  g_slist_foreach (rm->delims, (GFunc) g_free, NULL);
-  g_slist_free (rm->delims);
-  g_free (rm->offsets);
-  g_free (rm->workspace);
-  g_free (rm);
+  return match_info;
  }
  
-static void
-regex_lazy_init_match (GRegex *regex,
-                      gint    min_offsets)
+/**
+ * g_match_info_free:
+ * @match_info: a #GMatchInfo
+ *
+ * Frees all the memory associated with the #GMatchInfo structure.
+ *
+ * Since: 2.14
+ */
+void
+g_match_info_free (GMatchInfo *match_info)
  {
-  gint n_offsets;
-
-  if (regex->match != NULL)
-    return;
-
-  pcre_fullinfo (regex->pattern->pcre_re,
-                REGEX_GET_EXTRA (regex),
-                PCRE_INFO_CAPTURECOUNT, &n_offsets);
-  n_offsets = (MAX (n_offsets, min_offsets) + 1) * 3;
-
-  regex->match = g_new0 (GRegexMatch, 1);
-  regex->match->string_len = -1;
-  regex->match->matches = -1000;
-  regex->match->n_offsets = n_offsets;
-  regex->match->offsets = g_new0 (gint, n_offsets);
+  regex_unref (match_info->regex);
+  g_free (match_info->offsets);
+  g_free (match_info->workspace);
+  g_free (match_info);
  }
  
-/** 
- * g_regex_new:
- * @pattern: the regular expression
- * @compile_options: compile options for the regular expression
- * @match_options: match options for the regular expression
- * @error: return location for a #GError
- * 
- * Compiles the regular expression to an internal form, and does the initial
- * setup of the #GRegex structure.  
- * 
- * Returns: a #GRegex structure
+/**
+ * g_match_info_next:
+ * @match_info: a #GMatchInfo structure
+ * @error: location to store the error occuring, or NULL to ignore errors
+ *
+ * Scans for the next match using the same parameters of the previous
+ * call to g_regex_match_full() or g_regex_match() that returned
+ * @match_info.
+ *
+ * The match is done on the string passed to the match function, so you
+ * cannot free it before calling this function.
+ *
+ * Returns: %TRUE is the string matched, %FALSE otherwise
   *
   * Since: 2.14
   */
-GRegex *
-g_regex_new (const gchar         *pattern, 
-            GRegexCompileFlags   compile_options,
-            GRegexMatchFlags     match_options,
-            GError             **error)
+gboolean
+g_match_info_next (GMatchInfo  *match_info,
+                  GError     **error)
  {
-  pcre *re;
-  const gchar *errmsg;
-  gint erroffset;
-  static gboolean initialized = FALSE;
-  
-  g_return_val_if_fail (pattern != NULL, NULL);
-  g_return_val_if_fail (error == NULL || *error == NULL, NULL);
-  g_return_val_if_fail ((compile_options & ~G_REGEX_COMPILE_MASK) == 0, NULL);
-  g_return_val_if_fail ((match_options & ~G_REGEX_MATCH_MASK) == 0, NULL);
-
-  if (!initialized)
+  g_return_val_if_fail (match_info != NULL, FALSE);
+  g_return_val_if_fail (error == NULL || *error == NULL, FALSE);
+  g_return_val_if_fail (match_info->pos >= 0, FALSE);
+
+  match_info->matches = pcre_exec (match_info->regex->pcre_re,
+                                  match_info->regex->extra,
+                                  match_info->string,
+                                  match_info->string_len,
+                                  match_info->pos,
+                                  match_info->regex->match_opts |
+                                  match_info->match_opts,
+                                  match_info->offsets,
+                                   match_info->n_offsets);
+  if (IS_PCRE_ERROR (match_info->matches))
      {
-      gint support;
-      const gchar *msg;
-
-      pcre_config (PCRE_CONFIG_UTF8, &support);
-      if (!support)
-       {
-         msg = N_("PCRE library is compiled without UTF8 support");
-         g_critical (msg);
-         g_set_error (error, G_REGEX_ERROR, G_REGEX_ERROR_COMPILE, gettext (msg));
-         return NULL;
-       }
-
-      pcre_config (PCRE_CONFIG_UNICODE_PROPERTIES, &support);
-      if (!support)
-       {
-         msg = N_("PCRE library is compiled without UTF8 properties support");
-         g_critical (msg);
-         g_set_error (error, G_REGEX_ERROR, G_REGEX_ERROR_COMPILE, gettext (msg));
-         return NULL;
-       }
-
-      initialized = TRUE;
+      g_set_error (error, G_REGEX_ERROR, G_REGEX_ERROR_MATCH,
+                  _("Error while matching regular expression %s: %s"),
+                  match_info->regex->pattern, match_error (match_info->matches));
+      return FALSE;
      }
  
-  /* In GRegex the string are, by default, UTF-8 encoded. PCRE
-   * instead uses UTF-8 only if required with PCRE_UTF8. */
-  if (compile_options & G_REGEX_RAW)
+  /* avoid infinite loops if the pattern is an empty string or something
+   * equivalent */
+  if (match_info->pos == match_info->offsets[1])
      {
-      /* disable utf-8 */
-      compile_options &= ~G_REGEX_RAW;
+      if (match_info->pos > match_info->string_len)
+       {
+         /* we have reached the end of the string */
+         match_info->pos = -1;
+          match_info->matches = PCRE_ERROR_NOMATCH;
+         return FALSE;
+        }
+      match_info->pos = NEXT_CHAR (match_info->regex,
+                                  &match_info->string[match_info->pos]) -
+                                  match_info->string;
      }
    else
      {
-      /* enable utf-8 */
-      compile_options |= PCRE_UTF8 | PCRE_NO_UTF8_CHECK;
-      match_options |= PCRE_NO_UTF8_CHECK;
+      match_info->pos = match_info->offsets[1];
      }
  
-  /* compile the pattern */
-  re = pcre_compile (pattern, compile_options, &errmsg, &erroffset, NULL);
-
-  /* if the compilation failed, set the error member and return 
-   * immediately */
-  if (re == NULL)
-    {
-      GError *tmp_error = g_error_new (G_REGEX_ERROR, 
-                                      G_REGEX_ERROR_COMPILE,
-                                      _("Error while compiling regular "
-                                        "expression %s at char %d: %s"),
-                                      pattern, erroffset, errmsg);
-      g_propagate_error (error, tmp_error);
-
-      return NULL;
-    }
-  else
-    {
-      GRegex *regex = g_new0 (GRegex, 1);
-      regex->pattern = regex_pattern_new (re, pattern,
-                                         compile_options, match_options);
-      return regex;
-    }
+  return match_info->matches >= 0;
  }
  
  /**
- * g_regex_free:
- * @regex: a #GRegex
+ * g_match_info_matches:
+ * @match_info: a #GMatchInfo structure
   *
- * Frees all the memory associated with the regex structure.
+ * Returns: %TRUE if the previous match operation succeeded, %FALSE
+ * otherwise
   *
   * Since: 2.14
   */
-void
-g_regex_free (GRegex *regex)
+gboolean
+g_match_info_matches (const GMatchInfo *match_info)
  {
-  if (regex == NULL)
-    return;
+  g_return_val_if_fail (match_info != NULL, FALSE);
  
-  regex_pattern_unref (regex->pattern);
-  regex_match_free (regex->match);
-  g_free (regex);
+  return match_info->matches >= 0;
  }
  
  /**
- * g_regex_copy:
- * @regex: a #GRegex structure from g_regex_new()
+ * g_match_info_get_match_count:
+ * @match_info: a #GMatchInfo structure
   *
- * Copies a #GRegex. The returned #Gregex is in the same state as after
- * a call to g_regex_clear(), so it does not contain information on the
- * last match. If @regex is %NULL it returns %NULL.
+ * Retrieves the number of matched substrings (including substring 0, that
+ * is the whole matched text), so 1 is returned if the pattern has no
+ * substrings in it and 0 is returned if the match failed.
   *
- * The returned copy shares some of its internal state with the original
- * @regex, and the other internal variables are created only when needed,
- * so the copy is a lightweight operation.
+ * If the last match was obtained using the DFA algorithm, that is using
+ * g_regex_match_all() or g_regex_match_all_full(), the retrieved
+ * count is not that of the number of capturing parentheses but that of
+ * the number of matched substrings.
   *
- * Returns: a newly-allocated copy of @regex, or %NULL if an error
- *          occurred
+ * Returns:  Number of matched substrings, or -1 if an error occurred
   *
   * Since: 2.14
   */
-GRegex *
-g_regex_copy (const GRegex *regex)
+gint
+g_match_info_get_match_count (const GMatchInfo *match_info)
  {
-  GRegex *copy;
-
-  if (regex == NULL)
-    return NULL;
+  g_return_val_if_fail (match_info, -1);
  
-  copy = g_new0 (GRegex, 1);
-  copy->pattern = regex_pattern_ref (regex->pattern);
-
-  return copy;
+  if (match_info->matches == PCRE_ERROR_NOMATCH)
+    /* no match */
+    return 0;
+  else if (match_info->matches < PCRE_ERROR_NOMATCH)
+    /* error */
+    return -1;
+  else
+    /* match */
+    return match_info->matches;
  }
  
  /**
- * g_regex_get_pattern:
- * @regex: a #GRegex structure
+ * g_match_info_is_partial_match:
+ * @match_info: a #GMatchInfo structure
   *
- * Gets the pattern string associated with @regex, i.e. a copy of 
- * the string passed to g_regex_new().
+ * Usually if the string passed to g_regex_match*() matches as far as
+ * it goes, but is too short to match the entire pattern, %FALSE is
+ * returned. There are circumstances where it might be helpful to
+ * distinguish this case from other cases in which there is no match.
   *
- * Returns: the pattern of @regex
+ * Consider, for example, an application where a human is required to
+ * type in data for a field with specific formatting requirements. An
+ * example might be a date in the form ddmmmyy, defined by the pattern
+ * "^\d?\d(jan|feb|mar|apr|may|jun|jul|aug|sep|oct|nov|dec)\d\d$".
+ * If the application sees the user’s keystrokes one by one, and can
+ * check that what has been typed so far is potentially valid, it is
+ * able to raise an error as soon as a mistake is made.
   *
- * Since: 2.14
- */
-const gchar *
-g_regex_get_pattern (const GRegex *regex)
-{
-  g_return_val_if_fail (regex != NULL, NULL);
-
-  return regex->pattern->pattern;
-}
-
-/**
- * g_regex_clear:
- * @regex: a #GRegex structure
+ * GRegex supports the concept of partial matching by means of the
+ * #G_REGEX_MATCH_PARTIAL flag. When this is set the return code for
+ * g_regex_match() or g_regex_match_full() is, as usual, %TRUE
+ * for a complete match, %FALSE otherwise. But, when this functions
+ * returns %FALSE, you can check if the match was partial calling
+ * g_match_info_is_partial_match().
+ *
+ * When using partial matching you cannot use g_match_info_fetch*().
+ *
+ * Because of the way certain internal optimizations are implemented the
+ * partial matching algorithm cannot be used with all patterns. So repeated
+ * single characters such as "a{2,4}" and repeated single metasequences such
+ * as "\d+" are not permitted if the maximum number of occurrences is
+ * greater than one. Optional items such as "\d?" (where the maximum is one)
+ * are permitted. Quantifiers with any values are permitted after
+ * parentheses, so the invalid examples above can be coded thus "(a){2,4}"
+ * and "(\d)+". If #G_REGEX_MATCH_PARTIAL is set for a pattern that does
+ * not conform to the restrictions, matching functions return an error.
   *
- * Clears out the members of @regex that are holding information about the
- * last set of matches for this pattern.  g_regex_clear() needs to be
- * called between uses of g_regex_match_next() or g_regex_match_next_full()
- * against new target strings. 
+ * Returns: %TRUE if the match was partial, %FALSE otherwise
   *
   * Since: 2.14
   */
-void
-g_regex_clear (GRegex *regex)
+gboolean
+g_match_info_is_partial_match (const GMatchInfo *match_info)
  {
-  g_return_if_fail (regex != NULL);
-
-  if (regex->match == NULL)
-    return;
-
-  regex->match->matches = -1000; /* an error code not used by PCRE */
-  regex->match->string_len = -1;
-  regex->match->pos = 0;
+  g_return_val_if_fail (match_info != NULL, FALSE);
  
-  /* if the pattern was used with g_regex_split_next(), it may have
-   * delimiter offsets stored.  Free up those guys as well. */
-  if (regex->match->delims != NULL)
-    {
-      g_slist_foreach (regex->match->delims, (GFunc) g_free, NULL);
-      g_slist_free (regex->match->delims);
-      regex->match->delims = NULL;
-    }
+  return match_info->matches == PCRE_ERROR_PARTIAL;
  }
  
  /**
- * g_regex_optimize:
- * @regex: a #GRegex structure
- * @error: return location for a #GError
+ * g_match_info_expand_references:
+ * @match_info: a #GMatchInfo
+ * @string_to_expand: the string to expand
+ * @error: location to store the error occuring, or %NULL to ignore errors
+ *
+ * Returns a new string containing the text in @string_to_expand with
+ * references expanded. References refer to the last match done with
+ * @string against @regex and have the same syntax used by g_regex_replace().
+ *
+ * The @string_to_expand must be UTF-8 encoded even if #G_REGEX_RAW was
+ * passed to g_regex_new().
   *
- * If the pattern will be used many times, then it may be worth the
- * effort to optimize it to improve the speed of matches.
+ * The backreferences are extracted from the string passed to the match
+ * function, so you cannot free it before calling this function.
   *
- * Returns: %TRUE if @regex has been optimized or was already optimized,
- *          %FALSE otherwise
+ * Returns: the expanded string, or %NULL if an error occurred
   *
   * Since: 2.14
   */
-gboolean
-g_regex_optimize (GRegex  *regex,
-                 GError **error)
+gchar *
+g_match_info_expand_references (const GMatchInfo *match_info, 
+                               const gchar      *string_to_expand,
+                               GError          **error)
  {
-  const gchar *errmsg;
-  pcre_extra *extra;
-  pcre_extra G_GNUC_MAY_ALIAS **extra_p;
-
-  g_return_val_if_fail (regex != NULL, FALSE);
-  g_return_val_if_fail (error == NULL || *error == NULL, FALSE);
-
-  if (REGEX_GET_EXTRA (regex) != NULL)
-    /* already optimized. */
-    return TRUE;
+  GString *result;
+  GList *list;
+  GError *tmp_error = NULL;
  
-  extra = pcre_study (regex->pattern->pcre_re, 0, &errmsg);
+  g_return_val_if_fail (match_info != NULL, NULL);
+  g_return_val_if_fail (string_to_expand != NULL, NULL);
+  g_return_val_if_fail (error == NULL || *error == NULL, NULL);
  
-  if (errmsg != NULL)
+  list = split_replacement (string_to_expand, &tmp_error);
+  if (tmp_error != NULL)
      {
-      GError *tmp_error = g_error_new (G_REGEX_ERROR,
-                                      G_REGEX_ERROR_OPTIMIZE, 
-                                      _("Error while optimizing "
-                                        "regular expression %s: %s"),
-                                      regex->pattern->pattern,
-                                      errmsg);
        g_propagate_error (error, tmp_error);
-      return FALSE;
+      return NULL;
      }
  
-  if (extra == NULL)
-    return TRUE;
+  result = g_string_sized_new (strlen (string_to_expand));
+  interpolate_replacement (match_info->regex, match_info,
+                          match_info->string, result, list);
  
-  extra_p = &regex->pattern->extra;
-  if (!g_atomic_pointer_compare_and_exchange ((gpointer *)extra_p, NULL, extra))
-    /* someone else has optimized the regex while this function was running */
-    pcre_free (extra);
+  g_list_foreach (list, (GFunc)free_interpolation_data, NULL);
+  g_list_free (list);
  
-  return TRUE;
+  return g_string_free (result, FALSE);
  }
  
  /**
- * g_regex_match_simple:
- * @pattern: the regular expression
- * @string: the string to scan for matches
- * @compile_options: compile options for the regular expression
- * @match_options: match options
+ * g_match_info_fetch:
+ * @match_info: #GMatchInfo structure
+ * @match_num: number of the sub expression
   *
- * Scans for a match in @string for @pattern.
+ * Retrieves the text matching the @match_num<!-- -->'th capturing parentheses.
+ * 0 is the full text of the match, 1 is the first paren set, 2 the second,
+ * and so on.
   *
- * This function is equivalent to g_regex_match() but it does not
- * require to compile the pattern with g_regex_new(), avoiding some
- * lines of code when you need just to do a match without extracting
- * substrings, capture counts, and so on.
+ * If @match_num is a valid sub pattern but it didn't match anything (e.g.
+ * sub pattern 1, matching "b" against "(a)?b") then an empty string is
+ * returned.
   *
- * If this function is to be called on the same @pattern more than
- * once, it's more efficient to compile the pattern once with
- * g_regex_new() and then use g_regex_match().
+ * If the match was obtained using the DFA algorithm, that is using
+ * g_regex_match_all() or g_regex_match_all_full(), the retrieved
+ * string is not that of a set of parentheses but that of a matched
+ * substring. Substrings are matched in reverse order of length, so 0 is
+ * the longest match.
   *
- * Returns: %TRUE is the string matched, %FALSE otherwise
+ * The string is fetched from the string passed to the match function,
+ * so you cannot free it before calling this function.
+ *
+ * Returns: The matched substring, or %NULL if an error occurred.
+ *          You have to free the string yourself
   *
   * Since: 2.14
   */
-gboolean
-g_regex_match_simple (const gchar        *pattern, 
-                     const gchar        *string, 
-                     GRegexCompileFlags  compile_options,
-                     GRegexMatchFlags    match_options)
+gchar *
+g_match_info_fetch (const GMatchInfo *match_info,
+                   gint              match_num)
  {
-  GRegex *regex;
-  gboolean result;
+  /* we cannot use pcre_get_substring() because it allocates the
+   * string using pcre_malloc(). */
+  gchar *match = NULL;
+  gint start, end;
  
-  regex = g_regex_new (pattern, compile_options, 0, NULL);
-  if (!regex)
-    return FALSE;
-  result = g_regex_match_full (regex, string, -1, 0, match_options, NULL);
-  g_regex_free (regex);
-  return result;
+  g_return_val_if_fail (match_info != NULL, NULL);
+  g_return_val_if_fail (match_num >= 0, NULL);
+
+  /* match_num does not exist or it didn't matched, i.e. matching "b"
+   * against "(a)?b" then group 0 is empty. */
+  if (!g_match_info_fetch_pos (match_info, match_num, &start, &end))
+    match = NULL;
+  else if (start == -1)
+    match = g_strdup ("");
+  else
+    match = g_strndup (&match_info->string[start], end - start);
+
+  return match;
  }
  
  /**
- * g_regex_match:
- * @regex: a #GRegex structure from g_regex_new()
- * @string: the string to scan for matches
- * @match_options: match options
+ * g_match_info_fetch_pos:
+ * @match_info: #GMatchInfo structure
+ * @match_num: number of the sub expression
+ * @start_pos: pointer to location where to store the start position
+ * @end_pos: pointer to location where to store the end position
   *
- * Scans for a match in string for the pattern in @regex. The @match_options
- * are combined with the match options specified when the @regex structure
- * was created, letting you have more flexibility in reusing #GRegex
- * structures.
+ * Retrieves the position of the @match_num<!-- -->'th capturing parentheses.
+ * 0 is the full text of the match, 1 is the first paren set, 2 the second,
+ * and so on.
   *
- * Returns: %TRUE is the string matched, %FALSE otherwise
+ * If @match_num is a valid sub pattern but it didn't match anything (e.g.
+ * sub pattern 1, matching "b" against "(a)?b") then @start_pos and @end_pos
+ * are set to -1 and %TRUE is returned.
+ *
+ * If the match was obtained using the DFA algorithm, that is using
+ * g_regex_match_all() or g_regex_match_all_full(), the retrieved
+ * position is not that of a set of parentheses but that of a matched
+ * substring. Substrings are matched in reverse order of length, so 0 is
+ * the longest match.
+ *
+ * Returns: %TRUE if the position was fetched, %FALSE otherwise. If the
+ *          position cannot be fetched, @start_pos and @end_pos are left
+ *          unchanged.
   *
   * Since: 2.14
   */
  gboolean
-g_regex_match (GRegex          *regex, 
-              const gchar     *string, 
-              GRegexMatchFlags match_options)
+g_match_info_fetch_pos (const GMatchInfo *match_info,
+                       gint              match_num,
+                       gint             *start_pos,
+                       gint             *end_pos)
  {
-  return g_regex_match_full (regex, string, -1, 0,
-                            match_options, NULL);
+  g_return_val_if_fail (match_info != NULL, FALSE);
+  g_return_val_if_fail (match_num >= 0, FALSE);
+ 
+  /* make sure the sub expression number they're requesting is less than
+   * the total number of sub expressions that were matched. */
+  if (match_num >= match_info->matches)
+    return FALSE;
+
+  if (start_pos != NULL)
+    *start_pos = match_info->offsets[2 * match_num];
+
+  if (end_pos != NULL)
+    *end_pos = match_info->offsets[2 * match_num + 1];
+
+  return TRUE;
  }
  
  /**
- * g_regex_match_full:
- * @regex: a #GRegex structure from g_regex_new()
- * @string: the string to scan for matches
- * @string_len: the length of @string, or -1 if @string is nul-terminated
- * @start_position: starting index of the string to match
- * @match_options: match options
- * @error: location to store the error occuring, or %NULL to ignore errors
+ * g_match_info_fetch_named:
+ * @match_info: #GMatchInfo structure
+ * @name: name of the subexpression
   *
- * Scans for a match in string for the pattern in @regex. The @match_options
- * are combined with the match options specified when the @regex structure
- * was created, letting you have more flexibility in reusing #GRegex
- * structures.
+ * Retrieves the text matching the capturing parentheses named @name.
   *
- * Setting @start_position differs from just passing over a shortened string
- * and  setting #G_REGEX_MATCH_NOTBOL in the case of a pattern that begins
- * with any kind of lookbehind assertion, such as "\b".
+ * If @name is a valid sub pattern name but it didn't match anything (e.g.
+ * sub pattern "X", matching "b" against "(?P&lt;X&gt;a)?b") then an empty
+ * string is returned.
   *
- * Returns: %TRUE is the string matched, %FALSE otherwise
+ * The string is fetched from the string passed to the match function,
+ * so you cannot free it before calling this function.
+ *
+ * Returns: The matched substring, or %NULL if an error occurred.
+ *          You have to free the string yourself
   *
   * Since: 2.14
   */
-gboolean
-g_regex_match_full (GRegex          *regex,
-                   const gchar       *string,
-                   gssize             string_len,
-                   gint               start_position,
-                   GRegexMatchFlags match_options,
-                   GError           **error)
+gchar *
+g_match_info_fetch_named (const GMatchInfo *match_info,
+                         const gchar      *name)
  {
-  g_return_val_if_fail (regex != NULL, FALSE);
-  g_return_val_if_fail (string != NULL, FALSE);
-  g_return_val_if_fail (start_position >= 0, FALSE);
-  g_return_val_if_fail (error == NULL || *error == NULL, FALSE);
-  g_return_val_if_fail ((match_options & ~G_REGEX_MATCH_MASK) == 0, FALSE);
-
-  regex_lazy_init_match (regex, 0);
-
-  if (string_len < 0)
-    string_len = strlen (string);
-
-  regex->match->string_len = string_len;
-
-  /* create regex->match->offsets if it does not exist */
-  regex_lazy_init_match (regex, 0);
-
-  /* perform the match */
-  regex->match->matches = pcre_exec (regex->pattern->pcre_re,
-                                    REGEX_GET_EXTRA (regex),
-                                    string, regex->match->string_len,
-                                    start_position,
-                                    regex->pattern->match_opts | match_options,
-                                    regex->match->offsets, regex->match->n_offsets);
-  if (IS_PCRE_ERROR (regex->match->matches))
-    {
-      g_set_error (error, G_REGEX_ERROR, G_REGEX_ERROR_MATCH,
-                  _("Error while matching regular expression %s: %s"),
-                  regex->pattern->pattern, match_error (regex->match->matches));
-      return FALSE;
-    }
+  /* we cannot use pcre_get_named_substring() because it allocates the
+   * string using pcre_malloc(). */
+  gint num;
  
-  /* set regex->match->pos to -1 so that a call to g_regex_match_next()
-   * fails without a previous call to g_regex_clear(). */
-  regex->match->pos = -1;
+  g_return_val_if_fail (match_info != NULL, NULL);
+  g_return_val_if_fail (name != NULL, NULL);
  
-  return regex->match->matches >= 0;
+  num = g_regex_get_string_number (match_info->regex, name);
+  if (num == -1)
+    return NULL;
+  else
+    return g_match_info_fetch (match_info, num);
  }
  
  /**
- * g_regex_match_next:
- * @regex: a #GRegex structure
- * @string: the string to scan for matches
- * @match_options: the match options
+ * g_match_info_fetch_named_pos:
+ * @match_info: #GMatchInfo structure
+ * @name: name of the subexpression
+ * @start_pos: pointer to location where to store the start position
+ * @end_pos: pointer to location where to store the end position
   *
- * Scans for the next match in @string of the pattern in @regex.
- * array.  The match options are combined with the match options set when
- * the @regex was created.
+ * Retrieves the position of the capturing parentheses named @name.
   *
- * You have to call g_regex_clear() to reuse the same pattern on a new
- * string.
+ * If @name is a valid sub pattern name but it didn't match anything (e.g.
+ * sub pattern "X", matching "b" against "(?P&lt;X&gt;a)?b") then @start_pos and
+ * @end_pos are set to -1 and %TRUE is returned.
   *
- * Returns: %TRUE is the string matched, %FALSE otherwise
+ * Returns: %TRUE if the position was fetched, %FALSE otherwise. If the
+ *          position cannot be fetched, @start_pos and @end_pos are left
+ *          unchanged.
   *
   * Since: 2.14
   */
  gboolean
-g_regex_match_next (GRegex          *regex, 
-                   const gchar     *string, 
-                   GRegexMatchFlags match_options)
+g_match_info_fetch_named_pos (const GMatchInfo *match_info,
+                             const gchar      *name,
+                             gint             *start_pos,
+                             gint             *end_pos)
  {
-  return g_regex_match_next_full (regex, string, -1, 0,
-                                 match_options, NULL);
+  gint num;
+
+  g_return_val_if_fail (match_info != NULL, FALSE);
+  g_return_val_if_fail (name != NULL, FALSE);
+ 
+  num = g_regex_get_string_number (match_info->regex, name);
+  if (num == -1)
+    return FALSE;
+
+  return g_match_info_fetch_pos (match_info, num, start_pos, end_pos);
  }
  
  /**
- * g_regex_match_next_full:
- * @regex: a #GRegex structure
- * @string: the string to scan for matches
- * @string_len: the length of @string, or -1 if @string is nul-terminated
- * @start_position: starting index of the string to match
- * @match_options: the match options
- * @error: location to store the error occuring, or %NULL to ignore errors
+ * g_match_info_fetch_all:
+ * @match_info: a #GMatchInfo structure
   *
- * Scans for the next match in @string of the pattern in @regex. Calling
- * g_regex_match_next_full() until it returns %FALSE, you can retrieve
- * all the non-overlapping matches of the pattern in @string. Empty matches
- * are included, so matching the string "ab" with the pattern "b*" will
- * find three matches: "" at position 0, "b" from position 1 to 2 and
- * "" at position 2.
+ * Bundles up pointers to each of the matching substrings from a match
+ * and stores them in an array of gchar pointers. The first element in
+ * the returned array is the match number 0, i.e. the entire matched
+ * text.
   *
- * The match options are combined with the match options set when the
- * @regex was created.
+ * If a sub pattern didn't match anything (e.g. sub pattern 1, matching
+ * "b" against "(a)?b") then an empty string is inserted.
   *
- * You have to call g_regex_clear() to reuse the same pattern on a new
- * string.
+ * If the last match was obtained using the DFA algorithm, that is using
+ * g_regex_match_all() or g_regex_match_all_full(), the retrieved
+ * strings are not that matched by sets of parentheses but that of the
+ * matched substring. Substrings are matched in reverse order of length,
+ * so the first one is the longest match.
   *
- * Setting @start_position differs from just passing over a shortened string
- * and  setting #G_REGEX_MATCH_NOTBOL in the case of a pattern that begins
- * with any kind of lookbehind assertion, such as "\b".
+ * The strings are fetched from the string passed to the match function,
+ * so you cannot free it before calling this function.
   *
- * Returns: %TRUE is the string matched, %FALSE otherwise
+ * Returns: a %NULL-terminated array of gchar * pointers. It must be freed
+ *          using g_strfreev(). If the previous match failed %NULL is
+ *          returned.
   *
   * Since: 2.14
   */
-gboolean
-g_regex_match_next_full (GRegex          *regex,
-                        const gchar     *string,
-                        gssize           string_len,
-                        gint             start_position,
-                        GRegexMatchFlags match_options,
-                        GError         **error)
+gchar **
+g_match_info_fetch_all (const GMatchInfo *match_info)
  {
-  g_return_val_if_fail (regex != NULL, FALSE);
-  g_return_val_if_fail (string != NULL, FALSE);
-  g_return_val_if_fail (start_position >= 0, FALSE);
-  g_return_val_if_fail (error == NULL || *error == NULL, FALSE);
-  g_return_val_if_fail ((match_options & ~G_REGEX_MATCH_MASK) == 0, FALSE);
+  /* we cannot use pcre_get_substring_list() because the returned value
+   * isn't suitable for g_strfreev(). */
+  gchar **result;
+  gint i;
  
-  regex_lazy_init_match (regex, 0);
+  g_return_val_if_fail (match_info != NULL, FALSE);
  
-  if (G_UNLIKELY (regex->match->pos < 0))
-    {
-      const gchar *msg = _("g_regex_match_next_full: called without a "
-                           "previous call to g_regex_clear()");
-      g_log (G_LOG_DOMAIN, G_LOG_LEVEL_CRITICAL, msg);
-      g_set_error (error, G_REGEX_ERROR, G_REGEX_ERROR_MATCH, msg);
-      return FALSE;
-    }
+  if (match_info->matches < 0)
+    return NULL;
  
-  /* if this regex hasn't been used on this string before, then we
-   * need to calculate the length of the string, and set pos to the
-   * start of it.  
-   * Knowing if this regex has been used on this string is a bit of
-   * a challenge.  For now, we require the user to call g_regex_clear()
-   * in between usages on a new string.  Not perfect, but not such a
-   * bad solution either.
-   */
-  if (regex->match->string_len == -1)
-    {
-      if (string_len < 0)
-        string_len = strlen (string);
-      regex->match->string_len = string_len;
+  result = g_new (gchar *, match_info->matches + 1);
+  for (i = 0; i < match_info->matches; i++)
+    result[i] = g_match_info_fetch (match_info, i);
+  result[i] = NULL;
  
-      regex->match->pos = start_position;
-    }
+  return result;
+}
  
-  /* create regex->match->offsets if it does not exist */
-  regex_lazy_init_match (regex, 0);
-
-  /* perform the match */
-  regex->match->matches = pcre_exec (regex->pattern->pcre_re,
-                                    REGEX_GET_EXTRA (regex),
-                                    string, regex->match->string_len,
-                                    regex->match->pos,
-                                    regex->pattern->match_opts | match_options,
-                                    regex->match->offsets, regex->match->n_offsets);
-  if (IS_PCRE_ERROR (regex->match->matches))
-    {
-      g_set_error (error, G_REGEX_ERROR, G_REGEX_ERROR_MATCH,
-                  _("Error while matching regular expression %s: %s"),
-                  regex->pattern->pattern, match_error (regex->match->matches));
-      return FALSE;
-    }
  
-  /* avoid infinite loops if regex is an empty string or something
-   * equivalent */
-  if (regex->match->pos == regex->match->offsets[1])
-    {
-      if (regex->match->pos > regex->match->string_len)
-       {
-         /* we have reached the end of the string */
-         regex->match->pos = -1;
-         return FALSE;
-        }
-      regex->match->pos = NEXT_CHAR (regex, &string[regex->match->pos]) - string;
-    }
-  else
-    {
-      regex->match->pos = regex->match->offsets[1];
-    }
+/* GRegex */
+
+GQuark
+g_regex_error_quark (void)
+{
+  static GQuark error_quark = 0;
+
+  if (error_quark == 0)
+    error_quark = g_quark_from_static_string ("g-regex-error-quark");
  
-  return regex->match->matches >= 0;
+  return error_quark;
  }
  
-/**
- * g_regex_match_all:
- * @regex: a #GRegex structure from g_regex_new()
- * @string: the string to scan for matches
- * @match_options: match options
- *
- * Using the standard algorithm for regular expression matching only the
- * longest match in the string is retrieved. This function uses a
- * different algorithm so it can retrieve all the possible matches.
- * For more documentation see g_regex_match_all_full().
- *
- * Returns: %TRUE is the string matched, %FALSE otherwise
- *
- * Since: 2.14
- */
-gboolean
-g_regex_match_all (GRegex          *regex,
-                  const gchar     *string,
-                  GRegexMatchFlags match_options)
+static GRegex *
+regex_ref (GRegex *regex)
  {
-  return g_regex_match_all_full (regex, string, -1, 0,
-                                match_options, NULL);
+  g_atomic_int_inc ((gint*) &regex->ref_count);
+  return regex;
  }
  
-/**
- * g_regex_match_all_full:
- * @regex: a #GRegex structure from g_regex_new()
- * @string: the string to scan for matches
- * @string_len: the length of @string, or -1 if @string is nul-terminated
- * @start_position: starting index of the string to match
- * @match_options: match options
- * @error: location to store the error occuring, or %NULL to ignore errors
- *
- * Using the standard algorithm for regular expression matching only the
- * longest match in the string is retrieved, it is not possibile to obtain
- * all the available matches. For instance matching
- * "&lt;a&gt; &lt;b&gt; &lt;c&gt;" against the pattern "&lt;.*&gt;" you get
- * "&lt;a&gt; &lt;b&gt; &lt;c&gt;".
- *
- * This function uses a different algorithm (called DFA, i.e. deterministic
- * finite automaton), so it can retrieve all the possible matches, all
- * starting at the same point in the string. For instance matching
- * "&lt;a&gt; &lt;b&gt; &lt;c&gt;" against the pattern "&lt;.*&gt;" you
- * would obtain three matches: "&lt;a&gt; &lt;b&gt; &lt;c&gt;",
- * "&lt;a&gt; &lt;b&gt;" and "&lt;a&gt;".
- *
- * The number of matched strings is retrieved using
- * g_regex_get_match_count().
- * To obtain the matched strings and their position you can use,
- * respectively, g_regex_fetch() and g_regex_fetch_pos(). Note that the
- * strings are returned in reverse order of length; that is, the longest
- * matching string is given first.
- *
- * Note that the DFA algorithm is slower than the standard one and it is not
- * able to capture substrings, so backreferences do not work.
- *
- * Setting @start_position differs from just passing over a shortened string
- * and  setting #G_REGEX_MATCH_NOTBOL in the case of a pattern that begins
- * with any kind of lookbehind assertion, such as "\b".
- *
- * Returns: %TRUE is the string matched, %FALSE otherwise
+static void
+regex_unref (GRegex *regex)
+{
+  if (g_atomic_int_exchange_and_add ((gint *) &regex->ref_count, -1) - 1 == 0)
+    {
+      g_free (regex->pattern);
+      if (regex->pcre_re != NULL)
+       pcre_free (regex->pcre_re);
+      if (regex->extra != NULL)
+       pcre_free (regex->extra);
+      g_free (regex);
+    }
+}
+
+/** 
+ * g_regex_new:
+ * @pattern: the regular expression
+ * @compile_options: compile options for the regular expression
+ * @match_options: match options for the regular expression
+ * @error: return location for a #GError
+ * 
+ * Compiles the regular expression to an internal form, and does the initial
+ * setup of the #GRegex structure.  
+ * 
+ * Returns: a #GRegex structure
   *
   * Since: 2.14
   */
-gboolean
-g_regex_match_all_full (GRegex          *regex,
-                       const gchar     *string,
-                       gssize           string_len,
-                       gint             start_position,
-                       GRegexMatchFlags match_options,
-                       GError         **error)
+GRegex *
+g_regex_new (const gchar         *pattern, 
+            GRegexCompileFlags   compile_options,
+            GRegexMatchFlags     match_options,
+            GError             **error)
  {
-  g_return_val_if_fail (regex != NULL, FALSE);
-  g_return_val_if_fail (string != NULL, FALSE);
-  g_return_val_if_fail (start_position >= 0, FALSE);
-  g_return_val_if_fail (error == NULL || *error == NULL, FALSE);
-  g_return_val_if_fail ((match_options & ~G_REGEX_MATCH_MASK) == 0, FALSE);
+  GRegex *regex;
+  pcre *re;
+  const gchar *errmsg;
+  gint erroffset;
+  gboolean optimize = FALSE;
+  static gboolean initialized = FALSE;
+  
+  g_return_val_if_fail (pattern != NULL, NULL);
+  g_return_val_if_fail (error == NULL || *error == NULL, NULL);
+  g_return_val_if_fail ((compile_options & ~G_REGEX_COMPILE_MASK) == 0, NULL);
+  g_return_val_if_fail ((match_options & ~G_REGEX_MATCH_MASK) == 0, NULL);
+
+  if (!initialized)
+    {
+      gint support;
+      const gchar *msg;
+
+      pcre_config (PCRE_CONFIG_UTF8, &support);
+      if (!support)
+       {
+         msg = N_("PCRE library is compiled without UTF8 support");
+         g_critical (msg);
+         g_set_error (error, G_REGEX_ERROR, G_REGEX_ERROR_COMPILE, gettext (msg));
+         return NULL;
+       }
  
-  regex_lazy_init_match (regex, 0);
+      pcre_config (PCRE_CONFIG_UNICODE_PROPERTIES, &support);
+      if (!support)
+       {
+         msg = N_("PCRE library is compiled without UTF8 properties support");
+         g_critical (msg);
+         g_set_error (error, G_REGEX_ERROR, G_REGEX_ERROR_COMPILE, gettext (msg));
+         return NULL;
+       }
  
-  if (string_len < 0)
-    string_len = strlen (string);
+      initialized = TRUE;
+    }
  
-  regex->match->string_len = string_len;
+  /* G_REGEX_OPTIMIZE has the same numeric value of PCRE_NO_UTF8_CHECK,
+   * as we do not need to wrap PCRE_NO_UTF8_CHECK. */
+  if (compile_options & G_REGEX_OPTIMIZE)
+    optimize = TRUE;
  
-  if (regex->match->workspace == NULL)
+  /* In GRegex the string are, by default, UTF-8 encoded. PCRE
+   * instead uses UTF-8 only if required with PCRE_UTF8. */
+  if (compile_options & G_REGEX_RAW)
      {
-      regex->match->n_workspace = WORKSPACE_INITIAL;
-      regex->match->workspace = g_new (gint, regex->match->n_workspace);
+      /* disable utf-8 */
+      compile_options &= ~G_REGEX_RAW;
      }
-
-  if (regex->match->n_offsets < OFFSETS_DFA_MIN_SIZE)
+  else
      {
-      regex->match->n_offsets = OFFSETS_DFA_MIN_SIZE;
-      regex->match->offsets = g_realloc (regex->match->offsets,
-                                        regex->match->n_offsets * sizeof(gint));
+      /* enable utf-8 */
+      compile_options |= PCRE_UTF8 | PCRE_NO_UTF8_CHECK;
+      match_options |= PCRE_NO_UTF8_CHECK;
      }
  
-  /* perform the match */
-  regex->match->matches = pcre_dfa_exec (regex->pattern->pcre_re,
-                                        REGEX_GET_EXTRA (regex), 
-                                        string, regex->match->string_len,
-                                        start_position,
-                                        regex->pattern->match_opts | match_options,
-                                        regex->match->offsets, regex->match->n_offsets,
-                                        regex->match->workspace,
-                                        regex->match->n_workspace);
-  if (regex->match->matches == PCRE_ERROR_DFA_WSSIZE)
+  /* PCRE_NEWLINE_ANY is the default for the internal PCRE but
+   * not for the system one. */
+  if (!(compile_options & G_REGEX_NEWLINE_CR) &&
+      !(compile_options & G_REGEX_NEWLINE_LF))
      {
-      /* regex->match->workspace is too small. */
-      regex->match->n_workspace *= 2;
-      regex->match->workspace = g_realloc (regex->match->workspace,
-                                          regex->match->n_workspace * sizeof (gint));
-      return g_regex_match_all_full (regex, string, string_len,
-                                    start_position, match_options, error);
+      compile_options |= PCRE_NEWLINE_ANY;
      }
-  else if (regex->match->matches == 0)
+
+  /* compile the pattern */
+  re = pcre_compile (pattern, compile_options, &errmsg, &erroffset, NULL);
+
+  /* if the compilation failed, set the error member and return 
+   * immediately */
+  if (re == NULL)
      {
-      /* regex->match->offsets is too small. */
-      regex->match->n_offsets *= 2;
-      regex->match->offsets = g_realloc (regex->match->offsets,
-                                        regex->match->n_offsets * sizeof (gint));
-      return g_regex_match_all_full (regex, string, string_len,
-                                    start_position, match_options, error);
+      GError *tmp_error = g_error_new (G_REGEX_ERROR, 
+                                      G_REGEX_ERROR_COMPILE,
+                                      _("Error while compiling regular "
+                                        "expression %s at char %d: %s"),
+                                      pattern, erroffset, errmsg);
+      g_propagate_error (error, tmp_error);
+
+      return NULL;
      }
-  else if (IS_PCRE_ERROR (regex->match->matches))
+
+  regex = g_new0 (GRegex, 1);
+  regex->ref_count = 1;
+  regex->pattern = g_strdup (pattern);
+  regex->pcre_re = re;
+  regex->compile_opts = compile_options;
+  regex->match_opts = match_options;
+
+  if (optimize)
      {
-      g_set_error (error, G_REGEX_ERROR, G_REGEX_ERROR_MATCH,
-                  _("Error while matching regular expression %s: %s"),
-                  regex->pattern->pattern, match_error (regex->match->matches));
-      return FALSE;
+      regex->extra = pcre_study (regex->pcre_re, 0, &errmsg);
+      if (errmsg != NULL)
+        {
+          GError *tmp_error = g_error_new (G_REGEX_ERROR,
+                                           G_REGEX_ERROR_OPTIMIZE, 
+                                           _("Error while optimizing "
+                                             "regular expression %s: %s"),
+                                           regex->pattern,
+                                           errmsg);
+          g_propagate_error (error, tmp_error);
+          return NULL;
+       }
      }
  
-  /* set regex->match->pos to -1 so that a call to g_regex_match_next()
-   * fails without a previous call to g_regex_clear(). */
-  regex->match->pos = -1;
-
-  return regex->match->matches >= 0;
+  return regex;
  }
  
  /**
- * g_regex_get_match_count:
- * @regex: a #GRegex structure
- *
- * Retrieves the number of matched substrings (including substring 0, that
- * is the whole matched text) in the last call to g_regex_match*(), so 1
- * is returned if the pattern has no substrings in it and 0 is returned if
- * the match failed.
- *
- * If the last match was obtained using the DFA algorithm, that is using
- * g_regex_match_all() or g_regex_match_all_full(), the retrieved
- * count is not that of the number of capturing parentheses but that of
- * the number of matched substrings.
+ * g_regex_free:
+ * @regex: a #GRegex
   *
- * Returns:  Number of matched substrings, or -1 if an error occurred
+ * Frees all the memory associated with the regex structure.
   *
   * Since: 2.14
   */
-gint
-g_regex_get_match_count (const GRegex *regex)
+void
+g_regex_free (GRegex *regex)
  {
-  g_return_val_if_fail (regex != NULL, -1);
-
-  if (regex->match == NULL)
-    return -1;
+  if (regex == NULL)
+    return;
  
-  if (regex->match->matches == PCRE_ERROR_NOMATCH)
-    /* no match */
-    return 0;
-  else if (regex->match->matches < PCRE_ERROR_NOMATCH)
-    /* error */
-    return -1;
-  else
-    /* match */
-    return regex->match->matches;
+  regex_unref (regex);
  }
  
  /**
- * g_regex_is_partial_match:
+ * g_regex_get_pattern:
   * @regex: a #GRegex structure
   *
- * Usually if the string passed to g_regex_match*() matches as far as
- * it goes, but is too short to match the entire pattern, %FALSE is
- * returned. There are circumstances where it might be helpful to
- * distinguish this case from other cases in which there is no match.
- *
- * Consider, for example, an application where a human is required to
- * type in data for a field with specific formatting requirements. An
- * example might be a date in the form ddmmmyy, defined by the pattern
- * "^\d?\d(jan|feb|mar|apr|may|jun|jul|aug|sep|oct|nov|dec)\d\d$".
- * If the application sees the user’s keystrokes one by one, and can
- * check that what has been typed so far is potentially valid, it is
- * able to raise an error as soon as a mistake is made.
- *
- * GRegex supports the concept of partial matching by means of the
- * #G_REGEX_MATCH_PARTIAL flag. When this is set the return code for
- * g_regex_match() or g_regex_match_full() is, as usual, %TRUE
- * for a complete match, %FALSE otherwise. But, when this functions
- * returns %FALSE, you can check if the match was partial calling
- * g_regex_is_partial_match().
- *
- * When using partial matching you cannot use g_regex_fetch*().
- *
- * Because of the way certain internal optimizations are implemented the
- * partial matching algorithm cannot be used with all patterns. So repeated
- * single characters such as "a{2,4}" and repeated single metasequences such
- * as "\d+" are not permitted if the maximum number of occurrences is
- * greater than one. Optional items such as "\d?" (where the maximum is one)
- * are permitted. Quantifiers with any values are permitted after
- * parentheses, so the invalid examples above can be coded thus "(a){2,4}"
- * and "(\d)+". If #G_REGEX_MATCH_PARTIAL is set for a pattern that does
- * not conform to the restrictions, matching functions return an error.
+ * Gets the pattern string associated with @regex, i.e. a copy of 
+ * the string passed to g_regex_new().
   *
- * Returns: %TRUE if the match was partial, %FALSE otherwise
+ * Returns: the pattern of @regex
   *
   * Since: 2.14
   */
-gboolean
-g_regex_is_partial_match (const GRegex *regex)
+const gchar *
+g_regex_get_pattern (const GRegex *regex)
  {
-  g_return_val_if_fail (regex != NULL, FALSE);
-
-  if (regex->match == NULL)
-    return FALSE;
+  g_return_val_if_fail (regex != NULL, NULL);
  
-  return regex->match->matches == PCRE_ERROR_PARTIAL;
+  return regex->pattern;
  }
  
  /**
- * g_regex_fetch:
- * @regex: #GRegex structure used in last match
- * @match_num: number of the sub expression
- * @string: the string on which the last match was made
+ * g_regex_match_simple:
+ * @pattern: the regular expression
+ * @string: the string to scan for matches
+ * @compile_options: compile options for the regular expression
+ * @match_options: match options
   *
- * Retrieves the text matching the @match_num<!-- -->'th capturing parentheses.
- * 0 is the full text of the match, 1 is the first paren set, 2 the second,
- * and so on.
+ * Scans for a match in @string for @pattern.
   *
- * If @match_num is a valid sub pattern but it didn't match anything (e.g.
- * sub pattern 1, matching "b" against "(a)?b") then an empty string is
- * returned.
+ * This function is equivalent to g_regex_match() but it does not
+ * require to compile the pattern with g_regex_new(), avoiding some
+ * lines of code when you need just to do a match without extracting
+ * substrings, capture counts, and so on.
   *
- * If the last match was obtained using the DFA algorithm, that is using
- * g_regex_match_all() or g_regex_match_all_full(), the retrieved
- * string is not that of a set of parentheses but that of a matched
- * substring. Substrings are matched in reverse order of length, so 0 is
- * the longest match.
+ * If this function is to be called on the same @pattern more than
+ * once, it's more efficient to compile the pattern once with
+ * g_regex_new() and then use g_regex_match().
   *
- * Returns: The matched substring, or %NULL if an error occurred.
- *          You have to free the string yourself.
+ * Returns: %TRUE is the string matched, %FALSE otherwise
   *
   * Since: 2.14
   */
-gchar *
-g_regex_fetch (const GRegex *regex,
-              gint          match_num,
-              const gchar  *string)
+gboolean
+g_regex_match_simple (const gchar        *pattern, 
+                     const gchar        *string, 
+                     GRegexCompileFlags  compile_options,
+                     GRegexMatchFlags    match_options)
  {
-  /* we cannot use pcre_get_substring() because it allocates the
-   * string using pcre_malloc(). */
-  gchar *match = NULL;
-  gint start, end;
-
-  g_return_val_if_fail (regex != NULL, NULL);
-  g_return_val_if_fail (match_num >= 0, NULL);
-
-  if (regex->match == NULL)
-    return NULL;
-
-  if (regex->match->string_len < 0)
-    return NULL;
-
-  /* match_num does not exist or it didn't matched, i.e. matching "b"
-   * against "(a)?b" then group 0 is empty. */
-  if (!g_regex_fetch_pos (regex, match_num, &start, &end))
-    match = NULL;
-  else if (start == -1)
-    match = g_strdup ("");
-  else
-    match = g_strndup (&string[start], end - start);
+  GRegex *regex;
+  gboolean result;
  
-  return match;
+  regex = g_regex_new (pattern, compile_options, 0, NULL);
+  if (!regex)
+    return FALSE;
+  result = g_regex_match_full (regex, string, -1, 0, match_options, NULL, NULL);
+  g_regex_free (regex);
+  return result;
  }
  
  /**
- * g_regex_fetch_pos:
- * @regex: #GRegex structure used in last match
- * @match_num: number of the sub expression
- * @start_pos: pointer to location where to store the start position
- * @end_pos: pointer to location where to store the end position
- *
- * Retrieves the position of the @match_num<!-- -->'th capturing parentheses.
- * 0 is the full text of the match, 1 is the first paren set, 2 the second,
- * and so on.
+ * g_regex_match:
+ * @regex: a #GRegex structure from g_regex_new()
+ * @string: the string to scan for matches
+ * @match_options: match options
+ * @match_info: pointer to location where to store the #GMatchInfo, or
+ * %NULL if you do not nedd it
   *
- * If @match_num is a valid sub pattern but it didn't match anything (e.g.
- * sub pattern 1, matching "b" against "(a)?b") then @start_pos and @end_pos
- * are set to -1 and %TRUE is returned.
+ * Scans for a match in string for the pattern in @regex. The @match_options
+ * are combined with the match options specified when the @regex structure
+ * was created, letting you have more flexibility in reusing #GRegex
+ * structures.
   *
- * If the last match was obtained using the DFA algorithm, that is using
- * g_regex_match_all() or g_regex_match_all_full(), the retrieved
- * position is not that of a set of parentheses but that of a matched
- * substring. Substrings are matched in reverse order of length, so 0 is
- * the longest match.
+ * A #GMatchInfo structure, used to get information on the match, is stored
+ * in @match_info if not %NULL.
+ *
+ * To retrieve all the non-overlapping matches of the pattern in string you
+ * can use g_match_info_next().
+ *
+ * <informalexample><programlisting>
+ * static void
+ * print_uppercase_words (const gchar *string)
+ * {
+ *   /&ast; Print all uppercase-only words. &ast;/
+ *   GRegex *regex;
+ *   GMatchInfo *match_info;
+ *   &nbsp;
+ *   regex = g_regex_new ("[A-Z]+", 0, 0, NULL);
+ *   g_regex_match (regex, string, 0, &match_info);
+ *   while (g_match_info_matches (match_info))
+ *     {
+ *       gchar *word = g_match_info_fetch (match_info, 0);
+ *       g_print ("Found: %s\n", word);
+ *       g_free (word);
+ *       g_match_info_next (match_info, NULL);
+ *     }
+ *   g_match_info_free (match_info);
+ *   g_regex_free (regex);
+ * }
+ * </programlisting></informalexample>
   *
- * Returns: %TRUE if the position was fetched, %FALSE otherwise. If the
- *          position cannot be fetched, @start_pos and @end_pos are left
- *          unchanged.
+ * Returns: %TRUE is the string matched, %FALSE otherwise
   *
   * Since: 2.14
   */
  gboolean
-g_regex_fetch_pos (const GRegex *regex,
-                  gint          match_num,
-                  gint         *start_pos,
-                  gint         *end_pos)
+g_regex_match (const GRegex    *regex, 
+              const gchar     *string, 
+              GRegexMatchFlags match_options,
+              GMatchInfo     **match_info)
  {
-  g_return_val_if_fail (regex != NULL, FALSE);
-  g_return_val_if_fail (match_num >= 0, FALSE);
- 
-  if (regex->match == NULL)
-    return FALSE;
-
-  /* make sure the sub expression number they're requesting is less than
-   * the total number of sub expressions that were matched. */
-  if (match_num >= regex->match->matches)
-    return FALSE;
-
-  if (start_pos != NULL)
-    *start_pos = regex->match->offsets[2 * match_num];
-
-  if (end_pos != NULL)
-    *end_pos = regex->match->offsets[2 * match_num + 1];
-
-  return TRUE;
+  return g_regex_match_full (regex, string, -1, 0, match_options,
+                            match_info, NULL);
  }
  
  /**
- * g_regex_fetch_named:
- * @regex: #GRegex structure used in last match
- * @name: name of the subexpression
- * @string: the string on which the last match was made
+ * g_regex_match_full:
+ * @regex: a #GRegex structure from g_regex_new()
+ * @string: the string to scan for matches
+ * @string_len: the length of @string, or -1 if @string is nul-terminated
+ * @start_position: starting index of the string to match
+ * @match_options: match options
+ * @match_info: pointer to location where to store the #GMatchInfo, or
+ * %NULL if you do not nedd it
+ * @error: location to store the error occuring, or %NULL to ignore errors
   *
- * Retrieves the text matching the capturing parentheses named @name.
+ * Scans for a match in string for the pattern in @regex. The @match_options
+ * are combined with the match options specified when the @regex structure
+ * was created, letting you have more flexibility in reusing #GRegex
+ * structures.
   *
- * If @name is a valid sub pattern name but it didn't match anything (e.g.
- * sub pattern "X", matching "b" against "(?P&lt;X&gt;a)?b") then an empty
- * string is returned.
+ * Setting @start_position differs from just passing over a shortened string
+ * and  setting #G_REGEX_MATCH_NOTBOL in the case of a pattern that begins
+ * with any kind of lookbehind assertion, such as "\b".
   *
- * Returns: The matched substring, or %NULL if an error occurred.
- *          You have to free the string yourself.
+ * A #GMatchInfo structure, used to get information on the match, is stored
+ * in @match_info if not %NULL.
+ *
+ * To retrieve all the non-overlapping matches of the pattern in string you
+ * can use g_match_info_next().
+ *
+ * <informalexample><programlisting>
+ * static void
+ * print_uppercase_words (const gchar *string)
+ * {
+ *   /&ast; Print all uppercase-only words. &ast;/
+ *   GRegex *regex;
+ *   GMatchInfo *match_info;
+ *   GError *error = NULL;
+ *   &nbsp;
+ *   regex = g_regex_new ("[A-Z]+", 0, 0, NULL);
+ *   g_regex_match_full (regex, string, -1, 0, 0, &match_info, &error);
+ *   while (g_match_info_matches (match_info))
+ *     {
+ *       gchar *word = g_match_info_fetch (match_info, 0);
+ *       g_print ("Found: %s\n", word);
+ *       g_free (word);
+ *       g_match_info_next (match_info, &error);
+ *     }
+ *   g_match_info_free (match_info);
+ *   g_regex_free (regex);
+ *   if (error != NULL)
+ *     {
+ *       g_printerr ("Error while matching: %s\n", error->message);
+ *       g_error_free (error);
+ *     }
+ * }
+ * </programlisting></informalexample>
+ *
+ * Returns: %TRUE is the string matched, %FALSE otherwise
   *
   * Since: 2.14
   */
-gchar *
-g_regex_fetch_named (const GRegex *regex,
-                    const gchar  *name,
-                    const gchar  *string)
+gboolean
+g_regex_match_full (const GRegex    *regex,
+                   const gchar     *string,
+                   gssize           string_len,
+                   gint             start_position,
+                   GRegexMatchFlags match_options,
+                   GMatchInfo     **match_info,
+                   GError         **error)
  {
-  /* we cannot use pcre_get_named_substring() because it allocates the
-   * string using pcre_malloc(). */
-  gint num;
+  GMatchInfo *info;
+  gboolean match_ok;
  
-  g_return_val_if_fail (regex != NULL, NULL);
-  g_return_val_if_fail (string != NULL, NULL);
-  g_return_val_if_fail (name != NULL, NULL);
+  g_return_val_if_fail (regex != NULL, FALSE);
+  g_return_val_if_fail (string != NULL, FALSE);
+  g_return_val_if_fail (start_position >= 0, FALSE);
+  g_return_val_if_fail (error == NULL || *error == NULL, FALSE);
+  g_return_val_if_fail ((match_options & ~G_REGEX_MATCH_MASK) == 0, FALSE);
  
-  num = g_regex_get_string_number (regex, name);
-  if (num == -1)
-    return NULL;
+  info = match_info_new (regex, string, string_len, start_position,
+                        match_options, FALSE);
+  match_ok = g_match_info_next (info, error);
+  if (match_info != NULL)
+    *match_info = info;
    else
-    return g_regex_fetch (regex, num, string);
+    g_match_info_free (info);
+
+  return match_ok;
  }
  
  /**
- * g_regex_fetch_named_pos:
- * @regex: #GRegex structure used in last match
- * @name: name of the subexpression
- * @start_pos: pointer to location where to store the start position
- * @end_pos: pointer to location where to store the end position
+ * g_regex_match_all:
+ * @regex: a #GRegex structure from g_regex_new()
+ * @string: the string to scan for matches
+ * @match_options: match options
+ * @match_info: pointer to location where to store the #GMatchInfo, or
+ * %NULL if you do not nedd it
   *
- * Retrieves the position of the capturing parentheses named @name.
+ * Using the standard algorithm for regular expression matching only the
+ * longest match in the string is retrieved. This function uses a
+ * different algorithm so it can retrieve all the possible matches.
+ * For more documentation see g_regex_match_all_full().
   *
- * If @name is a valid sub pattern name but it didn't match anything (e.g.
- * sub pattern "X", matching "b" against "(?P&lt;X&gt;a)?b") then @start_pos and
- * @end_pos are set to -1 and %TRUE is returned.
+ * A #GMatchInfo structure, used to get information on the match, is stored
+ * in @match_info if not %NULL.
   *
- * Returns: %TRUE if the position was fetched, %FALSE otherwise. If the
- *          position cannot be fetched, @start_pos and @end_pos are left
- *          unchanged.
+ * Returns: %TRUE is the string matched, %FALSE otherwise
   *
   * Since: 2.14
   */
  gboolean
-g_regex_fetch_named_pos (const GRegex *regex,
-                        const gchar  *name,
-                        gint         *start_pos,
-                        gint         *end_pos)
+g_regex_match_all (const GRegex    *regex,
+                  const gchar     *string,
+                  GRegexMatchFlags match_options,
+                  GMatchInfo     **match_info)
  {
-  gint num;
-
-  num = g_regex_get_string_number (regex, name);
-  if (num == -1)
-    return FALSE;
-
-  return g_regex_fetch_pos (regex, num, start_pos, end_pos);
+  return g_regex_match_all_full (regex, string, -1, 0, match_options,
+                                match_info, NULL);
  }
  
  /**
- * g_regex_fetch_all:
- * @regex: a #GRegex structure
- * @string: the string on which the last match was made
+ * g_regex_match_all_full:
+ * @regex: a #GRegex structure from g_regex_new()
+ * @string: the string to scan for matches
+ * @string_len: the length of @string, or -1 if @string is nul-terminated
+ * @start_position: starting index of the string to match
+ * @match_options: match options
+ * @match_info: pointer to location where to store the #GMatchInfo, or
+ * %NULL if you do not nedd it
+ * @error: location to store the error occuring, or %NULL to ignore errors
   *
- * Bundles up pointers to each of the matching substrings from a match
- * and stores them in an array of gchar pointers. The first element in
- * the returned array is the match number 0, i.e. the entire matched
- * text.
+ * Using the standard algorithm for regular expression matching only the
+ * longest match in the string is retrieved, it is not possibile to obtain
+ * all the available matches. For instance matching
+ * "&lt;a&gt; &lt;b&gt; &lt;c&gt;" against the pattern "&lt;.*&gt;" you get
+ * "&lt;a&gt; &lt;b&gt; &lt;c&gt;".
   *
- * If a sub pattern didn't match anything (e.g. sub pattern 1, matching
- * "b" against "(a)?b") then an empty string is inserted.
+ * This function uses a different algorithm (called DFA, i.e. deterministic
+ * finite automaton), so it can retrieve all the possible matches, all
+ * starting at the same point in the string. For instance matching
+ * "&lt;a&gt; &lt;b&gt; &lt;c&gt;" against the pattern "&lt;.*&gt;" you
+ * would obtain three matches: "&lt;a&gt; &lt;b&gt; &lt;c&gt;",
+ * "&lt;a&gt; &lt;b&gt;" and "&lt;a&gt;".
   *
- * If the last match was obtained using the DFA algorithm, that is using
- * g_regex_match_all() or g_regex_match_all_full(), the retrieved
- * strings are not that matched by sets of parentheses but that of the
- * matched substring. Substrings are matched in reverse order of length,
- * so the first one is the longest match.
+ * The number of matched strings is retrieved using
+ * g_match_info_get_match_count().
+ * To obtain the matched strings and their position you can use,
+ * respectively, g_match_info_fetch() and g_match_info_fetch_pos(). Note that
+ * the strings are returned in reverse order of length; that is, the longest
+ * matching string is given first.
   *
- * Returns: a %NULL-terminated array of gchar * pointers. It must be freed
- *          using g_strfreev(). If the memory can't be allocated, returns
- *          %NULL.
+ * Note that the DFA algorithm is slower than the standard one and it is not
+ * able to capture substrings, so backreferences do not work.
+ *
+ * Setting @start_position differs from just passing over a shortened string
+ * and  setting #G_REGEX_MATCH_NOTBOL in the case of a pattern that begins
+ * with any kind of lookbehind assertion, such as "\b".
+ *
+ * A #GMatchInfo structure, used to get information on the match, is stored
+ * in @match_info if not %NULL.
+ *
+ * Returns: %TRUE is the string matched, %FALSE otherwise
   *
   * Since: 2.14
   */
-gchar **
-g_regex_fetch_all (const GRegex *regex,
-                  const gchar  *string)
+gboolean
+g_regex_match_all_full (const GRegex    *regex,
+                       const gchar     *string,
+                       gssize           string_len,
+                       gint             start_position,
+                       GRegexMatchFlags match_options,
+                       GMatchInfo     **match_info,
+                       GError         **error)
  {
-  /* we cannot use pcre_get_substring_list() because the returned value
-   * isn't suitable for g_strfreev(). */
-  gchar **result;
-  gint i;
+  GMatchInfo *info;
+  gboolean done;
  
    g_return_val_if_fail (regex != NULL, FALSE);
    g_return_val_if_fail (string != NULL, FALSE);
+  g_return_val_if_fail (start_position >= 0, FALSE);
+  g_return_val_if_fail (error == NULL || *error == NULL, FALSE);
+  g_return_val_if_fail ((match_options & ~G_REGEX_MATCH_MASK) == 0, FALSE);
  
-  if (regex->match == NULL)
-    return NULL;
+  info = match_info_new (regex, string, string_len, start_position,
+                        match_options, TRUE);
  
-  if (regex->match->matches < 0)
-    return NULL;
+  done = FALSE;
+  while (!done)
+    {
+      done = TRUE;
+      info->matches = pcre_dfa_exec (regex->pcre_re, regex->extra,
+                                    info->string, info->string_len,
+                                    info->pos,
+                                    regex->match_opts | match_options,
+                                    info->offsets, info->n_offsets,
+                                    info->workspace, info->n_workspace);
+      if (info->matches == PCRE_ERROR_DFA_WSSIZE)
+       {
+         /* info->workspace is too small. */
+         info->n_workspace *= 2;
+         info->workspace = g_realloc (info->workspace,
+                                      info->n_workspace * sizeof (gint));
+         done = FALSE;
+       }
+      else if (info->matches == 0)
+       {
+         /* info->offsets is too small. */
+         info->n_offsets *= 2;
+         info->offsets = g_realloc (info->offsets,
+                                    info->n_offsets * sizeof (gint));
+         done = FALSE;
+       }
+      else if (IS_PCRE_ERROR (info->matches))
+       {
+         g_set_error (error, G_REGEX_ERROR, G_REGEX_ERROR_MATCH,
+                      _("Error while matching regular expression %s: %s"),
+                      regex->pattern, match_error (info->matches));
+       }
+    }
  
-  result = g_new (gchar *, regex->match->matches + 1);
-  for (i = 0; i < regex->match->matches; i++)
-    result[i] = g_regex_fetch (regex, i, string);
-  result[i] = NULL;
+  /* set info->pos to -1 so that a call to g_match_info_next() fails. */
+  info->pos = -1;
  
-  return result;
+  if (match_info != NULL)
+    *match_info = info;
+  else
+    g_match_info_free (info);
+
+  return info->matches >= 0;
  }
  
  /**
@@ -1244,7 +1202,7 @@ g_regex_fetch_all (const GRegex *regex,
   *
   * Retrieves the number of the subexpression named @name.
   *
- * Returns: The number of the subexpression or -1 if @name does not exists.
+ * Returns: The number of the subexpression or -1 if @name does not exists
   *
   * Since: 2.14
   */
@@ -1257,7 +1215,7 @@ g_regex_get_string_number (const GRegex *regex,
    g_return_val_if_fail (regex != NULL, -1);
    g_return_val_if_fail (name != NULL, -1);
  
-  num = pcre_get_stringnumber (regex->pattern->pcre_re, name);
+  num = pcre_get_stringnumber (regex->pcre_re, name);
    if (num == PCRE_ERROR_NOSUBSTRING)
      num = -1;
  
@@ -1298,7 +1256,7 @@ g_regex_get_string_number (const GRegex *regex,
   * For example splitting "ab c" using as a separator "\s*", you will get
   * "a", "b" and "c".
   *
- * Returns: a %NULL-terminated gchar ** array. Free it using g_strfreev().
+ * Returns: a %NULL-terminated gchar ** array. Free it using g_strfreev()
   *
   * Since: 2.14
   **/
@@ -1343,12 +1301,12 @@ g_regex_split_simple (const gchar        *pattern,
   * For example splitting "ab c" using as a separator "\s*", you will get
   * "a", "b" and "c".
   *
- * Returns: a %NULL-terminated gchar ** array. Free it using g_strfreev().
+ * Returns: a %NULL-terminated gchar ** array. Free it using g_strfreev()
   *
   * Since: 2.14
   **/
  gchar **
-g_regex_split (GRegex           *regex, 
+g_regex_split (const GRegex     *regex, 
                const gchar      *string, 
                GRegexMatchFlags  match_options)
  {
@@ -1364,7 +1322,7 @@ g_regex_split (GRegex           *regex,
   * @start_position: starting index of the string to match
   * @match_options: match time option flags
   * @max_tokens: the maximum number of tokens to split @string into. If this
- *    is less than 1, the string is split completely.
+ *    is less than 1, the string is split completely
   * @error: return location for a #GError
   *
   * Breaks the string on the pattern, and returns an array of the tokens.
@@ -1389,12 +1347,12 @@ g_regex_split (GRegex           *regex,
   * and  setting #G_REGEX_MATCH_NOTBOL in the case of a pattern that begins
   * with any kind of lookbehind assertion, such as "\b".
   *
- * Returns: a %NULL-terminated gchar ** array. Free it using g_strfreev().
+ * Returns: a %NULL-terminated gchar ** array. Free it using g_strfreev()
   *
   * Since: 2.14
   **/
  gchar **
-g_regex_split_full (GRegex           *regex, 
+g_regex_split_full (const GRegex     *regex, 
                     const gchar      *string, 
                     gssize            string_len,
                     gint              start_position,
@@ -1402,11 +1360,18 @@ g_regex_split_full (GRegex           *regex,
                     gint              max_tokens,
                     GError          **error)
  {
-  gchar **string_list;         /* The array of char **s worked on */
-  gint pos;
-  gint tokens;
-  GList *list, *last;
    GError *tmp_error = NULL;
+  GMatchInfo *match_info;
+  GList *list, *last;
+  gint i;
+  gint token_count;
+  gboolean match_ok;
+  /* position of the last separator. */
+  gint last_separator_end;
+  /* was the last match 0 bytes long? */
+  gboolean last_match_is_empty;
+  /* the returned array of char **s */
+  gchar **string_list;
  
    g_return_val_if_fail (regex != NULL, NULL);
    g_return_val_if_fail (string != NULL, NULL);
@@ -1414,254 +1379,127 @@ g_regex_split_full (GRegex           *regex,
    g_return_val_if_fail (error == NULL || *error == NULL, NULL);
    g_return_val_if_fail ((match_options & ~G_REGEX_MATCH_MASK) == 0, NULL);
  
-  regex_lazy_init_match (regex, 0);
-
    if (max_tokens <= 0)
      max_tokens = G_MAXINT;
  
    if (string_len < 0)
      string_len = strlen (string);
  
+  /* zero-length string */
    if (string_len - start_position == 0)
      return g_new0 (gchar *, 1);
  
-  /* clear out the regex for reuse, just in case */
-  g_regex_clear (regex);
+  if (max_tokens == 1)
+    {
+      string_list = g_new0 (gchar *, 2);
+      string_list[0] = g_strndup (&string[start_position],
+                                 string_len - start_position);
+      return string_list;
+    }
  
    list = NULL;
-  tokens = 0;
-  while (TRUE)
+  token_count = 0;
+  last_separator_end = start_position;
+  last_match_is_empty = FALSE;
+
+  match_ok = g_regex_match_full (regex, string, string_len, start_position,
+                                match_options, &match_info, &tmp_error);
+  while (tmp_error == NULL)
      {
-      gchar *token;
+      if (match_ok)
+        {
+          last_match_is_empty =
+                    (match_info->offsets[0] == match_info->offsets[1]);
+
+          /* we need to skip empty separators at the same position of the end
+           * of another separator. e.g. the string is "a b" and the separator
+           * is " *", so from 1 to 2 we have a match and at position 2 we have
+           * an empty match. */
+          if (last_separator_end != match_info->offsets[1])
+            {
+              gchar *token;
+              gint match_count;
+
+              token = g_strndup (string + last_separator_end,
+                                match_info->offsets[0] - last_separator_end);
+              list = g_list_prepend (list, token);
+              token_count++;
+
+              /* if there were substrings, these need to be added to
+               * the list. */
+              match_count = g_match_info_get_match_count (match_info);
+              if (match_count > 1)
+                {
+                  for (i = 1; i < match_count; i++)
+                    list = g_list_prepend (list, g_match_info_fetch (match_info, i));
+                }
+            }
+        }
+      else
+        {
+          /* if there was no match, copy to end of string. */
+          if (!last_match_is_empty)
+            {
+              gchar *token = g_strndup (string + last_separator_end,
+                                       match_info->string_len - last_separator_end);
+              list = g_list_prepend (list, token);
+            }
+          /* no more tokens, end the loop. */
+          break;
+        }
  
        /* -1 to leave room for the last part. */
-      if (tokens >= max_tokens - 1)
+      if (token_count >= max_tokens - 1)
         {
           /* we have reached the maximum number of tokens, so we copy
            * the remaining part of the string. */
-         if (regex->match->last_match_is_empty)
+         if (last_match_is_empty)
             {
               /* the last match was empty, so we have moved one char
                * after the real position to avoid empty matches at the
                * same position. */
-             regex->match->pos = PREV_CHAR (regex, &string[regex->match->pos]) - string;
+             match_info->pos = PREV_CHAR (regex, &string[match_info->pos]) - string;
             }
           /* the if is needed in the case we have terminated the available
            * tokens, but we are at the end of the string, so there are no
            * characters left to copy. */
-         if (string_len > regex->match->pos)
+         if (string_len > match_info->pos)
             {
-             token = g_strndup (string + regex->match->pos,
-                                string_len - regex->match->pos);
+             gchar *token = g_strndup (string + match_info->pos,
+                                       string_len - match_info->pos);
               list = g_list_prepend (list, token);
             }
           /* end the loop. */
           break;
         }
  
-      token = g_regex_split_next_full (regex, string, string_len, start_position,
-                                       match_options, &tmp_error);
-      if (tmp_error != NULL)
-       {
-         g_propagate_error (error, tmp_error);
-         g_list_foreach (list, (GFunc)g_free, NULL);
-         g_list_free (list);
-         regex->match->pos = -1;
-         return NULL;
-       }
-
-      if (token == NULL)
-       /* no more tokens. */
-       break;
-
-      tokens++;
-      list = g_list_prepend (list, token);
-    }
-
-  string_list = g_new (gchar *, g_list_length (list) + 1);
-  pos = 0;
-  for (last = g_list_last (list); last; last = g_list_previous (last))
-    string_list[pos++] = last->data;
-  string_list[pos] = 0;
-
-  regex->match->pos = -1;
-  g_list_free (list);
-
-  return string_list;
-}
-
-/**
- * g_regex_split_next:
- * @regex: a #GRegex structure from g_regex_new()
- * @string: the string to split on pattern
- * @match_options: match time options for the regex
- *
- * g_regex_split_next() breaks the string on pattern, and returns the
- * tokens, one per call.  If the pattern contains capturing parentheses,
- * then the text for each of the substrings will also be returned.
- * If the pattern does not match anywhere in the string, then the whole
- * string is returned as the first token.
- *
- * A pattern that can match empty strings splits @string into separate
- * characters wherever it matches the empty string between characters.
- * For example splitting "ab c" using as a separator "\s*", you will get
- * "a", "b" and "c".
- *
- * You have to call g_regex_clear() to reuse the same pattern on a new
- * string.
- *
- * Returns:  a gchar * to the next token of the string
- *
- * Since: 2.14
- */
-gchar *
-g_regex_split_next (GRegex          *regex,
-                   const gchar     *string,
-                   GRegexMatchFlags match_options)
-{
-  return g_regex_split_next_full (regex, string, -1, 0, match_options,
-                                  NULL);
-}
-
-/**
- * g_regex_split_next_full:
- * @regex: a #GRegex structure from g_regex_new()
- * @string: the string to split on pattern
- * @string_len: the length of @string, or -1 if @string is nul-terminated
- * @start_position: starting index of the string to match
- * @match_options: match time options for the regex
- * @error: return location for a #GError
- *
- * g_regex_split_next_full() breaks the string on pattern, and returns
- * the tokens, one per call.  If the pattern contains capturing parentheses,
- * then the text for each of the substrings will also be returned.
- * If the pattern does not match anywhere in the string, then the whole
- * string is returned as the first token.
- *
- * A pattern that can match empty strings splits @string into separate
- * characters wherever it matches the empty string between characters.
- * For example splitting "ab c" using as a separator "\s*", you will get
- * "a", "b" and "c".
- *
- * You have to call g_regex_clear() to reuse the same pattern on a new
- * string.
- *
- * Setting @start_position differs from just passing over a shortened string
- * and  setting #G_REGEX_MATCH_NOTBOL in the case of a pattern that begins
- * with any kind of lookbehind assertion, such as "\b".
- *
- * Returns:  a gchar * to the next token of the string
- *
- * Since: 2.14
- */
-gchar *
-g_regex_split_next_full (GRegex          *regex,
-                        const gchar     *string,
-                        gssize           string_len,
-                        gint             start_position,
-                        GRegexMatchFlags match_options,
-                        GError         **error)
-{
-  gint new_pos;
-  gchar *token = NULL;
-  gboolean match_ok;
-  gint match_count;
-  GError *tmp_error = NULL;
-
-  g_return_val_if_fail (regex != NULL, NULL);
-  g_return_val_if_fail (string != NULL, NULL);
-  g_return_val_if_fail (error == NULL || *error == NULL, NULL);
-  g_return_val_if_fail ((match_options & ~G_REGEX_MATCH_MASK) == 0, NULL);
-
-  regex_lazy_init_match (regex, 0);
-
-  new_pos = MAX (regex->match->pos, start_position);
-  if (regex->match->last_match_is_empty)
-    /* if the last match was empty, g_regex_match_next_full() has moved
-     * forward to avoid infinite loops, but we still need to copy that
-     * character. */
-    new_pos = PREV_CHAR (regex, &string[new_pos]) - string;
+      last_separator_end = match_info->pos;
+      if (last_match_is_empty)
+        /* if the last match was empty, g_match_info_next() has moved
+         * forward to avoid infinite loops, but we still need to copy that
+         * character. */
+        last_separator_end = PREV_CHAR (regex, &string[last_separator_end]) - string;
  
-  /* if there are delimiter substrings stored, return those one at a
-   * time.  
-   */
-  if (regex->match->delims != NULL)
-    {
-      token = regex->match->delims->data;
-      regex->match->delims = g_slist_remove (regex->match->delims, token);
-      return token;
-    }
-
-  if (regex->match->pos == -1)
-    /* the last call to g_regex_match_next_full() returned NULL. */
-    return NULL;
-
-  if (regex->match->string_len < 0)
-    {
-      regex->match->last_match_is_empty = FALSE;
-      /* initialize last_separator_end to start_position to skip the
-       * empty token at the beginning of the string. */
-      regex->match->last_separator_end = start_position;
+      match_ok = g_match_info_next (match_info, &tmp_error);
      }
-
-  /* use g_regex_match_next() to find the next occurance of the pattern
-   * in the string. We use new_pos to keep track of where the stuff
-   * up to the current match starts. Copy that token of the string off
-   * and append it to the buffer using g_strndup. */
-  match_ok = g_regex_match_next_full (regex, string, string_len,
-                                      start_position, match_options,
-                                      &tmp_error);
+  g_match_info_free (match_info);
    if (tmp_error != NULL)
      {
        g_propagate_error (error, tmp_error);
+      g_list_foreach (list, (GFunc)g_free, NULL);
+      g_list_free (list);
+      match_info->pos = -1;
        return NULL;
      }
  
-  if (match_ok)
-    {
-      regex->match->last_match_is_empty =
-               (regex->match->offsets[0] == regex->match->offsets[1]);
-
-      /* we need to skip empty separators at the same position of the end
-       * of another separator. e.g. the string is "a b" and the separator
-       * is "*", so from 1 to 2 we have a match and at position 2 we have
-       * an empty match. */
-      if (regex->match->last_separator_end != regex->match->offsets[1])
-       {
-         token = g_strndup (string + new_pos, regex->match->offsets[0] - new_pos);
-
-         /* if there were substrings, these need to get added to the
-          * list of delims */
-         match_count = g_regex_get_match_count (regex);
-         if (match_count > 1)
-           {
-             gint i;
-             for (i = 1; i < match_count; i++)
-               regex->match->delims = g_slist_append (regex->match->delims,
-                                                      g_regex_fetch (regex, i, string));
-           }
-
-         regex->match->last_separator_end = regex->match->offsets[1];
-       }
-      else
-       {
-         /* we have skipped an empty separator so we need to find the
-          * next match. */
-         return g_regex_split_next_full (regex, string, string_len,
-                                         start_position, match_options,
-                                         error);
-       }
-    }
-  else
-    {
-      /* if there was no match, copy to end of string. */
-      if (!regex->match->last_match_is_empty)
-       token = g_strndup (string + new_pos, regex->match->string_len - new_pos);
-      else
-       token = NULL;
-    }
+  string_list = g_new (gchar *, g_list_length (list) + 1);
+  i = 0;
+  for (last = g_list_last (list); last; last = g_list_previous (last))
+    string_list[i++] = last->data;
+  string_list[i] = 0;
+  g_list_free (list);
  
-  return token;
+  return string_list;
  }
  
  enum
@@ -1685,14 +1523,14 @@ typedef enum
    CHANGE_CASE_UPPER_MASK   = CHANGE_CASE_UPPER | CHANGE_CASE_UPPER_SINGLE
  } ChangeCase;
  
-typedef struct 
+struct _InterpolationData
  {
    gchar     *text;   
    gint       type;   
    gint       num;
    gchar      c;
    ChangeCase change_case;
-} InterpolationData;
+};
  
  static void
  free_interpolation_data (InterpolationData *data)
@@ -2037,10 +1875,11 @@ string_append (GString     *string,
  }
  
  static gboolean
-interpolate_replacement (const GRegex *regex,
-                        const gchar  *string,
-                        GString      *result,
-                        gpointer      data)
+interpolate_replacement (const GRegex     *regex,
+                        const GMatchInfo *match_info,
+                        const gchar      *string,
+                        GString          *result,
+                        gpointer          data)
  {
    GList *list;
    InterpolationData *idata;
@@ -2061,16 +1900,16 @@ interpolate_replacement (const GRegex *regex,
              change_case = CHANGE_CASE_NONE;
           break;
         case REPL_TYPE_NUMERIC_REFERENCE:
-         match = g_regex_fetch (regex, idata->num, string);
-         if (match) 
+         match = g_match_info_fetch (match_info, idata->num);
+         if (match)
             {
               string_append (result, match, &change_case);
               g_free (match);
             }
           break;
         case REPL_TYPE_SYMBOLIC_REFERENCE:
-         match = g_regex_fetch_named (regex, idata->text, string);
-         if (match) 
+         match = g_match_info_fetch_named (match_info, idata->text);
+         if (match)
             {
               string_append (result, match, &change_case);
               g_free (match);
@@ -2086,55 +1925,6 @@ interpolate_replacement (const GRegex *regex,
  }
  
  /**
- * g_regex_expand_references:
- * @regex: #GRegex structure used in last match
- * @string: the string on which the last match was made
- * @string_to_expand: the string to expand
- * @error: location to store the error occuring, or %NULL to ignore errors
- *
- * Returns a new string containing the text in @string_to_expand with
- * references expanded. References refer to the last match done with
- * @string against @regex and have the same syntax used by g_regex_replace().
- *
- * The @string_to_expand must be UTF-8 encoded even if #G_REGEX_RAW was
- * passed to g_regex_new().
- *
- * Returns: the expanded string, or %NULL if an error occurred
- *
- * Since: 2.14
- */
-gchar *
-g_regex_expand_references (GRegex            *regex, 
-                          const gchar       *string, 
-                          const gchar       *string_to_expand,
-                          GError           **error)
-{
-  GString *result;
-  GList *list;
-  GError *tmp_error = NULL;
-
-  g_return_val_if_fail (regex != NULL, NULL);
-  g_return_val_if_fail (string != NULL, NULL);
-  g_return_val_if_fail (string_to_expand != NULL, NULL);
-  g_return_val_if_fail (error == NULL || *error == NULL, NULL);
-
-  list = split_replacement (string_to_expand, &tmp_error);
-  if (tmp_error != NULL)
-    {
-      g_propagate_error (error, tmp_error);
-      return NULL;
-    }
-
-  result = g_string_sized_new (strlen (string_to_expand));
-  interpolate_replacement (regex, string, result, list);
-
-  g_list_foreach (list, (GFunc)free_interpolation_data, NULL);
-  g_list_free (list);
-
-  return g_string_free (result, FALSE);
-}
-
-/**
   * g_regex_replace:
   * @regex: a #GRegex structure
   * @string: the string to perform matches against
@@ -2196,7 +1986,7 @@ g_regex_expand_references (GRegex            *regex,
   * Since: 2.14
   */
  gchar *
-g_regex_replace (GRegex            *regex, 
+g_regex_replace (const GRegex      *regex, 
                  const gchar       *string, 
                  gssize             string_len,
                  gint               start_position,
@@ -2238,10 +2028,11 @@ g_regex_replace (GRegex            *regex,
  }
  
  static gboolean
-literal_replacement (const GRegex *regex,
-                    const gchar  *string,
-                    GString      *result,
-                    gpointer      data)
+literal_replacement (const GRegex     *regex,
+                    const GMatchInfo *match_info,
+                    const gchar      *string,
+                    GString          *result,
+                    gpointer          data)
  {
    g_string_append (result, data);
    return FALSE;
@@ -2270,7 +2061,7 @@ literal_replacement (const GRegex *regex,
   * Since: 2.14
   */
  gchar *
-g_regex_replace_literal (GRegex          *regex,
+g_regex_replace_literal (const GRegex    *regex,
                          const gchar     *string,
                          gssize           string_len,
                          gint             start_position,
@@ -2312,7 +2103,7 @@ g_regex_replace_literal (GRegex          *regex,
   * Since: 2.14
   */
  gchar *
-g_regex_replace_eval (GRegex            *regex,
+g_regex_replace_eval (const GRegex      *regex,
                       const gchar       *string,
                       gssize             string_len,
                       gint               start_position,
@@ -2321,6 +2112,7 @@ g_regex_replace_eval (GRegex            *regex,
                       gpointer           user_data,
                       GError           **error)
  {
+  GMatchInfo *match_info;
    GString *result;
    gint str_pos = 0;
    gboolean done = FALSE;
@@ -2332,28 +2124,24 @@ g_regex_replace_eval (GRegex            *regex,
    g_return_val_if_fail (eval != NULL, NULL);
    g_return_val_if_fail ((match_options & ~G_REGEX_MATCH_MASK) == 0, NULL);
  
-  regex_lazy_init_match (regex, 0);
-
    if (string_len < 0)
      string_len = strlen (string);
  
-  /* clear out the regex for reuse, just in case */
-  g_regex_clear (regex);
-
    result = g_string_sized_new (string_len);
  
    /* run down the string making matches. */
-  while (!done &&
-        g_regex_match_next_full (regex, string, string_len,
-                                 start_position, match_options, &tmp_error))
+  g_regex_match_full (regex, string, string_len, start_position,
+                     match_options, &match_info, &tmp_error);
+  while (!done && g_match_info_matches (match_info))
      {
        g_string_append_len (result,
                            string + str_pos,
-                          regex->match->offsets[0] - str_pos);
-      done = (*eval) (regex, string, result, user_data);
-      str_pos = regex->match->offsets[1];
+                          match_info->offsets[0] - str_pos);
+      done = (*eval) (regex, match_info, string, result, user_data);
+      str_pos = match_info->offsets[1];
+      g_match_info_next (match_info, &tmp_error);
      }
-
+  g_match_info_free (match_info);
    if (tmp_error != NULL)
      {
        g_propagate_error (error, tmp_error);
@@ -2362,7 +2150,6 @@ g_regex_replace_eval (GRegex            *regex,
      }
  
    g_string_append_len (result, string + str_pos, string_len - str_pos);
-
    return g_string_free (result, FALSE);
  }
  
diff --git a/glib/gregex.h b/glib/gregex.h

index 365b739..5d4eaaa 100644 (file)
--- a/glib/gregex.h
+++ b/glib/gregex.h
@@ -2,7 +2,7 @@
   *
   * Copyright (C) 1999, 2000 Scott Wimer
   * Copyright (C) 2004, Matthias Clasen <mclasen@redhat.com>
- * Copyright (C) 2005 - 2006, Marco Barisione <marco@barisione.org>
+ * Copyright (C) 2005 - 2007, Marco Barisione <marco@barisione.org>
   *
   * This library is free software; you can redistribute it and/or
   * modify it under the terms of the GNU Lesser General Public
@@ -52,6 +52,7 @@ typedef enum
    G_REGEX_UNGREEDY          = 1 << 9,
    G_REGEX_RAW               = 1 << 11,
    G_REGEX_NO_AUTO_CAPTURE   = 1 << 12,
+  G_REGEX_OPTIMIZE          = 1 << 13,
    G_REGEX_DUPNAMES          = 1 << 19,
    G_REGEX_NEWLINE_CR        = 1 << 20,
    G_REGEX_NEWLINE_LF        = 1 << 21,
@@ -73,9 +74,14 @@ typedef enum
    G_REGEX_MATCH_NEWLINE_ANY   = 1 << 22
  } GRegexMatchFlags;
  
-typedef struct _GRegex  GRegex;
+typedef struct _GRegex         GRegex;
+typedef struct _GMatchInfo     GMatchInfo;
  
-typedef gboolean (*GRegexEvalCallback) (const GRegex*, const gchar*, GString*, gpointer);
+typedef gboolean (*GRegexEvalCallback)         (const GRegex *,
+                                                const GMatchInfo *,
+                                                const gchar *,
+                                                GString *,
+                                                gpointer);
  
  
  GRegex          *g_regex_new                   (const gchar         *pattern,
@@ -83,104 +89,72 @@ GRegex              *g_regex_new                   (const gchar         *pattern,
                                                  GRegexMatchFlags     match_options,
                                                  GError             **error);
  void             g_regex_free                  (GRegex              *regex);
-gboolean         g_regex_optimize              (GRegex              *regex,
-                                                GError             **error);
-GRegex          *g_regex_copy                  (const GRegex        *regex);
  const gchar     *g_regex_get_pattern           (const GRegex        *regex);
-void             g_regex_clear                 (GRegex              *regex);
+gint             g_regex_get_string_number     (const GRegex        *regex, 
+                                                const gchar         *name);
+gchar           *g_regex_escape_string         (const gchar         *string,
+                                                gint                 length);
+
+/* Matching. */
  gboolean         g_regex_match_simple          (const gchar         *pattern,
                                                  const gchar         *string,
                                                  GRegexCompileFlags   compile_options,
                                                  GRegexMatchFlags     match_options);
-gboolean         g_regex_match                 (GRegex              *regex,
+gboolean         g_regex_match                 (const GRegex        *regex,
                                                  const gchar         *string,
-                                                GRegexMatchFlags     match_options);
-gboolean         g_regex_match_full            (GRegex              *regex,
-                                                const gchar         *string,
-                                                gssize               string_len,
-                                                gint                 start_position,
                                                  GRegexMatchFlags     match_options,
-                                                GError             **error);
-gboolean         g_regex_match_next            (GRegex              *regex,
-                                                const gchar         *string,
-                                                GRegexMatchFlags     match_options);
-gboolean         g_regex_match_next_full       (GRegex              *regex,
+                                                GMatchInfo         **match_info);
+gboolean         g_regex_match_full            (const GRegex        *regex,
                                                  const gchar         *string,
                                                  gssize               string_len,
                                                  gint                 start_position,
                                                  GRegexMatchFlags     match_options,
+                                                GMatchInfo         **match_info,
                                                  GError             **error);
-gboolean         g_regex_match_all             (GRegex              *regex,
+gboolean         g_regex_match_all             (const GRegex        *regex,
                                                  const gchar         *string,
-                                                GRegexMatchFlags     match_options);
-gboolean         g_regex_match_all_full        (GRegex              *regex,
+                                                GRegexMatchFlags     match_options,
+                                                GMatchInfo         **match_info);
+gboolean         g_regex_match_all_full        (const GRegex        *regex,
                                                  const gchar         *string,
                                                  gssize               string_len,
                                                  gint                 start_position,
                                                  GRegexMatchFlags     match_options,
+                                                GMatchInfo         **match_info,
                                                  GError             **error);
-gint             g_regex_get_match_count       (const GRegex        *regex);
-gboolean         g_regex_is_partial_match      (const GRegex        *regex);
-gchar           *g_regex_fetch                 (const GRegex        *regex,
-                                                gint                 match_num,
-                                                const gchar         *string);
-gboolean         g_regex_fetch_pos             (const GRegex        *regex,
-                                                gint                 match_num,
-                                                gint                *start_pos,
-                                                gint                *end_pos);
-gchar           *g_regex_fetch_named           (const GRegex        *regex,
-                                                const gchar         *name,
-                                                const gchar         *string);
-gboolean         g_regex_fetch_named_pos       (const GRegex        *regex,
-                                                const gchar         *name,
-                                                gint                *start_pos,
-                                                gint                *end_pos);
-gchar          **g_regex_fetch_all             (const GRegex        *regex,
-                                                const gchar         *string);
-gint             g_regex_get_string_number     (const GRegex        *regex, 
-                                                const gchar         *name);
+
+/* String splitting. */
  gchar          **g_regex_split_simple          (const gchar         *pattern,
                                                  const gchar         *string,
                                                  GRegexCompileFlags   compile_options,
                                                  GRegexMatchFlags     match_options);
-gchar          **g_regex_split                 (GRegex              *regex,
+gchar          **g_regex_split                 (const GRegex        *regex,
                                                  const gchar         *string,
                                                  GRegexMatchFlags     match_options);
-gchar          **g_regex_split_full            (GRegex              *regex,
+gchar          **g_regex_split_full            (const GRegex        *regex,
                                                  const gchar         *string,
                                                  gssize               string_len,
                                                  gint                 start_position,
                                                  GRegexMatchFlags     match_options,
                                                  gint                 max_tokens,
                                                  GError             **error);
-gchar           *g_regex_split_next            (GRegex              *regex,
-                                                const gchar         *string,
-                                                GRegexMatchFlags     match_options);
-gchar           *g_regex_split_next_full       (GRegex              *regex,
-                                                const gchar         *string,
-                                                gssize               string_len,
-                                                gint                 start_position,
-                                                GRegexMatchFlags     match_options,
-                                                GError             **error);
-gchar           *g_regex_expand_references     (GRegex              *regex,
-                                                const gchar         *string,
-                                                const gchar         *string_to_expand,
-                                                GError             **error);
-gchar           *g_regex_replace               (GRegex              *regex,
+
+/* String replacement. */
+gchar           *g_regex_replace               (const GRegex        *regex,
                                                  const gchar         *string,
                                                  gssize               string_len,
                                                  gint                 start_position,
                                                  const gchar         *replacement,
                                                  GRegexMatchFlags     match_options,
                                                  GError             **error);
-gchar           *g_regex_replace_literal       (GRegex              *regex,
+gchar           *g_regex_replace_literal       (const GRegex        *regex,
                                                  const gchar         *string,
                                                  gssize               string_len,
                                                  gint                 start_position,
                                                  const gchar         *replacement,
                                                  GRegexMatchFlags     match_options,
                                                  GError             **error);
-gchar           *g_regex_replace_eval          (GRegex              *regex,
+gchar           *g_regex_replace_eval          (const GRegex        *regex,
                                                  const gchar         *string,
                                                  gssize               string_len,
                                                  gint                 start_position,
@@ -188,9 +162,30 @@ gchar               *g_regex_replace_eval          (GRegex              *regex,
                                                  GRegexEvalCallback   eval,
                                                  gpointer             user_data,
                                                  GError             **error);
-gchar           *g_regex_escape_string         (const gchar         *string,
-                                                gint                 length);
  
+/* Match info */
+void             g_match_info_free             (GMatchInfo          *match_info);
+gboolean         g_match_info_next             (GMatchInfo          *match_info,
+                                                GError             **error);
+gboolean         g_match_info_matches          (const GMatchInfo    *match_info);
+gint             g_match_info_get_match_count  (const GMatchInfo    *match_info);
+gboolean         g_match_info_is_partial_match (const GMatchInfo    *match_info);
+gchar           *g_match_info_expand_references(const GMatchInfo    *match_info,
+                                                const gchar         *string_to_expand,
+                                                GError             **error);
+gchar           *g_match_info_fetch            (const GMatchInfo    *match_info,
+                                                gint                 match_num);
+gboolean         g_match_info_fetch_pos        (const GMatchInfo    *match_info,
+                                                gint                 match_num,
+                                                gint                *start_pos,
+                                                gint                *end_pos);
+gchar           *g_match_info_fetch_named      (const GMatchInfo    *match_info,
+                                                const gchar         *name);
+gboolean         g_match_info_fetch_named_pos  (const GMatchInfo    *match_info,
+                                                const gchar         *name,
+                                                gint                *start_pos,
+                                                gint                *end_pos);
+gchar          **g_match_info_fetch_all        (const GMatchInfo    *match_info);
  
  G_END_DECLS
  
diff --git a/tests/regex-test.c b/tests/regex-test.c

index 79b82af..e1eeb27 100644 (file)
--- a/tests/regex-test.c
+++ b/tests/regex-test.c
@@ -108,13 +108,6 @@ test_new (const gchar        *pattern,
        return FALSE;
      }
  
-  if (!g_regex_optimize (regex, NULL))
-    {
-      g_print ("failed optimization \t(pattern: \"%s\", compile: %d, match %d)\n",
-              pattern, compile_opts, match_opts);
-      return FALSE;
-    }
-
    if (!streq (g_regex_get_pattern (regex), pattern))
      {
        g_print ("failed \t(pattern: \"%s\")\n",
@@ -170,59 +163,6 @@ test_new_fail (const gchar        *pattern,
  }
  
  static gboolean
-test_copy (const gchar  *pattern)
-{
-  GRegex *regex1, *regex2, *regex3;
-
-  verbose ("copying \"%s\" \t", pattern);
-
-  regex1 = g_regex_new (pattern, 0, 0, NULL);
-  if (regex1 != NULL)
-    /* pattern can be not valid as we want to test what happens
-     * when the regex passed to g_regex_copy() is null */
-    g_regex_optimize (regex1, NULL);
-  regex2 = g_regex_copy (regex1);
-
-  if (regex1 != NULL &&
-      !streq (g_regex_get_pattern (regex1), g_regex_get_pattern(regex2)))
-    {
-      g_print ("failed \t(pattern: \"%s\")\n", pattern);
-      g_regex_free (regex1);
-      g_regex_free (regex2);
-      return FALSE;
-    }
-
-  g_regex_free (regex1);
-
-  /* force the creation of the internal GRegexMatch */
-  if (regex2 != NULL)
-    g_regex_match (regex2, "a", 0);
-  regex3 = g_regex_copy (regex2);
-  g_regex_free (regex2);
-
-  if (regex3 != NULL &&
-      !streq (g_regex_get_pattern (regex3), pattern))
-    {
-      g_print ("failed \t(pattern: \"%s\")\n", pattern);
-      g_regex_free (regex3);
-      return FALSE;
-    }
-
-  g_regex_free (regex3);
-
-  verbose ("passed\n");
-  return TRUE;
-}
-
-#define TEST_COPY(pattern) { \
-  total++; \
-  if (test_copy (pattern)) \
-    PASS; \
-  else \
-    FAIL; \
-}
-
-static gboolean
  test_match_simple (const gchar        *pattern,
                    const gchar        *string,
                    GRegexCompileFlags  compile_opts,
@@ -230,8 +170,8 @@ test_match_simple (const gchar        *pattern,
                    gboolean            expected)
  {
    gboolean match;
-  \r
-  verbose ("matching \"%s\" against \"%s\" \t", string, pattern);\r
+
+  verbose ("matching \"%s\" against \"%s\" \t", string, pattern);
  
    match = g_regex_match_simple (pattern, string, compile_opts, match_opts);
    if (match != expected)
@@ -272,31 +212,21 @@ test_match (const gchar        *pattern,
  
    regex = g_regex_new (pattern, compile_opts, match_opts, NULL);
    match = g_regex_match_full (regex, string, string_len,
-                             start_position, match_opts2, NULL);
-  if (match != expected)
-    {\r
-      gchar *e1 = g_strescape (pattern, NULL);\r
-      gchar *e2 = g_strescape (string, NULL);
-      g_print ("failed \t(unexpected %s) '%s' against '%s'\n", match ? "match" : "mismatch", e1, e2);\r
-      g_free (e1);\r
-      g_free (e2);\r
-      g_regex_free (regex);
-      return FALSE;
-    }
-
-  /* Repeat the test to verify that g_regex_clear() is not needed. */
-  match = g_regex_match_full (regex, string, string_len,
-                             start_position, match_opts2, NULL);
+                             start_position, match_opts2, NULL, NULL);
    if (match != expected)
      {
-      g_print ("failed \t(second match != first match)\n");
+      gchar *e1 = g_strescape (pattern, NULL);
+      gchar *e2 = g_strescape (string, NULL);
+      g_print ("failed \t(unexpected %s) '%s' against '%s'\n", match ? "match" : "mismatch", e1, e2);
+      g_free (e1);
+      g_free (e2);
        g_regex_free (regex);
        return FALSE;
      }
  
    if (string_len == -1 && start_position == 0)
      {
-      match = g_regex_match (regex, string, match_opts2);
+      match = g_regex_match (regex, string, match_opts2, NULL);
        if (match != expected)
         {
           g_print ("failed \t(pattern: \"%s\", string: \"%s\")\n",
@@ -340,13 +270,14 @@ free_match (gpointer data, gpointer user_data)
  }
  
  static gboolean
-test_match_next_full (const gchar          *pattern,
-                     const gchar          *string,
-                     gssize                string_len,
-                     gint                  start_position,
-                     ...)
+test_match_next (const gchar *pattern,
+                const gchar *string,
+                gssize       string_len,
+                gint         start_position,
+                ...)
  {
    GRegex *regex;
+  GMatchInfo *match_info;
    va_list args;
    GSList *matches = NULL;
    GSList *expected = NULL;
@@ -376,114 +307,19 @@ test_match_next_full (const gchar          *pattern,
  
    regex = g_regex_new (pattern, 0, 0, NULL);
  
-  while (g_regex_match_next_full (regex, string, string_len,
-                                 start_position, 0, NULL))
-   {
-      Match *match = g_new0 (Match, 1);
-      match->string = g_regex_fetch (regex, 0, string);
-      match->start = UNTOUCHED;
-      match->end = UNTOUCHED;
-      g_regex_fetch_pos (regex, 0, &match->start, &match->end);
-      matches = g_slist_prepend (matches, match);
-   }
-  matches = g_slist_reverse (matches);
-
-  if (g_slist_length (matches) != g_slist_length (expected))
-    {
-      gint match_count = g_slist_length (matches);
-      g_print ("failed \t(got %d %s, expected %d)\n", match_count,
-              match_count == 1 ? "match" : "matches", 
-              g_slist_length (expected));
-      ret = FALSE;
-      goto exit;
-    }
-
-  l_exp = expected;
-  l_match =  matches;
-  while (l_exp != NULL)
-    {
-      Match *exp = l_exp->data;
-      Match *match = l_match->data;
-
-      if (!streq(exp->string, match->string))
-       {
-         g_print ("failed \t(got \"%s\", expected \"%s\")\n",
-                  match->string, exp->string);
-         ret = FALSE;
-         goto exit;
-       }
-
-      if (exp->start != match->start || exp->end != match->end)
-       {
-         g_print ("failed \t(got [%d, %d], expected [%d, %d])\n",
-                  match->start, match->end, exp->start, exp->end);
-         ret = FALSE;
-         goto exit;
-       }
-
-      l_exp = g_slist_next (l_exp);
-      l_match = g_slist_next (l_match);
-    }
-
-exit:
-  if (ret)
+  g_regex_match_full (regex, string, string_len,
+                     start_position, 0, &match_info, NULL);
+  while (g_match_info_matches (match_info))
      {
-      gint count = g_slist_length (matches);
-      verbose ("passed (%d %s)\n", count, count == 1 ? "match" : "matches");
-    }
-
-  g_regex_free (regex);
-  g_slist_foreach (expected, free_match, NULL);
-  g_slist_free (expected);
-  g_slist_foreach (matches, free_match, NULL);
-  g_slist_free (matches);
-
-  return ret;
-}
-
-static gboolean
-test_match_next (const gchar          *pattern,
-                const gchar          *string,
-                ...)
-{
-  GRegex *regex;
-  va_list args;
-  GSList *matches = NULL;
-  GSList *expected = NULL;
-  GSList *l_exp, *l_match;
-  gboolean ret = TRUE;
-  
-  verbose ("matching \"%s\" against \"%s\" \t", string, pattern);
-
-  /* The va_list is a NULL-terminated sequence of: extected matched string,
-   * expected start and expected end. */
-  va_start (args, string);
-  while (TRUE)
-   {
-      Match *match;
-      const gchar *expected_string = va_arg (args, const gchar *);
-      if (expected_string == NULL)
-        break;
-      match = g_new0 (Match, 1);
-      match->string = g_strdup (expected_string);
-      match->start = va_arg (args, gint);
-      match->end = va_arg (args, gint);
-      expected = g_slist_prepend (expected, match);
-    }
-  expected = g_slist_reverse (expected);
-  va_end (args);
-
-  regex = g_regex_new (pattern, 0, 0, NULL);
-
-  while (g_regex_match_next (regex, string, 0))
-   {
        Match *match = g_new0 (Match, 1);
-      match->string = g_regex_fetch (regex, 0, string);
+      match->string = g_match_info_fetch (match_info, 0);
        match->start = UNTOUCHED;
        match->end = UNTOUCHED;
-      g_regex_fetch_pos (regex, 0, &match->start, &match->end);
+      g_match_info_fetch_pos (match_info, 0, &match->start, &match->end);
        matches = g_slist_prepend (matches, match);
-   }
+      g_match_info_next (match_info, NULL);
+    }
+  g_match_info_free (match_info);
    matches = g_slist_reverse (matches);
  
    if (g_slist_length (matches) != g_slist_length (expected))
@@ -541,91 +377,50 @@ exit:
  
  #define TEST_MATCH_NEXT0(pattern, string, string_len, start_position) { \
    total++; \
-  if (test_match_next_full (pattern, string, string_len, start_position, NULL)) \
+  if (test_match_next (pattern, string, string_len, start_position, NULL)) \
      PASS; \
    else \
      FAIL; \
-  if (string_len == -1 && start_position == 0) \
-  { \
-    total++; \
-    if (test_match_next (pattern, string, NULL)) \
-      PASS; \
-    else \
-      FAIL; \
-  } \
  }
  
  #define TEST_MATCH_NEXT1(pattern, string, string_len, start_position, \
                               t1, s1, e1) { \
    total++; \
-  if (test_match_next_full (pattern, string, string_len, start_position, \
-                           t1, s1, e1, NULL)) \
+  if (test_match_next (pattern, string, string_len, start_position, \
+                      t1, s1, e1, NULL)) \
      PASS; \
    else \
      FAIL; \
-  if (string_len == -1 && start_position == 0) \
-  { \
-    total++; \
-    if (test_match_next (pattern, string, t1, s1, e1, NULL)) \
-      PASS; \
-    else \
-      FAIL; \
-  } \
  }
  
  #define TEST_MATCH_NEXT2(pattern, string, string_len, start_position, \
                          t1, s1, e1, t2, s2, e2) { \
    total++; \
-  if (test_match_next_full (pattern, string, string_len, start_position, \
-                           t1, s1, e1, t2, s2, e2, NULL)) \
+  if (test_match_next (pattern, string, string_len, start_position, \
+                      t1, s1, e1, t2, s2, e2, NULL)) \
      PASS; \
    else \
      FAIL; \
-  if (string_len == -1 && start_position == 0) \
-  { \
-    total++; \
-    if (test_match_next (pattern, string, t1, s1, e1, t2, s2, e2, NULL)) \
-      PASS; \
-    else \
-      FAIL; \
-  } \
  }
  
  #define TEST_MATCH_NEXT3(pattern, string, string_len, start_position, \
                          t1, s1, e1, t2, s2, e2, t3, s3, e3) { \
    total++; \
-  if (test_match_next_full (pattern, string, string_len, start_position, \
-                           t1, s1, e1, t2, s2, e2, t3, s3, e3, NULL)) \
+  if (test_match_next (pattern, string, string_len, start_position, \
+                      t1, s1, e1, t2, s2, e2, t3, s3, e3, NULL)) \
      PASS; \
    else \
      FAIL; \
-  if (string_len == -1 && start_position == 0) \
-  { \
-    total++; \
-    if (test_match_next (pattern, string, t1, s1, e1, t2, s2, e2, t3, s3, e3, NULL)) \
-      PASS; \
-    else \
-      FAIL; \
-  } \
  }
  
  #define TEST_MATCH_NEXT4(pattern, string, string_len, start_position, \
                          t1, s1, e1, t2, s2, e2, t3, s3, e3, t4, s4, e4) { \
    total++; \
-  if (test_match_next_full (pattern, string, string_len, start_position, \
-                           t1, s1, e1, t2, s2, e2, t3, s3, e3, t4, s4, e4, NULL)) \
+  if (test_match_next (pattern, string, string_len, start_position, \
+                      t1, s1, e1, t2, s2, e2, t3, s3, e3, t4, s4, e4, NULL)) \
      PASS; \
    else \
      FAIL; \
-  if (string_len == -1 && start_position == 0) \
-  { \
-    total++;\
-    if (test_match_next (pattern, string, t1, s1, e1, t2, s2, e2, t3, s3, e3, \
-                        t4, s4, e4, NULL)) \
-      PASS; \
-    else \
-      FAIL; \
-  } \
  }
  
  static gboolean
@@ -636,6 +431,7 @@ test_match_count (const gchar      *pattern,
                   gint              expected_count)
  {
    GRegex *regex;
+  GMatchInfo *match_info;
    gint count;
    
    verbose ("fetching match count (string: \"%s\", pattern: \"%s\", start: %d) \t",
@@ -643,9 +439,9 @@ test_match_count (const gchar      *pattern,
  
    regex = g_regex_new (pattern, 0, 0, NULL);
  
-  g_regex_match_next_full (regex, string, -1, start_position,
-                          match_opts, NULL);
-  count = g_regex_get_match_count (regex);
+  g_regex_match_full (regex, string, -1, start_position,
+                     match_opts, &match_info, NULL);
+  count = g_match_info_get_match_count (match_info);
  
    if (count != expected_count)
      {
@@ -653,6 +449,7 @@ test_match_count (const gchar      *pattern,
        return FALSE;
      }
  
+  g_match_info_free (match_info);
    g_regex_free (regex);
  
    verbose ("passed\n");
@@ -673,34 +470,36 @@ test_partial (const gchar *pattern,
               gboolean     expected)
  {
    GRegex *regex;
+  GMatchInfo *match_info;
    
    verbose ("partial matching (string: \"%s\", pattern: \"%s\") \t",
            string, pattern);
  
    regex = g_regex_new (pattern, 0, 0, NULL);
  
-  g_regex_match (regex, string, G_REGEX_MATCH_PARTIAL);
-  if (expected != g_regex_is_partial_match (regex))
+  g_regex_match (regex, string, G_REGEX_MATCH_PARTIAL, &match_info);
+  if (expected != g_match_info_is_partial_match (match_info))
      {
        g_print ("failed \t(got %d, expected: %d)\n", !expected, expected);
        g_regex_free (regex);
        return FALSE;
      }
  
-  if (expected && g_regex_fetch_pos (regex, 0, NULL, NULL))
+  if (expected && g_match_info_fetch_pos (match_info, 0, NULL, NULL))
      {
        g_print ("failed \t(got sub-pattern 0)\n");
        g_regex_free (regex);
        return FALSE;
      }
  
-  if (expected && g_regex_fetch_pos (regex, 1, NULL, NULL))
+  if (expected && g_match_info_fetch_pos (match_info, 1, NULL, NULL))
      {
        g_print ("failed \t(got sub-pattern 1)\n");
        g_regex_free (regex);
        return FALSE;
      }
  
+  g_match_info_free (match_info);
    g_regex_free (regex);
  
    verbose ("passed\n");
@@ -716,83 +515,6 @@ test_partial (const gchar *pattern,
  }
  
  static gboolean
-test_clear (const gchar *pattern,
-           const gchar *string,
-           gint         start_position)
-{
-  GRegex *regex;
-  gboolean match1, match2;
-  gint start1 = UNTOUCHED;
-  gint end1 = UNTOUCHED;
-  gint start2 = UNTOUCHED;
-  gint end2 = UNTOUCHED;
-  gchar *text1 = NULL;
-  gchar *text2 = NULL;
-  gboolean ret = TRUE;
-  
-  verbose ("testing clear with \"%s\" against \"%s\" (start: %d) \t",
-          string, pattern, start_position);
-
-  regex = g_regex_new (pattern, 0, 0, NULL);
-
-  match1 = g_regex_match_next_full (regex, string, UNTOUCHED, start_position,
-                                   0, NULL);
-  if (match1)
-    {
-      text1 = g_regex_fetch (regex, 0, string);
-      g_regex_fetch_pos (regex, 0, &start1, &end1);
-    }
-
-  g_regex_clear (regex);
-
-  match2 = g_regex_match_next_full (regex, string, UNTOUCHED, start_position,
-                                   0, NULL);
-  if (match2)
-    {
-      text2 = g_regex_fetch (regex, 0, string);
-      g_regex_fetch_pos (regex, 0, &start2, &end2);
-    }
-
-  if (match1 != match2)
-    {
-      g_print ("failed \t(different matches)\n");
-      ret = FALSE;
-    }
-  else if (match1)
-    {
-      if (!streq (text1, text2))
-       {
-         g_print ("failed \t(first: \"%s\", second: \"%s\")\n",
-                  text1, text2);
-         ret = FALSE;
-       }
-      if (start1 != start2 || end1 != end2)
-       {
-         g_print ("failed \t(first: [%d, %d], second: [%d, %d])\n",
-                  start1, end1, start2, end2);
-         ret = FALSE;
-       }
-    }
-
-  g_regex_free (regex);
-  g_free (text1);
-  g_free (text2);
-
-  if (ret)
-    verbose ("passed\n");
-
-  return ret;
-}
-
-#define TEST_CLEAR(pattern, string, start_position) { \
-  total++; \
-  if (test_clear (pattern, string, start_position)) \
-    PASS; \
-  else \
-    FAIL; \
-}
-
-static gboolean
  test_sub_pattern (const gchar *pattern,
                   const gchar *string,
                   gint         start_position,
@@ -802,6 +524,7 @@ test_sub_pattern (const gchar *pattern,
                   gint         expected_end)
  {
    GRegex *regex;
+  GMatchInfo *match_info;
    gchar *sub_expr;
    gint start = UNTOUCHED, end = UNTOUCHED;
  
@@ -809,9 +532,9 @@ test_sub_pattern (const gchar *pattern,
            sub_n, string, pattern);
  
    regex = g_regex_new (pattern, 0, 0, NULL);
-  g_regex_match_full (regex, string, -1, start_position, 0, NULL);
+  g_regex_match_full (regex, string, -1, start_position, 0, &match_info, NULL);
  
-  sub_expr = g_regex_fetch (regex, sub_n, string);
+  sub_expr = g_match_info_fetch (match_info, sub_n);
    if (!streq(sub_expr, expected_sub))
      {
        g_print ("failed \t(got \"%s\", expected \"%s\")\n",
@@ -822,7 +545,7 @@ test_sub_pattern (const gchar *pattern,
      }
    g_free (sub_expr);
  
-  g_regex_fetch_pos (regex, sub_n, &start, &end);
+  g_match_info_fetch_pos (match_info, sub_n, &start, &end);
    if (start != expected_start || end != expected_end)
      {
        g_print ("failed \t(got [%d, %d], expected [%d, %d])\n",
@@ -831,28 +554,7 @@ test_sub_pattern (const gchar *pattern,
        return FALSE;
      }
  
-  /* Repeat the test to verify that g_regex_clear() is not needed. */
-  g_regex_match_full (regex, string, -1, start_position, 0, NULL);
-
-  sub_expr = g_regex_fetch (regex, sub_n, string);
-  if (!streq(sub_expr, expected_sub))
-    {
-      g_print ("failed \t(second match != first matchs)\n");
-      g_free (sub_expr);
-      g_regex_free (regex);
-      return FALSE;
-    }
-  g_free (sub_expr);
-
-  g_regex_fetch_pos (regex, sub_n, &start, &end);
-  if (start != expected_start || end != expected_end)
-    {
-      g_print ("failed \t(second match != first matchs)\n");
-      g_regex_free (regex);
-      return FALSE;
-    }
-
-
+  g_match_info_free (match_info);
    g_regex_free (regex);
  
    verbose ("passed\n");
@@ -879,6 +581,7 @@ test_named_sub_pattern (const gchar *pattern,
                         gint         expected_end)
  {
    GRegex *regex;
+  GMatchInfo *match_info;
    gint start = UNTOUCHED, end = UNTOUCHED;
    gchar *sub_expr;
  
@@ -887,8 +590,8 @@ test_named_sub_pattern (const gchar *pattern,
  
    regex = g_regex_new (pattern, 0, 0, NULL);
  
-  g_regex_match_full (regex, string, -1, start_position, 0, NULL);
-  sub_expr = g_regex_fetch_named (regex, sub_name, string);
+  g_regex_match_full (regex, string, -1, start_position, 0, &match_info, NULL);
+  sub_expr = g_match_info_fetch_named (match_info, sub_name);
    if (!streq (sub_expr, expected_sub))
      {
        g_print ("failed \t(got \"%s\", expected \"%s\")\n",
@@ -899,7 +602,7 @@ test_named_sub_pattern (const gchar *pattern,
      }
    g_free (sub_expr);
  
-  g_regex_fetch_named_pos (regex, sub_name, &start, &end);
+  g_match_info_fetch_named_pos (match_info, sub_name, &start, &end);
    if (start != expected_start || end != expected_end)
      {
        g_print ("failed \t(got [%d, %d], expected [%d, %d])\n",
@@ -908,6 +611,7 @@ test_named_sub_pattern (const gchar *pattern,
        return FALSE;
      }
  
+  g_match_info_free (match_info);
    g_regex_free (regex);
  
    verbose ("passed\n");
@@ -930,6 +634,7 @@ test_fetch_all (const gchar *pattern,
                 ...)
  {
    GRegex *regex;
+  GMatchInfo *match_info;
    va_list args;
    GSList *expected = NULL;
    GSList *l_exp;
@@ -955,8 +660,8 @@ test_fetch_all (const gchar *pattern,
    va_end (args);
  
    regex = g_regex_new (pattern, 0, 0, NULL);
-  g_regex_match (regex, string, 0);
-  matches = g_regex_fetch_all (regex, string);
+  g_regex_match (regex, string, 0, &match_info);
+  matches = g_match_info_fetch_all (match_info);
    if (matches)
      match_count = g_strv_length (matches);
    else
@@ -987,6 +692,7 @@ test_fetch_all (const gchar *pattern,
            match_count == 1 ? "match" : "matches");
  
  exit:
+  g_match_info_free (match_info);
    g_regex_free (regex);
    g_slist_foreach (expected, (GFunc)g_free, NULL);
    g_slist_free (expected);
@@ -1332,211 +1038,6 @@ exit:
  }
  
  static gboolean
-test_split_next_full (const gchar *pattern,
-                     const gchar *string,
-                     gint         start_position,
-                     ...)
-{
-  GRegex *regex;
-  va_list args;
-  GSList *expected = NULL;
-  GSList *tokens;
-  GSList *l_exp, *l_token;
-  gint token_count;
-  gchar *token;
-  gboolean ret = TRUE;
-  
-  verbose ("splitting \"%s\" against \"%s\" (start: %d) \t",
-          string, pattern, start_position);
-
-  /* The va_list is a NULL-terminated sequence of extected strings. */
-  va_start (args, start_position);
-  while (TRUE)
-   {
-      gchar *expected_string = va_arg (args, gchar *);
-      if (expected_string == NULL)
-        break;
-      else
-        expected = g_slist_prepend (expected, g_strdup (expected_string));
-    }
-  expected = g_slist_reverse (expected);
-  va_end (args);
-
-  regex = g_regex_new (pattern, 0, 0, NULL);
-
-  tokens = NULL;
-  while ((token = g_regex_split_next_full (regex, string, -1,
-                                          start_position, 0, NULL)))
-    {
-      tokens = g_slist_prepend (tokens, token);
-    }
-  tokens = g_slist_reverse (tokens);
-  token_count = g_slist_length (tokens);
-
-  if (token_count != g_slist_length (expected))
-    {
-      g_print ("failed \t(got %d %s, expected %d)\n", token_count,
-              token_count == 1 ? "match" : "matches", 
-              g_slist_length (expected));
-      ret = FALSE;
-      goto exit;
-    }
-
-  l_exp = expected;
-  l_token = tokens;
-  while (l_exp != NULL)
-    {
-      if (!streq(l_exp->data, l_token->data))
-       {
-         g_print ("failed \t(got \"%s\", expected \"%s\")\n",
-                  (gchar *)l_token->data, (gchar *)l_exp->data);
-         ret = FALSE;
-         goto exit;
-       }
-
-      l_exp = g_slist_next (l_exp);
-      l_token = g_slist_next (l_token);
-    }
-
-  verbose ("passed (%d %s)\n", token_count,
-          token_count == 1 ? "token" : "tokens");
-
-exit:
-  g_regex_free (regex);
-  g_slist_foreach (expected, (GFunc)g_free, NULL);
-  g_slist_free (expected);
-  g_slist_foreach (tokens, (GFunc)g_free, NULL);
-  g_slist_free (tokens);
-
-  return ret;
-}
-
-static gboolean
-test_split_next (const gchar *pattern,
-                const gchar *string,
-                ...)
-{
-  GRegex *regex;
-  va_list args;
-  GSList *expected = NULL;
-  GSList *tokens;
-  GSList *l_exp, *l_token;
-  gint token_count;
-  gchar *token;
-  gboolean ret = TRUE;
-  
-  verbose ("splitting \"%s\" against \"%s\" \t", string, pattern);
-
-  /* The va_list is a NULL-terminated sequence of extected strings. */
-  va_start (args, string);
-  while (TRUE)
-   {
-      gchar *expected_string = va_arg (args, gchar *);
-      if (expected_string == NULL)
-        break;
-      else
-        expected = g_slist_prepend (expected, g_strdup (expected_string));
-    }
-  expected = g_slist_reverse (expected);
-  va_end (args);
-
-  regex = g_regex_new (pattern, 0, 0, NULL);
-
-  tokens = NULL;
-  while ((token = g_regex_split_next (regex, string, 0)))
-    {
-      tokens = g_slist_prepend (tokens, token);
-    }
-  tokens = g_slist_reverse (tokens);
-  token_count = g_slist_length (tokens);
-
-  if (token_count != g_slist_length (expected))
-    {
-      g_print ("failed \t(got %d %s, expected %d)\n", token_count,
-              token_count == 1 ? "match" : "matches", 
-              g_slist_length (expected));
-      ret = FALSE;
-      goto exit;
-    }
-
-  l_exp = expected;
-  l_token = tokens;
-  while (l_exp != NULL)
-    {
-      if (!streq(l_exp->data, l_token->data))
-       {
-         g_print ("failed \t(got \"%s\", expected \"%s\")\n",
-                  (gchar *)l_token->data, (gchar *)l_exp->data);
-         ret = FALSE;
-         goto exit;
-       }
-
-      l_exp = g_slist_next (l_exp);
-      l_token = g_slist_next (l_token);
-    }
-
-  verbose ("passed (%d %s)\n", token_count,
-          token_count == 1 ? "token" : "tokens");
-
-exit:
-  g_regex_free (regex);
-  g_slist_foreach (expected, (GFunc)g_free, NULL);
-  g_slist_free (expected);
-  g_slist_foreach (tokens, (GFunc)g_free, NULL);
-  g_slist_free (tokens);
-
-  return ret;
-}
-
-#define TEST_SPLIT_NEXT1(pattern, string, start_position, e1) { \
-  total++; \
-  if (test_split_next_full (pattern, string, start_position, e1, NULL)) \
-    PASS; \
-  else \
-    FAIL; \
-  if (start_position == 0) \
-  { \
-    total++; \
-    if (test_split_next (pattern, string, e1, NULL)) \
-      PASS; \
-    else \
-      FAIL; \
-  } \
-}
-
-#define TEST_SPLIT_NEXT2(pattern, string, start_position, e1, e2) { \
-  total++; \
-  if (test_split_next_full (pattern, string, start_position, e1, e2, NULL)) \
-    PASS; \
-  else \
-    FAIL; \
-  if (start_position == 0) \
-  { \
-    total++; \
-    if (test_split_next (pattern, string, e1, e2, NULL)) \
-      PASS; \
-    else \
-      FAIL; \
-  } \
-}
-
-#define TEST_SPLIT_NEXT3(pattern, string, start_position, e1, e2, e3) { \
-  total++; \
-  if (test_split_next_full (pattern, string, start_position, e1, e2, e3, NULL)) \
-    PASS; \
-  else \
-    FAIL; \
-  if (start_position == 0) \
-  { \
-    total++; \
-    if (test_split_next (pattern, string, e1, e2, e3, NULL)) \
-      PASS; \
-    else \
-      FAIL; \
-  } \
-}
-
-static gboolean
  test_expand (const gchar *pattern,
              const gchar *string,
              const gchar *string_to_expand,
@@ -1544,14 +1045,15 @@ test_expand (const gchar *pattern,
              const gchar *expected)
  {
    GRegex *regex;
+  GMatchInfo *match_info;
    gchar *res;
    
    verbose ("expanding the references in \"%s\" (pattern: \"%s\", string: \"%s\") \t",
            string_to_expand, pattern, string);
  
    regex = g_regex_new (pattern, raw ? G_REGEX_RAW : 0, 0, NULL);
-  g_regex_match (regex, string, 0);
-  res = g_regex_expand_references (regex, string, string_to_expand, NULL);
+  g_regex_match (regex, string, 0, &match_info);
+  res = g_match_info_expand_references (match_info, string_to_expand, NULL);
    if (!streq (res, expected))
      {
        g_print ("failed \t(got \"%s\", expected \"%s\")\n", res, expected);
@@ -1561,6 +1063,7 @@ test_expand (const gchar *pattern,
      }
  
    g_free (res);
+  g_match_info_free (match_info);
    g_regex_free (regex);
  
    verbose ("passed\n");
@@ -1727,6 +1230,7 @@ test_match_all_full (const gchar *pattern,
                      ...)
  {
    GRegex *regex;
+  GMatchInfo *match_info;
    va_list args;
    GSList *expected = NULL;
    GSList *l_exp;
@@ -1757,8 +1261,8 @@ test_match_all_full (const gchar *pattern,
    va_end (args);
  
    regex = g_regex_new (pattern, 0, 0, NULL);
-  match_ok = g_regex_match_all_full (regex, string, string_len,
-                                    start_position, 0, NULL);
+  match_ok = g_regex_match_all_full (regex, string, string_len, start_position,
+                                    0, &match_info, NULL);
  
    if (match_ok && g_slist_length (expected) == 0)
      {
@@ -1773,7 +1277,7 @@ test_match_all_full (const gchar *pattern,
        goto exit;
      }
  
-  match_count = g_regex_get_match_count (regex);
+  match_count = g_match_info_get_match_count (match_info);
    if (match_count != g_slist_length (expected))
      {
        g_print ("failed \t(got %d %s, expected %d)\n", match_count,
@@ -1790,8 +1294,8 @@ test_match_all_full (const gchar *pattern,
        gchar *matched_string;
        Match *exp = l_exp->data;
  
-      matched_string = g_regex_fetch (regex, i, string);
-      g_regex_fetch_pos (regex, i, &start, &end);
+      matched_string = g_match_info_fetch (match_info, i);
+      g_match_info_fetch_pos (match_info, i, &start, &end);
  
        if (!streq(exp->string, matched_string))
         {
@@ -1820,6 +1324,7 @@ exit:
        verbose ("passed (%d %s)\n", match_count, match_count == 1 ? "match" : "matches");
      }
  
+  g_match_info_free (match_info);
    g_regex_free (regex);
    g_slist_foreach (expected, free_match, NULL);
    g_slist_free (expected);
@@ -1833,6 +1338,7 @@ test_match_all (const gchar *pattern,
                  ...)
  {
    GRegex *regex;
+  GMatchInfo *match_info;
    va_list args;
    GSList *expected = NULL;
    GSList *l_exp;
@@ -1862,7 +1368,7 @@ test_match_all (const gchar *pattern,
    va_end (args);
  
    regex = g_regex_new (pattern, 0, 0, NULL);
-  match_ok = g_regex_match_all (regex, string, 0);
+  match_ok = g_regex_match_all (regex, string, 0, &match_info);
  
    if (match_ok && g_slist_length (expected) == 0)
      {
@@ -1877,7 +1383,7 @@ test_match_all (const gchar *pattern,
        goto exit;
      }
  
-  match_count = g_regex_get_match_count (regex);
+  match_count = g_match_info_get_match_count (match_info);
    if (match_count != g_slist_length (expected))
      {
        g_print ("failed \t(got %d %s, expected %d)\n", match_count,
@@ -1894,8 +1400,8 @@ test_match_all (const gchar *pattern,
        gchar *matched_string;
        Match *exp = l_exp->data;
  
-      matched_string = g_regex_fetch (regex, i, string);
-      g_regex_fetch_pos (regex, i, &start, &end);
+      matched_string = g_match_info_fetch (match_info, i);
+      g_match_info_fetch_pos (match_info, i, &start, &end);
  
        if (!streq(exp->string, matched_string))
         {
@@ -1924,6 +1430,7 @@ exit:
        verbose ("passed (%d %s)\n", match_count, match_count == 1 ? "match" : "matches");
      }
  
+  g_match_info_free (match_info);
    g_regex_free (regex);
    g_slist_foreach (expected, free_match, NULL);
    g_slist_free (expected);
@@ -2001,60 +1508,6 @@ exit:
    } \
  }
  
-#define TEST_NULL_MATCH(code) \
-  G_STMT_START \
-    { \
-      GRegex *re = g_regex_new ("a", 0, 0, NULL); \
-      verbose ("trying '" #code "' on a clean regex \t"); \
-      code; \
-      g_regex_free (re); \
-      re = g_regex_new ("a", 0, 0, NULL); \
-      g_regex_match (re, "b", 0); \
-      g_regex_clear (re); \
-      code; \
-      g_regex_free (re); \
-      /* this test always passes if the code does not crash */ \
-      PASS; \
-      verbose ("passed\n"); \
-    } \
-  G_STMT_END
-
-#define TEST_NULL_MATCH_RET(code, expected, type, format) \
-  G_STMT_START \
-    { \
-      type ret; \
-      GRegex *re = g_regex_new ("a", 0, 0, NULL); \
-      verbose ("trying '" #code "' on a clean regex \t"); \
-      ret = code; \
-      g_regex_free (re); \
-      if (ret != expected) \
-        { \
-          g_print ("failed \t(got '" format "', expected '" format \
-                   "', with a newly created regex)\n", ret, expected); \
-          FAIL; \
-        } \
-      else \
-        { \
-          re = g_regex_new ("a", 0, 0, NULL); \
-          g_regex_match (re, "a", 0); \
-          g_regex_clear (re); \
-          ret = code; \
-          g_regex_free (re); \
-          if (ret != expected) \
-            { \
-              g_print ("failed \t(got " format ", expected " format \
-                       ", with a cleared regex)\n", ret, expected); \
-              FAIL; \
-            } \
-          else \
-            { \
-              verbose ("passed\n"); \
-              PASS; \
-            } \
-        } \
-    } \
-  G_STMT_END
-
  int
  main (int argc, char *argv[])
  {
@@ -2078,12 +1531,15 @@ main (int argc, char *argv[])
    /* TEST_NEW(pattern, compile_opts, match_opts) */
    TEST_NEW("", 0, 0);
    TEST_NEW(".*", 0, 0);
+  TEST_NEW(".*", G_REGEX_OPTIMIZE, 0);
    TEST_NEW(".*", G_REGEX_MULTILINE, 0);
    TEST_NEW(".*", G_REGEX_DOTALL, 0);
    TEST_NEW(".*", G_REGEX_DOTALL, G_REGEX_MATCH_NOTBOL);
    TEST_NEW("(123\\d*)[a-zA-Z]+(?P<hello>.*)", 0, 0);
    TEST_NEW("(123\\d*)[a-zA-Z]+(?P<hello>.*)", G_REGEX_CASELESS, 0);
+  TEST_NEW("(123\\d*)[a-zA-Z]+(?P<hello>.*)", G_REGEX_CASELESS | G_REGEX_OPTIMIZE, 0);
    TEST_NEW("(?P<A>x)|(?P<A>y)", G_REGEX_DUPNAMES, 0);
+  TEST_NEW("(?P<A>x)|(?P<A>y)", G_REGEX_DUPNAMES | G_REGEX_OPTIMIZE, 0);
    /* This gives "internal error: code overflow" with pcre 6.0 */
    TEST_NEW("(?i)(?-i)", 0, 0);
  
@@ -2095,14 +1551,6 @@ main (int argc, char *argv[])
    TEST_NEW_FAIL("?", 0);
    TEST_NEW_FAIL("(?P<A>x)|(?P<A>y)", 0);
  
-  /* TEST_COPY(pattern) */
-  TEST_COPY("");
-  TEST_COPY(".*");
-  TEST_COPY("a|b");
-  TEST_COPY("(123\\d*)[a-zA-Z]+(?P<hello>.*)");
-  /* Test if g_regex_copy() works with null regexes. */
-  TEST_COPY("(");
-
    /* TEST_MATCH_SIMPLE(pattern, string, compile_opts, match_opts, expected) */
    TEST_MATCH_SIMPLE("a", "", 0, 0, FALSE);
    TEST_MATCH_SIMPLE("a", "a", 0, 0, TRUE);
@@ -2293,14 +1741,6 @@ main (int argc, char *argv[])
    TEST_PARTIAL("(a)+b", "aa", TRUE);
    TEST_PARTIAL("a?b", "a", TRUE);
  
-  /* TEST_CLEAR(pattern, string, start_position) */
-  TEST_CLEAR("$^", "aaa", 0);
-  TEST_CLEAR("a", "xax", 0);
-  TEST_CLEAR("a", "xax", 1);
-  TEST_CLEAR("a", "xax", 2);
-  TEST_CLEAR("a", "aa", 0);
-  TEST_CLEAR(HSTROKE, HSTROKE, 0);
-
    /* TEST_SUB_PATTERN(pattern, string, start_position, sub_n, expected_sub,
     *                 expected_start, expected_end) */
    TEST_SUB_PATTERN("a", "a", 0, 0, "a", 0, 1);
@@ -2393,26 +1833,6 @@ main (int argc, char *argv[])
    TEST_SPLIT3(" *", "ab c", 0, 3, "a", "b", "c");
    TEST_SPLIT3(" *", "ab c", 0, 4, "a", "b", "c");
  
-  /* TEST_SPLIT_NEXT#(pattern, string, start_position, ...) */
-  TEST_SPLIT_NEXT1(",", "a", 0, "a");
-  TEST_SPLIT_NEXT1("(,)\\s*", "a", 0, "a");
-  TEST_SPLIT_NEXT1(",", "a,b", 2, "b");
-  TEST_SPLIT_NEXT2(",", "a,b", 0, "a", "b");
-  TEST_SPLIT_NEXT2(",", "a,b", 1, "", "b");
-  TEST_SPLIT_NEXT2(",", "a,", 0, "a", "");
-  TEST_SPLIT_NEXT3(",", "a,b,c", 0, "a", "b", "c");
-  TEST_SPLIT_NEXT3(",\\s*", "a,b,c", 0, "a", "b", "c");
-  TEST_SPLIT_NEXT3(",\\s*", "a, b, c", 0, "a", "b", "c");
-  TEST_SPLIT_NEXT3("(,)\\s*", "a,b", 0, "a", ",", "b");
-  TEST_SPLIT_NEXT3("(,)\\s*", "a, b", 0, "a", ",", "b");
-  /* Not matched sub-strings. */
-  TEST_SPLIT_NEXT2("a|(b)", "xay", 0, "x", "y");
-  TEST_SPLIT_NEXT3("a|(b)", "xby", 0, "x", "b", "y");
-  /* Empty matches. */
-  TEST_SPLIT_NEXT2(" *", "ab c", 1, "b", "c");
-  TEST_SPLIT_NEXT3("", "abc", 0, "a", "b", "c");
-  TEST_SPLIT_NEXT3(" *", "ab c", 0, "a", "b", "c");
-
    /* TEST_EXPAND(pattern, string, string_to_expand, raw, expected) */
    TEST_EXPAND("a", "a", "", FALSE, "");
    TEST_EXPAND("a", "a", "\\0", FALSE, "a");
@@ -2486,7 +1906,12 @@ main (int argc, char *argv[])
    TEST_REPLACE("a", "ababa", 2, "A", "abAbA");
    TEST_REPLACE("a", "ababa", 3, "A", "ababA");
    TEST_REPLACE("a", "ababa", 4, "A", "ababA");
+  TEST_REPLACE("a", "ababa", 5, "A", "ababa");
+  TEST_REPLACE("a", "ababa", 6, "A", "ababa");
    TEST_REPLACE("a", "abababa", 2, "A", "abAbAbA");
+  TEST_REPLACE("a", "abab", 0, "A", "AbAb");
+  TEST_REPLACE("a", "baba", 0, "A", "bAbA");
+  TEST_REPLACE("a", "bab", 0, "A", "bAb");
    TEST_REPLACE("$^", "abc", 0, "X", "abc");
    TEST_REPLACE("(.)a", "ciao", 0, "a\\1", "caio");
    TEST_REPLACE("a.", "abc", 0, "\\0\\0", "ababc");
@@ -2509,6 +1934,8 @@ main (int argc, char *argv[])
    TEST_REPLACE_LIT("a", "ababa", 2, "A", "abAbA");
    TEST_REPLACE_LIT("a", "ababa", 3, "A", "ababA");
    TEST_REPLACE_LIT("a", "ababa", 4, "A", "ababA");
+  TEST_REPLACE_LIT("a", "ababa", 5, "A", "ababa");
+  TEST_REPLACE_LIT("a", "ababa", 6, "A", "ababa");
    TEST_REPLACE_LIT("a", "abababa", 2, "A", "abAbAbA");
    TEST_REPLACE_LIT("a", "abcadaa", 0, "A", "AbcAdAA");
    TEST_REPLACE_LIT("$^", "abc", 0, "X", "abc");
@@ -2573,27 +2000,6 @@ main (int argc, char *argv[])
                   "<a><b>", 0, 6, "<a>", 0, 3);
    TEST_MATCH_ALL3("a+", "aaa", -1, 0, "aaa", 0, 3, "aa", 0, 2, "a", 0, 1);
  
-  /* TEST_NULL_MATCH(code) */
-  /* TEST_NULL_MATCH_RET(code, expected, type) */
-  /* Test to see what happens if a function needing GRegexMatch is called
-   * when GRegexMatch is NULL. The result should be the same when the function
-   * is called after g_regex_clear.
-   * "re" is a GRegex, the pattern is "a". */
-  TEST_NULL_MATCH(g_regex_clear (re));
-  TEST_NULL_MATCH(g_regex_get_pattern (re));
-  TEST_NULL_MATCH_RET(g_regex_optimize (re, NULL), TRUE, gboolean, "%d");
-  TEST_NULL_MATCH_RET(g_regex_match (re, "a", 0), TRUE, gboolean, "%d");
-  TEST_NULL_MATCH_RET(g_regex_match (re, "b", 0), FALSE, gboolean, "%d");
-  TEST_NULL_MATCH_RET(g_regex_match_full (re, "a", -1, 0, 0, NULL), TRUE, gboolean, "%d");
-  TEST_NULL_MATCH_RET(g_regex_match_full (re, "a", -1, 1, 0, NULL), FALSE, gboolean, "%d");
-  TEST_NULL_MATCH_RET(g_regex_match_full (re, "b", -1, 0, 0, NULL), FALSE, gboolean, "%d");
-  TEST_NULL_MATCH_RET(g_regex_get_match_count (re), -1, gint, "%d");
-  TEST_NULL_MATCH_RET(g_regex_is_partial_match (re), FALSE, gboolean, "%d");
-  TEST_NULL_MATCH_RET(g_regex_fetch (re, 0, "abc"), NULL, gchar *, "%p");
-  TEST_NULL_MATCH_RET(g_regex_fetch_pos (re, 0, NULL, NULL), FALSE, gboolean, "%d");
-  TEST_NULL_MATCH_RET(g_regex_fetch_all (re, "b"), NULL, gchar **, "%p");
-  TEST_NULL_MATCH_RET(g_regex_get_string_number (re, "X"), -1, gint, "%d");
-
  end: /* if abort_on_fail is TRUE the flow passes to this label. */
    verbose ("\n%u tests passed, %u failed\n", passed, failed);
    return failed;
author	Matthias Clasen <mclasen@redhat.com>
	Mon, 30 Apr 2007 16:02:26 +0000 (16:02 +0000)
committer	Matthias Clasen <matthiasc@src.gnome.org>
	Mon, 30 Apr 2007 16:02:26 +0000 (16:02 +0000)
ChangeLog		patch \| blob \| history
docs/reference/ChangeLog		patch \| blob \| history
docs/reference/glib/glib-sections.txt		patch \| blob \| history
docs/reference/glib/tmpl/gregex.sgml		patch \| blob \| history
glib/glib.symbols		patch \| blob \| history
glib/gregex.c		patch \| blob \| history
glib/gregex.h		patch \| blob \| history
tests/regex-test.c		patch \| blob \| history