Implement SQL99 OVERLAY(). Allows substitution of a substring in a string.

author Thomas G. Lockhart <lockhart@alumni.caltech.edu>

Tue, 11 Jun 2002 15:44:38 +0000 (15:44 +0000)

committer Thomas G. Lockhart <lockhart@alumni.caltech.edu>

Tue, 11 Jun 2002 15:44:38 +0000 (15:44 +0000)
author Thomas G. Lockhart <lockhart@alumni.caltech.edu>
Tue, 11 Jun 2002 15:44:38 +0000 (15:44 +0000)
committer Thomas G. Lockhart <lockhart@alumni.caltech.edu>
Tue, 11 Jun 2002 15:44:38 +0000 (15:44 +0000)
diff --git a/doc/src/sgml/ref/set.sgml b/doc/src/sgml/ref/set.sgml

index 74ce1fc64269a0e8efa2566e8081c31060be216b..1a3cea8ce2463253eaf61826c858d43d3431d652 100644 (file)
--- a/doc/src/sgml/ref/set.sgml
+++ b/doc/src/sgml/ref/set.sgml
@@ -28,8 +28,8 @@ SET [ SESSION | LOCAL ] TIME ZONE { <replaceable class="PARAMETER">timezone</rep
        <listitem>
         <para>
          Specifies that the command takes effect for the current session.
-       (This is the default if neither <option>SESSION</> nor
-       <option>LOCAL</> appears.)
+        (This is the default if neither <option>SESSION</> nor
+        <option>LOCAL</> appears.)
         </para>
        </listitem>
       </varlistentry>
@@ -39,11 +39,11 @@ SET [ SESSION | LOCAL ] TIME ZONE { <replaceable class="PARAMETER">timezone</rep
        <listitem>
         <para>
          Specifies that the command takes effect for only the current
-       transaction.  After <command>COMMIT</> or <command>ROLLBACK</>,
-       the session-level setting takes effect again.  Note that
-       <command>SET LOCAL</> will appear to have no effect if it's
-       executed outside a <command>BEGIN</> block, since the transaction
-       will end immediately.
+        transaction.  After <command>COMMIT</> or <command>ROLLBACK</>,
+        the session-level setting takes effect again.  Note that
+        <command>SET LOCAL</> will appear to have no effect if it's
+        executed outside a <command>BEGIN</> block, since the transaction
+        will end immediately.
         </para>
        </listitem>
       </varlistentry>
@@ -112,7 +112,6 @@ SET [ SESSION | LOCAL ] TIME ZONE { <replaceable class="PARAMETER">timezone</rep
     Here are additional details about a few of the parameters that can be set:
  
     <variablelist>
-
      <varlistentry>
       <term>DATESTYLE</term>
       <listitem>
@@ -126,44 +125,44 @@ SET [ SESSION | LOCAL ] TIME ZONE { <replaceable class="PARAMETER">timezone</rep
         The following are date/time output styles:
  
         <variablelist>
-       <varlistentry>
-        <term>ISO</term>
-        <listitem>
-         <para>
-          Use ISO 8601-style dates and times (<literal>YYYY-MM-DD
-          HH:MM:SS</literal>). This is the default.
+        <varlistentry>
+         <term>ISO</term>
+         <listitem>
+          <para>
+           Use ISO 8601-style dates and times (<literal>YYYY-MM-DD
+            HH:MM:SS</literal>). This is the default.
            </para>
-        </listitem>
-       </varlistentry>
+         </listitem>
+        </varlistentry>
  
          <varlistentry>
-        <term>SQL</term>
-        <listitem>
-         <para>
-          Use Oracle/Ingres-style dates and times. Note that this
-          style has nothing to do with SQL (which mandates ISO 8601
-          style), the naming of this option is a historical accident.
-         </para>
-        </listitem>
-       </varlistentry>
+         <term>SQL</term>
+         <listitem>
+          <para>
+           Use Oracle/Ingres-style dates and times. Note that this
+           style has nothing to do with SQL (which mandates ISO 8601
+           style); the naming of this option is a historical accident.
+          </para>
+         </listitem>
+        </varlistentry>
  
          <varlistentry>
-        <term>PostgreSQL</term>
-        <listitem>
-         <para>
-          Use traditional <productname>PostgreSQL</productname> format.
-         </para>
-        </listitem>
-       </varlistentry>
+         <term>PostgreSQL</term>
+         <listitem>
+          <para>
+           Use traditional <productname>PostgreSQL</productname> format.
+          </para>
+         </listitem>
+        </varlistentry>
  
          <varlistentry>
-        <term>German</term>
-        <listitem>
-         <para>
-          Use <literal>dd.mm.yyyy</literal> for numeric date representations.
-         </para>
-        </listitem>
-       </varlistentry>
+         <term>German</term>
+         <listitem>
+          <para>
+           Use <literal>dd.mm.yyyy</literal> for numeric date representations.
+          </para>
+         </listitem>
+        </varlistentry>
         </variablelist>
        </para>
  
@@ -173,24 +172,24 @@ SET [ SESSION | LOCAL ] TIME ZONE { <replaceable class="PARAMETER">timezone</rep
         and the preferred interpretation of ambiguous date input.
  
         <variablelist>
-       <varlistentry>
-        <term>European</term>
-        <listitem>
-         <para>
-          Use <literal>dd/mm/yyyy</literal> for numeric date representations.
-         </para>
-        </listitem>
-       </varlistentry>
+        <varlistentry>
+         <term>European</term>
+         <listitem>
+          <para>
+           Use <literal>dd/mm/yyyy</literal> for numeric date representations.
+          </para>
+         </listitem>
+        </varlistentry>
  
          <varlistentry>
-        <term>NonEuropean</term>
-        <term>US</term>
-        <listitem>
-         <para>
-          Use <literal>mm/dd/yyyy</literal> for numeric date representations.
-         </para>
-        </listitem>
-       </varlistentry>
+         <term>NonEuropean</term>
+         <term>US</term>
+         <listitem>
+          <para>
+           Use <literal>mm/dd/yyyy</literal> for numeric date representations.
+          </para>
+         </listitem>
+        </varlistentry>
         </variablelist>
        </para>
  
@@ -214,23 +213,23 @@ SET [ SESSION | LOCAL ] TIME ZONE { <replaceable class="PARAMETER">timezone</rep
         in addition to the normal methods of setting it via <command>SET</> or
         a configuration-file entry:
         <simplelist>
-       <member>
-        Setting the postmaster's <envar>PGDATESTYLE</envar> environment
-        variable.  (This will be overridden by any of the other methods.)
-       </member>
-       <member>
-        Running postmaster using the option <option>-o -e</option> to
-        select the <literal>European</literal> conventions.
-        (This overrides environment variables and configuration-file
-        entries.)
-       </member>
-       <member>
-        Setting the client's <envar>PGDATESTYLE</envar> environment variable.
-        If PGDATESTYLE is set in the frontend environment of a client
-        based on libpq, libpq will automatically set DATESTYLE to the
-        value of PGDATESTYLE during connection start-up.  This is
-        equivalent to a manually issued <command>SET</>.
-       </member>
+        <member>
+         Setting the postmaster's <envar>PGDATESTYLE</envar> environment
+         variable.  (This will be overridden by any of the other methods.)
+        </member>
+        <member>
+         Running postmaster using the option <option>-o -e</option> to
+         set dates to the <literal>European</literal> convention.
+         (This overrides environment variables and configuration-file
+         entries.)
+        </member>
+        <member>
+         Setting the client's <envar>PGDATESTYLE</envar> environment variable.
+         If PGDATESTYLE is set in the frontend environment of a client
+         based on libpq, libpq will automatically set DATESTYLE to the
+         value of PGDATESTYLE during connection start-up.  This is
+         equivalent to a manually issued <command>SET DATESTYLE</>.
+        </member>
         </simplelist>
        </para>
  
@@ -250,50 +249,49 @@ SET [ SESSION | LOCAL ] TIME ZONE { <replaceable class="PARAMETER">timezone</rep
        <term>SEED</term>
        <listitem>
         <para>
-       Sets the internal seed for the random number generator.
+       Sets the internal seed for the random number generator.
         
-       <variablelist>
-        <varlistentry>
-         <term><replaceable class="parameter">value</replaceable></term>
-         <listitem>
-          <para>
-           The value for the seed to be used by the
-           <function>random</function> function. Allowed
-           values are floating-point numbers between 0 and 1, which
-           are then multiplied by 2<superscript>31</>-1.
-          </para>
-         </listitem>
-        </varlistentry>
-       </variablelist>
-       </para>
+       <variablelist>
+        <varlistentry>
+         <term><replaceable class="parameter">value</replaceable></term>
+         <listitem>
+          <para>
+           The value for the seed to be used by the
+           <function>random</function> function. Allowed
+           values are floating-point numbers between 0 and 1, which
+           are then multiplied by 2<superscript>31</>-1.
+          </para>
+         </listitem>
+        </varlistentry>
+       </variablelist>
+      </para>
  
-       <para>
-        The seed can also be set by invoking the
-        <function>setseed</function> SQL function:
+      <para>
+       The seed can also be set by invoking the
+       <function>setseed</function> SQL function:
  
-        <programlisting>
+       <programlisting>
  SELECT setseed(<replaceable>value</replaceable>);
-        </programlisting>
-       </para>
-
-      </listitem>
-     </varlistentry>
+       </programlisting>
+      </para>
+     </listitem>
+    </varlistentry>
  
-     <varlistentry>
-      <term>SERVER_ENCODING</term>
-      <listitem>
-       <para>
-       Shows the server-side multibyte encoding.  (At present, this
-       parameter can be shown but not set, because the encoding is
-       determined at initdb time.)
-       </para>
-      </listitem>
-     </varlistentry>
+    <varlistentry>
+     <term>SERVER_ENCODING</term>
+     <listitem>
+      <para>
+       Shows the server-side multibyte encoding.  (At present, this
+       parameter can be shown but not set, because the encoding is
+       determined at initdb time.)
+      </para>
+     </listitem>
+    </varlistentry>
  
-     <varlistentry>
-      <term>TIME ZONE</term>
-      <term>TIMEZONE</term>
-      <listitem>
+    <varlistentry>
+     <term>TIME ZONE</term>
+     <term>TIMEZONE</term>
+     <listitem>
        <para>
         Sets the default time zone for your session. Arguments can be
         an SQL time interval constant, an integer or double precision
@@ -301,92 +299,88 @@ SELECT setseed(<replaceable>value</replaceable>);
         by the host operating system.
        </para>
  
-       <para>
-       The available time zone names depend on your operating
-       system. For example, on Linux
-       <filename>/usr/share/zoneinfo</filename> contains the database
-       of time zones.
-       </para>
-       <para>
-       Here are some typical values for time zone names:
+      <para>
+       Here are some typical values for time zone settings:
  
         <variablelist>
-        <varlistentry>
-         <term>'PST8PDT'</term>
-         <listitem>
-          <para>
-           Set the time zone for California.
-          </para>
-         </listitem>
-        </varlistentry>
-        <varlistentry>
-         <term>'Portugal'</term>
-         <listitem>
-          <para>
-           Set the time zone for Portugal.
-          </para>
-         </listitem>
-        </varlistentry>
-        <varlistentry>
-         <term>'Europe/Rome'</term>
-         <listitem>
-          <para>
-           Set the time zone for Italy.
-          </para>
-         </listitem>
-        </varlistentry>
-       </variablelist>
-       </para>
+        <varlistentry>
+         <term>'PST8PDT'</term>
+         <listitem>
+          <para>
+           Set the time zone for Berkeley, California.
+          </para>
+         </listitem>
+        </varlistentry>
+        <varlistentry>
+         <term>'Portugal'</term>
+         <listitem>
+          <para>
+           Set the time zone for Portugal.
+          </para>
+         </listitem>
+        </varlistentry>
+        <varlistentry>
+         <term>'Europe/Rome'</term>
+         <listitem>
+          <para>
+           Set the time zone for Italy.
+          </para>
+         </listitem>
+        </varlistentry>
+        <varlistentry>
+         <term>7</term>
+         <listitem>
+          <para>
+           Set the time zone to 7 hours offset west from GMT (equivalent
+           to PDT).
+          </para>
+         </listitem>
+        </varlistentry>
+        <varlistentry>
+         <term>INTERVAL '08:00' HOUR TO MINUTE</term>
+         <listitem>
+          <para>
+           Set the time zone to 8 hours offset west from GMT (equivalent
+           to PST).
+          </para>
+         </listitem>
+        </varlistentry>
+        <varlistentry>
+         <term>LOCAL</term>
+         <term>DEFAULT</term>
+         <listitem>
+          <para>
+           Set the time zone to your local time zone (the one that
+           your operating system defaults to).
+          </para>
+         </listitem>
+        </varlistentry>
+       </variablelist>
+      </para>
  
-       <para>
-       In addition to time zone names, <productname>PostgreSQL</productname>
-       accepts these other methods of specifying a time zone:
+      <para>
+       The available time zone names depend on your operating
+       system. For example, on Linux
+       <filename>/usr/share/zoneinfo</filename> contains the database
+       of time zones; the names of the files in that directory can be
+       used as parameters to this command.
+      </para>
  
-       <variablelist>
-        <varlistentry>
-         <term>7</term>
-         <listitem>
-          <para>
-           Set the time zone to 7 hours offset west from GMT (equivalent
-          to PDT).
-          </para>
-         </listitem>
-        </varlistentry>
-        <varlistentry>
-         <term>INTERVAL '08:00' HOUR TO MINUTE</term>
-         <listitem>
-          <para>
-           Set the time zone to 8 hours offset west from GMT (equivalent
-          to PST).
-          </para>
-         </listitem>
-        </varlistentry>
-        <varlistentry>
-         <term>LOCAL</term>
-          <term>DEFAULT</term>
-         <listitem>
-          <para>
-           Set the time zone to your local time zone (the one that
-           your operating system defaults to).
-          </para>
-         </listitem>
-        </varlistentry>
-       </variablelist>
-       </para>
-       <para>
-       If an invalid time zone name is specified, the time zone
-       becomes GMT (on most systems anyway).
-       </para>
-       <para>
-        If the <envar>PGTZ</envar> environment variable is set in the frontend
-       environment of a client based on libpq, libpq will automatically
-       set TIMEZONE to the value of <envar>PGTZ</envar> during connection start-up.
-       </para>
-      </listitem>
-     </varlistentry>
+      <para>
+       If an invalid time zone is specified, the time zone
+       becomes GMT (on most systems anyway).
+      </para>
  
-    </variablelist>
-   </para>
+      <para>
+       If the <envar>PGTZ</envar> environment variable is set in the frontend
+       environment of a client based on libpq, libpq will automatically
+       <command>SET TIMEZONE</command> to the value of
+       <envar>PGTZ</envar> during connection start-up. 
+      </para>
+     </listitem>
+    </varlistentry>
+   </variablelist>
+  </para>
  
    <para>
     Use <xref linkend="SQL-SHOW" endterm="SQL-SHOW-title"> to show the
diff --git a/src/backend/parser/gram.y b/src/backend/parser/gram.y

index 22d76860a24b3d6a088d3dd617de298d78e73028..2e5127b78d6e9017ba827d305f5cee13029c027d 100644 (file)
--- a/src/backend/parser/gram.y
+++ b/src/backend/parser/gram.y
@@ -227,10 +227,10 @@ static void doNegateFloat(Value *v);
  %type <node>   join_outer, join_qual
  %type <jtype>  join_type
  
-%type <list>   extract_list, position_list
+%type <list>   extract_list, overlay_list, position_list
  %type <list>   substr_list, trim_list
  %type <ival>   opt_interval
-%type <node>   substr_from, substr_for
+%type <node>   overlay_placing, substr_from, substr_for
  
  %type <boolean>        opt_binary, opt_using, opt_instead, opt_cursor
  %type <boolean>        opt_with_copy, index_opt_unique, opt_verbose, opt_full
@@ -336,7 +336,7 @@ static void doNegateFloat(Value *v);
         FALSE_P, FETCH, FLOAT_P, FOR, FORCE, FOREIGN, FORWARD, FREEZE, FROM,
         FULL, FUNCTION,
  
-       GLOBAL, GRANT, GROUP_P,
+       GET, GLOBAL, GRANT, GROUP_P,
         HANDLER, HAVING, HOUR_P,
  
         ILIKE, IMMEDIATE, IMMUTABLE, IMPLICIT, IN_P, INCREMENT, INDEX, INHERITS,
@@ -356,16 +356,16 @@ static void doNegateFloat(Value *v);
         NUMERIC,
  
         OF, OFF, OFFSET, OIDS, OLD, ON, ONLY, OPERATOR, OPTION, OR, ORDER,
-       OUT_P, OUTER_P, OVERLAPS, OWNER,
+       OUT_P, OUTER_P, OVERLAPS, OVERLAY, OWNER,
  
-       PARTIAL, PASSWORD, PATH_P, PENDANT, POSITION, PRECISION, PRIMARY,
+       PARTIAL, PASSWORD, PATH_P, PENDANT, PLACING, POSITION, PRECISION, PRIMARY,
         PRIOR, PRIVILEGES, PROCEDURE, PROCEDURAL,
  
         READ, REAL, REFERENCES, REINDEX, RELATIVE, RENAME, REPLACE, RESET,
         RESTRICT, RETURNS, REVOKE, RIGHT, ROLLBACK, ROW, RULE,
  
         SCHEMA, SCROLL, SECOND_P, SECURITY, SELECT, SEQUENCE, SERIALIZABLE,
-       SESSION, SESSION_USER, SET, SETOF, SHARE, SHOW, SMALLINT, SOME,
+       SESSION, SESSION_USER, SET, SETOF, SHARE, SHOW, SIMILAR, SMALLINT, SOME,
         STABLE, START, STATEMENT, STATISTICS, STDIN, STDOUT, STORAGE, STRICT,
         SUBSTRING, SYSID,
  
@@ -402,7 +402,7 @@ static void doNegateFloat(Value *v);
  %right         NOT
  %right         '='
  %nonassoc      '<' '>'
-%nonassoc      LIKE ILIKE
+%nonassoc      LIKE ILIKE SIMILAR
  %nonassoc      ESCAPE
  %nonassoc      OVERLAPS
  %nonassoc      BETWEEN
@@ -420,6 +420,7 @@ static void doNegateFloat(Value *v);
  %right         UMINUS
  %left          '[' ']'
  %left          '(' ')'
+%left          COLLATE
  %left          TYPECAST
  %left          '.'
  %%
@@ -2139,6 +2140,14 @@ DefineStmt:  CREATE AGGREGATE func_name definition
                                         n->definition = $4;
                                         $$ = (Node *)n;
                                 }
+               | CREATE CHARACTER SET opt_as any_name GET definition opt_collate
+                               {
+                                       DefineStmt *n = makeNode(DefineStmt);
+                                       n->defType = CHARACTER;
+                                       n->defnames = $5;
+                                       n->definition = $7;
+                                       $$ = (Node *)n;
+                               }
                 ;
  
  definition:  '(' def_list ')'                          { $$ = $2; }
@@ -4978,9 +4987,18 @@ qual_all_Op:  all_Op
   * it's factored out just to eliminate redundant coding.
   */
  a_expr:  c_expr
-                               {       $$ = $1;  }
+                               {       $$ = $1; }
                 | a_expr TYPECAST Typename
                                 {       $$ = makeTypeCast($1, $3); }
+               | a_expr COLLATE ColId
+                               {
+                                       FuncCall *n = makeNode(FuncCall);
+                                       n->funcname = SystemFuncName($3);
+                                       n->args = makeList1($1);
+                                       n->agg_star = FALSE;
+                                       n->agg_distinct = FALSE;
+                                       $$ = (Node *) n;
+                               }
                 | a_expr AT TIME ZONE c_expr
                                 {
                                         FuncCall *n = makeNode(FuncCall);
@@ -5088,6 +5106,30 @@ a_expr:  c_expr
                                         n->agg_distinct = FALSE;
                                         $$ = (Node *) makeSimpleA_Expr(OP, "!~~*", $1, (Node *) n);
                                 }
+
+               | a_expr SIMILAR TO a_expr                              %prec SIMILAR
+                               {       $$ = (Node *) makeSimpleA_Expr(OP, "~", $1, $4); }
+               | a_expr SIMILAR TO a_expr ESCAPE a_expr
+                               {
+                                       FuncCall *n = makeNode(FuncCall);
+                                       n->funcname = SystemFuncName("like_escape");
+                                       n->args = makeList2($4, $6);
+                                       n->agg_star = FALSE;
+                                       n->agg_distinct = FALSE;
+                                       $$ = (Node *) makeSimpleA_Expr(OP, "~", $1, (Node *) n);
+                               }
+               | a_expr NOT SIMILAR TO a_expr                  %prec SIMILAR
+                               {       $$ = (Node *) makeSimpleA_Expr(OP, "!~", $1, $5); }
+               | a_expr NOT SIMILAR TO a_expr ESCAPE a_expr
+                               {
+                                       FuncCall *n = makeNode(FuncCall);
+                                       n->funcname = SystemFuncName("like_escape");
+                                       n->args = makeList2($5, $7);
+                                       n->agg_star = FALSE;
+                                       n->agg_distinct = FALSE;
+                                       $$ = (Node *) makeSimpleA_Expr(OP, "!~", $1, (Node *) n);
+                               }
+
                 /* NullTest clause
                  * Define SQL92-style Null test clause.
                  * Allow two forms described in the standard:
@@ -5568,6 +5610,20 @@ c_expr:  columnref
                                         n->agg_distinct = FALSE;
                                         $$ = (Node *)n;
                                 }
+               | OVERLAY '(' overlay_list ')'
+                               {
+                                       /* overlay(A PLACING B FROM C FOR D) becomes the call overlay(A, B, C, D);
+                                        * SQL99 defines it as substring(A, 1, C-1) || B || substring(A, C+D).
+                                        * overlay(A PLACING B FROM C) becomes the call overlay(A, B, C);
+                                        * SQL99 defines it as substring(A, 1, C-1) || B || substring(A, C+char_length(B))
+                                        */
+                                       FuncCall *n = makeNode(FuncCall);
+                                       n->funcname = SystemFuncName("overlay");
+                                       n->args = $3;
+                                       n->agg_star = FALSE;
+                                       n->agg_distinct = FALSE;
+                                       $$ = (Node *)n;
+                               }
                 | POSITION '(' position_list ')'
                                 {
                                         /* position(A in B) is converted to position(B, A) */
@@ -5706,6 +5762,25 @@ extract_arg:  IDENT                                              { $$ = $1; }
                 | SCONST                                                { $$ = $1; }
                 ;
  
+/* OVERLAY() arguments, built as the list (string, placing, from [, for])
+ * SQL99 defines two forms of the OVERLAY() function:
+ * o overlay(text placing text from int for int)
+ * o overlay(text placing text from int) - FOR omitted, list has three items
+ */
+overlay_list:  a_expr overlay_placing substr_from substr_for
+                               {
+                                       $$ = makeList4($1, $2, $3, $4);
+                               }
+               | a_expr overlay_placing substr_from
+                               {
+                                       $$ = makeList3($1, $2, $3);
+                               }
+               ;
+
+overlay_placing:  PLACING a_expr
+                               {       $$ = $2; }
+               ;
+
  /* position_list uses b_expr not a_expr to avoid conflict with general IN */
  
  position_list:  b_expr IN_P b_expr
@@ -6259,6 +6334,7 @@ unreserved_keyword:
                 | FORCE
                 | FORWARD
                 | FUNCTION
+               | GET
                 | GLOBAL
                 | HANDLER
                 | HOUR_P
@@ -6404,6 +6480,7 @@ col_name_keyword:
                 | NONE
                 | NULLIF
                 | NUMERIC
+               | OVERLAY
                 | POSITION
                 | REAL
                 | SETOF
@@ -6423,7 +6500,7 @@ col_name_keyword:
   *
   * Do not include POSITION, SUBSTRING, etc here since they have explicit
   * productions in a_expr to support the goofy SQL9x argument syntax.
- *  - thomas 2000-11-28
+ * - thomas 2000-11-28
   */
  func_name_keyword:
                   AUTHORIZATION
@@ -6445,6 +6522,7 @@ func_name_keyword:
                 | OUTER_P
                 | OVERLAPS
                 | RIGHT
+               | SIMILAR
                 | VERBOSE
                 ;
  
diff --git a/src/backend/parser/keywords.c b/src/backend/parser/keywords.c

index dfe8908b464e2be6367baa75816ebce56704a743..7398408051ac311477faa76a61d466d19f217585 100644 (file)
--- a/src/backend/parser/keywords.c
+++ b/src/backend/parser/keywords.c
@@ -129,6 +129,7 @@ static const ScanKeyword ScanKeywords[] = {
         {"from", FROM},
         {"full", FULL},
         {"function", FUNCTION},
+       {"get", GET},
         {"global", GLOBAL},
         {"grant", GRANT},
         {"group", GROUP_P},
@@ -211,11 +212,13 @@ static const ScanKeyword ScanKeywords[] = {
         {"out", OUT_P},
         {"outer", OUTER_P},
         {"overlaps", OVERLAPS},
+       {"overlay", OVERLAY},
         {"owner", OWNER},
         {"partial", PARTIAL},
         {"password", PASSWORD},
         {"path", PATH_P},
         {"pendant", PENDANT},
+       {"placing", PLACING},
         {"position", POSITION},
         {"precision", PRECISION},
         {"primary", PRIMARY},
@@ -251,6 +254,7 @@ static const ScanKeyword ScanKeywords[] = {
         {"setof", SETOF},
         {"share", SHARE},
         {"show", SHOW},
+       {"similar", SIMILAR},
         {"smallint", SMALLINT},
         {"some", SOME},
         {"stable", STABLE},
diff --git a/src/backend/parser/scan.l b/src/backend/parser/scan.l

index 829dccc8e091d8037ea71c88579eb33f0efd7765..c67f5744f3d41d6dc1f667e8403e1b7e38cb9771 100644 (file)
--- a/src/backend/parser/scan.l
+++ b/src/backend/parser/scan.l
@@ -92,14 +92,14 @@ unsigned char unescape_single_char(unsigned char c);
   * We use exclusive states for quoted strings, extended comments,
   * and to eliminate parsing troubles for numeric strings.
   * Exclusive states:
- *  <xbit> bit string literal
+ *  <xb> bit string literal
   *  <xc> extended C-style comments - thomas 1997-07-12
   *  <xd> delimited identifiers (double-quoted identifiers) - thomas 1997-10-27
   *  <xh> hexadecimal numeric string - thomas 1997-11-16
   *  <xq> quoted strings - thomas 1997-07-30
   */
  
-%x xbit
+%x xb
  %x xc
  %x xd
  %x xh
@@ -107,10 +107,10 @@ unsigned char unescape_single_char(unsigned char c);
  
  /* Bit string
   */
-xbitstart              [bB]{quote}
-xbitstop               {quote}
-xbitinside             [^']*
-xbitcat                        {quote}{whitespace_with_newline}{quote}
+xbstart                [bB]{quote}
+xbstop         {quote}
+xbinside               [^']*
+xbcat                  {quote}{whitespace_with_newline}{quote}
  
  /* Hexadecimal number
   */
@@ -285,13 +285,13 @@ other                     .
  
  <xc><<EOF>>            { yyerror("unterminated /* comment"); }
  
-{xbitstart}            {
+{xbstart}              {
                                         token_start = yytext;
-                                       BEGIN(xbit);
+                                       BEGIN(xb);
                                         startlit();
                                         addlitchar('b');
                                 }
-<xbit>{xbitstop}       {
+<xb>{xbstop}   {
                                         BEGIN(INITIAL);
                                         if (literalbuf[strspn(literalbuf + 1, "01") + 1] != '\0')
                                                 yyerror("invalid bit string input");
@@ -299,14 +299,14 @@ other                     .
                                         return BITCONST;
                                 }
  <xh>{xhinside} |
-<xbit>{xbitinside}     {
+<xb>{xbinside} {
                                         addlit(yytext, yyleng);
                                 }
  <xh>{xhcat}            |
-<xbit>{xbitcat}                {
+<xb>{xbcat}            {
                                         /* ignore */
                                 }
-<xbit><<EOF>>          { yyerror("unterminated bit string literal"); }
+<xb><<EOF>>            { yyerror("unterminated bit string literal"); }
  
  {xhstart}              {
                                         token_start = yytext;
diff --git a/src/backend/regex/regcomp.c b/src/backend/regex/regcomp.c

index bea464bd2ae88aa2b8a8bd0d8f27e27d9e1ff68d..d6f7b26fa1a4cb77579963312a8b768664dee2c8 100644 (file)
--- a/src/backend/regex/regcomp.c
+++ b/src/backend/regex/regcomp.c
@@ -174,9 +174,10 @@ static int never = 0;                      /* for use in asserts; shuts lint up */
  
  /*
   * regcomp - interface for parser and compilation
+ * returns 0 on success, otherwise a REG_xxx error code
   */
-int                                                            /* 0 success, otherwise REG_something */
-pg95_regcomp(regex_t *preg, const char *pattern, int cflags)
+int
+pg_regcomp(regex_t *preg, const char *pattern, int cflags)
  {
         struct parse pa;
         struct re_guts *g;
@@ -224,7 +225,6 @@ pg95_regcomp(regex_t *preg, const char *pattern, int cflags)
                 (void) pg_mb2wchar((unsigned char *) pattern, wcp);
                 len = pg_wchar_strlen(wcp);
  #else
-
                 len = strlen((char *) pattern);
  #endif
         }
@@ -305,7 +305,7 @@ pg95_regcomp(regex_t *preg, const char *pattern, int cflags)
  
         /* win or lose, we're done */
         if (p->error != 0)                      /* lose */
-               pg95_regfree(preg);
+               pg_regfree(preg);
         return p->error;
  }
  
diff --git a/src/backend/regex/regerror.c b/src/backend/regex/regerror.c

index 3fa00946aa414e2307991f96680e5ec3cf553d43..fb12cba3048ee78dda4d4f425438702133abf230 100644 (file)
--- a/src/backend/regex/regerror.c
+++ b/src/backend/regex/regerror.c
@@ -117,8 +117,8 @@ static struct rerr
   */
  /* ARGSUSED */
  size_t
-pg95_regerror(int errcode, const regex_t *preg,
-                         char *errbuf, size_t errbuf_size)
+pg_regerror(int errcode, const regex_t *preg,
+                       char *errbuf, size_t errbuf_size)
  {
         struct rerr *r;
         size_t          len;
diff --git a/src/backend/regex/regexec.c b/src/backend/regex/regexec.c

index 476773044138393e42f671896496dd5e574cbdd6..06459ef1dbcaefec6d33d44df2ba88ebb6b85031 100644 (file)
--- a/src/backend/regex/regexec.c
+++ b/src/backend/regex/regexec.c
@@ -149,8 +149,8 @@ do { \
   * when choosing which matcher to call.
   */
  int                                                            /* 0 success, REG_NOMATCH failure */
-pg95_regexec(const regex_t *preg, const char *string, size_t nmatch,
-                        regmatch_t *pmatch, int eflags)
+pg_regexec(const regex_t *preg, const char *string, size_t nmatch,
+                  regmatch_t *pmatch, int eflags)
  {
         struct re_guts *g = preg->re_g;
  
diff --git a/src/backend/regex/regfree.c b/src/backend/regex/regfree.c

index 87e0c99ef96690afcb1bb3b6b9da293216fa4add..5672fcf240f4f9f7358f26f3d53d4ddefe36d041 100644 (file)
--- a/src/backend/regex/regfree.c
+++ b/src/backend/regex/regfree.c
@@ -49,7 +49,7 @@
   * regfree - free everything
   */
  void
-pg95_regfree(regex_t *preg)
+pg_regfree(regex_t *preg)
  {
         struct re_guts *g;
  
diff --git a/src/backend/regex/retest.c b/src/backend/regex/retest.c

index aa49acff30dd0a624c6a1561d686183a6015fe97..f0643362a4700a3d8d069d258dbacb65d08bfb70 100644 (file)
--- a/src/backend/regex/retest.c
+++ b/src/backend/regex/retest.c
@@ -22,7 +22,7 @@ main()
         if (p)
                 *p = '\0';
  
-       sts = pg95_regcomp(&re, buf, 1);
+       sts = pg_regcomp(&re, buf, 1);
         printf("regcomp: parses \"%s\" and returns %d\n", buf, sts);
         for (;;)
         {
@@ -33,7 +33,7 @@ main()
                 if (p)
                         *p = '\0';
  
-               sts = pg95_regexec(&re, buf, 0, 0, 0);
+               sts = pg_regexec(&re, buf, 0, 0, 0);
                 printf("regexec: returns %d\n", sts);
         }
  }
diff --git a/src/backend/utils/adt/regexp.c b/src/backend/utils/adt/regexp.c

index 7203e1a284fa619ce7b526bbf8e745942c11861f..50bfc68f926393def2fd3cdeece6ab2320522d16 100644 (file)
--- a/src/backend/utils/adt/regexp.c
+++ b/src/backend/utils/adt/regexp.c
@@ -19,7 +19,7 @@
   *
   *             agc - incorporated Keith Bostic's Berkeley regex code into
   *             the tree for all ports. To distinguish this regex code from any that
- *             is existent on a platform, I've prepended the string "pg95_" to
+ *             is existent on a platform, I've prepended the string "pg_" to
   *             the functions regcomp, regerror, regexec and regfree.
   *             Fixed a bug that was originally a typo by me, where `i' was used
   *             instead of `oldest' when compiling regular expressions - benign
@@ -53,11 +53,13 @@ struct cached_re_str
  static int     rec = 0;                        /* # of cached re's */
  static struct cached_re_str rev[MAX_CACHED_RES];               /* cached re's */
  static unsigned long lru;              /* system lru tag */
+static int pg_lastre = 0;
  
  /* attempt to compile `re' as an re, then match it against text */
  /* cflags - flag to regcomp indicates case sensitivity */
  static bool
-RE_compile_and_execute(text *text_re, char *text, int cflags)
+RE_compile_and_execute(text *text_re, char *text, int cflags,
+                                          int nmatch, regmatch_t *pmatch)
  {
         char       *re;
         int                     oldest;
@@ -68,9 +70,27 @@ RE_compile_and_execute(text *text_re, char *text, int cflags)
         re = DatumGetCString(DirectFunctionCall1(textout,
                                                                                          PointerGetDatum(text_re)));
  
+       if ((i = pg_lastre) < rec)
+       {
+               if (rev[i].cre_s)
+               {
+                       if (strcmp(rev[i].cre_s, re) == 0 &&
+                               rev[i].cre_type == cflags)
+                       {
+                               rev[i].cre_lru = ++lru;
+                               pfree(re);
+                               return (pg_regexec(&rev[i].cre_re,
+                                                                  text, nmatch,
+                                                                  pmatch, 0) == 0);
+                       }
+               }
+       }
+
         /* find a previously compiled regular expression */
         for (i = 0; i < rec; i++)
         {
+               if (i == pg_lastre) continue;
+
                 if (rev[i].cre_s)
                 {
                         if (strcmp(rev[i].cre_s, re) == 0 &&
@@ -78,9 +98,9 @@ RE_compile_and_execute(text *text_re, char *text, int cflags)
                         {
                                 rev[i].cre_lru = ++lru;
                                 pfree(re);
-                               return (pg95_regexec(&rev[i].cre_re,
-                                                                        text, 0,
-                                                                        (regmatch_t *) NULL, 0) == 0);
+                               return (pg_regexec(&rev[i].cre_re,
+                                                                  text, nmatch,
+                                                                  pmatch, 0) == 0);
                         }
                 }
         }
@@ -107,7 +127,7 @@ RE_compile_and_execute(text *text_re, char *text, int cflags)
                         if (rev[i].cre_lru > lru)
                                 lru = rev[i].cre_lru;
                 }
-               pg95_regfree(&rev[oldest].cre_re);
+               pg_regfree(&rev[oldest].cre_re);
  
                 /*
                  * use malloc/free for the cre_s field because the storage has to
@@ -118,7 +138,7 @@ RE_compile_and_execute(text *text_re, char *text, int cflags)
         }
  
         /* compile the re */
-       regcomp_result = pg95_regcomp(&rev[oldest].cre_re, re, cflags);
+       regcomp_result = pg_regcomp(&rev[oldest].cre_re, re, cflags);
         if (regcomp_result == 0)
         {
                 /*
@@ -130,16 +150,16 @@ RE_compile_and_execute(text *text_re, char *text, int cflags)
                 rev[oldest].cre_type = cflags;
                 pfree(re);
                 /* agc - fixed an old typo here */
-               return (pg95_regexec(&rev[oldest].cre_re, text, 0,
-                                                        (regmatch_t *) NULL, 0) == 0);
+               return (pg_regexec(&rev[oldest].cre_re, text,
+                                                  nmatch, pmatch, 0) == 0);
         }
         else
         {
                 char            errMsg[1000];
  
                 /* re didn't compile */
-               pg95_regerror(regcomp_result, &rev[oldest].cre_re, errMsg,
-                                         sizeof(errMsg));
+               pg_regerror(regcomp_result, &rev[oldest].cre_re, errMsg,
+                                       sizeof(errMsg));
                 elog(ERROR, "Invalid regular expression: %s", errMsg);
         }
  
@@ -167,7 +187,7 @@ fixedlen_regexeq(char *s, text *p, int charlen, int cflags)
         memcpy(sterm, s, charlen);
         sterm[charlen] = '\0';
  
-       result = RE_compile_and_execute(p, sterm, cflags);
+       result = RE_compile_and_execute(p, sterm, cflags, 0, NULL);
  
         pfree(sterm);
  
@@ -230,7 +250,7 @@ textregexne(PG_FUNCTION_ARGS)
  
  /*
   *     routines that use the regexp stuff, but ignore the case.
- *     for this, we use the REG_ICASE flag to pg95_regcomp
+ *     for this, we use the REG_ICASE flag to pg_regcomp
   */
  
  
@@ -281,3 +301,54 @@ nameicregexne(PG_FUNCTION_ARGS)
                                                                          strlen(NameStr(*n)),
                                                                          REG_ICASE | REG_EXTENDED));
  }
+
+
+/* textregexsubstr()
+ * Return the portion of a string matched by a regular expression.
+ *
+ * Arguments (via fmgr): 0 = source text, 1 = pattern text.
+ * The pattern is compiled with REG_EXTENDED.
+ * Returns the matched substring as text, or SQL NULL when the pattern
+ * does not match.
+ */
+Datum
+textregexsubstr(PG_FUNCTION_ARGS)
+{
+       text       *s = PG_GETARG_TEXT_P(0);
+       text       *p = PG_GETARG_TEXT_P(1);
+       char       *sterm;
+       int                     len;
+       bool            match;
+       int                     nmatch = 1;
+       regmatch_t      pmatch;
+
+       /* RE_compile_and_execute() takes a C string: make a terminated copy */
+       len = VARSIZE(s) - VARHDRSZ;
+       sterm = (char *) palloc(len + 1);
+       memcpy(sterm, VARDATA(s), len);
+       sterm[len] = '\0';
+
+       /*
+        * We need the match info back from the pattern match to be able to
+        * actually extract the substring.  It seems to be adequate to pass
+        * in a structure to return only one result.
+        */
+       match = RE_compile_and_execute(p, sterm, REG_EXTENDED, nmatch, &pmatch);
+       pfree(sterm);
+
+       /*
+        * Match: return the substring matching the pattern.  The start offset
+        * gets +1 before being handed to text_substr(); the length is the
+        * distance between the end and start offsets of the match.
+        */
+       if (match)
+       {
+               PG_RETURN_DATUM(DirectFunctionCall3(text_substr,
+                                                                       PointerGetDatum(s),
+                                                                       Int32GetDatum(pmatch.rm_so + 1),
+                                                                       Int32GetDatum(pmatch.rm_eo - pmatch.rm_so)));
+       }
+
+       /* no match: the result is NULL rather than a zero-length string */
+       PG_RETURN_NULL();
+}
diff --git a/src/include/catalog/catversion.h b/src/include/catalog/catversion.h

index b70d950e75d7e39f8a9307f977088283b0177a85..a15341aee95f10630bae0f2755b2f383107ffc1e 100644 (file)
--- a/src/include/catalog/catversion.h
+++ b/src/include/catalog/catversion.h
@@ -53,6 +53,6 @@
   */
  
  /*                                                     yyyymmddN */
-#define CATALOG_VERSION_NO     200205221
+#define CATALOG_VERSION_NO     200206111
  
  #endif
diff --git a/src/include/catalog/pg_proc.h b/src/include/catalog/pg_proc.h

index 06a78ad82405bc8438b5ab00d9cfccba435589ff..576d6204fc4d10ed292316d2e10393cfddd79a2e 100644 (file)
--- a/src/include/catalog/pg_proc.h
+++ b/src/include/catalog/pg_proc.h
@@ -1679,7 +1679,7 @@ DESCR("less-equal-greater");
  DATA(insert OID = 1359 (  timestamptz     PGNSP PGUID 12 f f f t f i 2 1184 "1082 1266" 100 0 0 100  datetimetz_timestamptz - _null_ ));
  DESCR("convert date and time with time zone to timestamp with time zone");
  
-DATA(insert OID = 1364 (  time                          PGNSP PGUID 14 f f f t f i 1 1083 "702" 100 0 0 100  "select time(cast($1 as timestamp without time zone))" - _null_ ));
+DATA(insert OID = 1364 (  time                    PGNSP PGUID 14 f f f t f i 1 1083 "702" 100 0 0 100  "select time(cast($1 as timestamp without time zone))" - _null_ ));
  DESCR("convert abstime to time");
  
  DATA(insert OID = 1367 (  character_length     PGNSP PGUID 12 f f f t f i 1    23 "1042" 100 0 0 100  bpcharlen - _null_ ));
@@ -1764,6 +1764,11 @@ DESCR("current schema name");
  DATA(insert OID = 1403 (  current_schemas      PGNSP PGUID 12 f f f t f s 0  1003 "0" 100 0 0 100      current_schemas - _null_ ));
  DESCR("current schema search list");
  
+DATA(insert OID = 1404 (  overlay                      PGNSP PGUID 14 f f f t f i 4 25 "25 25 23 23" 100 0 0 100  "select substring($1, 1, ($3 - 1)) || $2 || substring($1, ($3 + $4))" - _null_ ));
+DESCR("substitute portion of string");
+DATA(insert OID = 1405 (  overlay                      PGNSP PGUID 14 f f f t f i 3 25 "25 25 23" 100 0 0 100  "select substring($1, 1, ($3 - 1)) || $2 || substring($1, ($3 + char_length($2)))" - _null_ ));
+DESCR("substitute portion of string");
+
  DATA(insert OID = 1406 (  isvertical           PGNSP PGUID 12 f f f t f i 2    16 "600 600" 100 0 0 100  point_vert - _null_ ));
  DESCR("vertically aligned?");
  DATA(insert OID = 1407 (  ishorizontal         PGNSP PGUID 12 f f f t f i 2    16 "600 600" 100 0 0 100  point_horiz - _null_ ));
@@ -2871,6 +2876,11 @@ DESCR("add");
  DATA(insert OID = 2072 (  date_mi_interval     PGNSP PGUID 14 f f f t f i 2 1114 "1082 1186" 100 0 0 100  "select cast($1 as timestamp without time zone) - $2;" - _null_ ));
  DESCR("subtract");
  
+DATA(insert OID = 2073 (  substring                    PGNSP PGUID 12 f f f t f i 2 25 "25 25" 100 0 0 100     textregexsubstr - _null_ ));
+DESCR("extracts text matching regular expression");
+DATA(insert OID = 2074 (  substring                    PGNSP PGUID 14 f f f t f i 3 25 "25 25 25" 100 0 0 100  "select substring($1, like_escape($2, $3))" - _null_ ));
+DESCR("extracts text matching regular expression with escape argument");
+
  /* Aggregates (moved here from pg_aggregate for 7.3) */
  
  DATA(insert OID = 2100 (  avg                          PGNSP PGUID 12 t f f f f i 1 1700 "20" 100 0 0 100  aggregate_dummy - _null_ ));
diff --git a/src/include/regex/regex.h b/src/include/regex/regex.h

index 09f966e1bf26ae1c712dfcb2f9713d53f6486130..dd8e0da171bd61491535dbf9ab4921e07d1c70d7 100644 (file)
--- a/src/include/regex/regex.h
+++ b/src/include/regex/regex.h
@@ -53,7 +53,7 @@ typedef struct
         const pg_wchar *re_endp;        /* end pointer for REG_PEND */
         struct re_guts *re_g;           /* none of your business :-) */
  #ifdef MULTIBYTE
-       pg_wchar   *patsave;            /* mee too :-) */
+       pg_wchar   *patsave;            /* me too :-) */
  #endif
  
  } regex_t;
@@ -102,12 +102,12 @@ typedef struct
  #define REG_LARGE              01000   /* force large representation */
  #define REG_BACKR              02000   /* force use of backref code */
  
-extern int     pg95_regcomp(regex_t *preg, const char *pattern, int cflags);
-extern size_t pg95_regerror(int errcode, const regex_t *preg,
-                         char *errbuf, size_t errbuf_size);
-extern int pg95_regexec(const regex_t *preg, const char *string,
-                        size_t nmatch,
-                        regmatch_t *pmatch, int eflags);
-extern void pg95_regfree(regex_t *preg);
+extern int     pg_regcomp(regex_t *preg, const char *pattern, int cflags);
+extern size_t pg_regerror(int errcode, const regex_t *preg,
+                                                 char *errbuf, size_t errbuf_size);
+extern int pg_regexec(const regex_t *preg, const char *string,
+                                         size_t nmatch,
+                                         regmatch_t *pmatch, int eflags);
+extern void pg_regfree(regex_t *preg);
  
  #endif   /* !_REGEX_H_ */
diff --git a/src/include/utils/builtins.h b/src/include/utils/builtins.h

index 30b6d6f51866369682b1af0c8cdb6d18c8d4f79b..dda30a46a536212cd72cc4d4592c4e2d4fb077a3 100644 (file)
--- a/src/include/utils/builtins.h
+++ b/src/include/utils/builtins.h
@@ -327,6 +327,7 @@ extern Datum nameicregexeq(PG_FUNCTION_ARGS);
  extern Datum nameicregexne(PG_FUNCTION_ARGS);
  extern Datum texticregexeq(PG_FUNCTION_ARGS);
  extern Datum texticregexne(PG_FUNCTION_ARGS);
+extern Datum textregexsubstr(PG_FUNCTION_ARGS);
  
  /* regproc.c */
  extern Datum regprocin(PG_FUNCTION_ARGS);
diff --git a/src/test/regress/expected/strings.out b/src/test/regress/expected/strings.out

index ebfe8eeb66328d0014fc1981638dba5698a84a34..680a76c0bd5696f9c170389fee7a15a80d7fe2fc 100644 (file)
--- a/src/test/regress/expected/strings.out
+++ b/src/test/regress/expected/strings.out
@@ -3,6 +3,7 @@
  -- Test various data entry syntaxes.
  --
  -- SQL92 string continuation syntax
+-- E021-03 character string literals
  SELECT 'first line'
  ' - next line'
         ' - third line'
@@ -20,6 +21,7 @@ SELECT 'first line'
  ERROR:  parser: parse error at or near "' - third line'"
  --
  -- test conversions between various string types
+-- E021-10 implicit casting among the character data types
  --
  SELECT CAST(f1 AS text) AS "text(char)" FROM CHAR_TBL;
   text(char) 
@@ -93,7 +95,9 @@ SELECT CAST(name 'namefield' AS varchar) AS "varchar(name)";
  
  --
  -- test SQL92 string functions
+-- E### and T### are feature reference numbers from SQL99
  --
+-- E021-09 trim function
  SELECT TRIM(BOTH FROM '  bunch o blanks  ') = 'bunch o blanks' AS "bunch o blanks";
   bunch o blanks 
  ----------------
@@ -118,6 +122,7 @@ SELECT TRIM(BOTH 'x' FROM 'xxxxxsome Xsxxxxx') = 'some Xs' AS "some Xs";
   t
  (1 row)
  
+-- E021-06 substring expression
  SELECT SUBSTRING('1234567890' FROM 3) = '34567890' AS "34567890";
   34567890 
  ----------
@@ -130,6 +135,47 @@ SELECT SUBSTRING('1234567890' FROM 4 FOR 3) = '456' AS "456";
   t
  (1 row)
  
+-- T581 regular expression substring
+SELECT SUBSTRING('abcdefg' FROM '(b|f).*(d)' FOR '#') AS "bcd";
+ bcd 
+-----
+ bcd
+(1 row)
+
+-- No match should return NULL
+SELECT SUBSTRING('abcdefg' FROM '(1|2|3)' FOR '#') IS NULL AS "True";
+ True 
+------
+ t
+(1 row)
+
+-- Null inputs should return NULL
+SELECT SUBSTRING('abcdefg' FROM '(b|c)' FOR NULL) IS NULL AS "True";
+ True 
+------
+ t
+(1 row)
+
+SELECT SUBSTRING(NULL FROM '(b|c)' FOR '#') IS NULL AS "True";
+ True 
+------
+ t
+(1 row)
+
+SELECT SUBSTRING('abcdefg' FROM NULL FOR '#') IS NULL AS "True";
+ True 
+------
+ t
+(1 row)
+
+-- PostgreSQL extention to allow omitting the escape character
+SELECT SUBSTRING('abcdefg' FROM '(c|d).e') AS "cde";
+ cde 
+-----
+ cde
+(1 row)
+
+-- E021-11 position expression
  SELECT POSITION('4' IN '1234567890') = '4' AS "4";
   4 
  ---
@@ -142,11 +188,37 @@ SELECT POSITION(5 IN '1234567890') = '5' AS "5";
   t
  (1 row)
  
+-- T312 character overlay function
+SELECT OVERLAY('abcdef' PLACING '45' FROM 4) AS "abc45f";
+ abc45f 
+--------
+ abc45f
+(1 row)
+
+SELECT OVERLAY('yabadoo' PLACING 'daba' FROM 5) AS "yabadaba";
+ yabadaba 
+----------
+ yabadaba
+(1 row)
+
+SELECT OVERLAY('yabadoo' PLACING 'daba' FROM 5 FOR 0) AS "yabadabadoo";
+ yabadabadoo 
+-------------
+ yabadabadoo
+(1 row)
+
+SELECT OVERLAY('babosa' PLACING 'ubb' FROM 2 FOR 4) AS "bubba";
+ bubba 
+-------
+ bubba
+(1 row)
+
  --
  -- test LIKE
  -- Be sure to form every test as a LIKE/NOT LIKE pair.
  --
  -- simplest examples
+-- E061-04 like predicate
  SELECT 'hawkeye' LIKE 'h%' AS "true";
   true 
  ------
@@ -257,6 +329,7 @@ SELECT 'indio' NOT LIKE 'ind_o' ESCAPE '$' AS "false";
  (1 row)
  
  -- escape character
+-- E061-05 like predicate with escape clause
  SELECT 'h%' LIKE 'h#%' ESCAPE '#' AS "true";
   true 
  ------
@@ -469,6 +542,7 @@ SELECT 'Hawkeye' NOT ILIKE 'h%' AS "false";
  --
  -- test implicit type conversion
  --
+-- E021-07 character concatenation
  SELECT 'unknown' || ' and unknown' AS "Concat unknown types";
   Concat unknown types 
  ----------------------
diff --git a/src/test/regress/sql/strings.sql b/src/test/regress/sql/strings.sql

index b7f214f4d89c30c573cdb7c13a9149f302f5d5d9..3127d0ebffcc5e932c72d0da9e1c26cb77f15b93 100644 (file)
--- a/src/test/regress/sql/strings.sql
+++ b/src/test/regress/sql/strings.sql
@@ -4,6 +4,7 @@
  --
  
  -- SQL92 string continuation syntax
+-- E021-03 character string literals
  SELECT 'first line'
  ' - next line'
         ' - third line'
@@ -17,6 +18,7 @@ SELECT 'first line'
  
  --
  -- test conversions between various string types
+-- E021-10 implicit casting among the character data types
  --
  
  SELECT CAST(f1 AS text) AS "text(char)" FROM CHAR_TBL;
@@ -41,8 +43,10 @@ SELECT CAST(name 'namefield' AS varchar) AS "varchar(name)";
  
  --
  -- test SQL92 string functions
+-- E### and T### are feature reference numbers from SQL99
  --
  
+-- E021-09 trim function
  SELECT TRIM(BOTH FROM '  bunch o blanks  ') = 'bunch o blanks' AS "bunch o blanks";
  
  SELECT TRIM(LEADING FROM '  bunch o blanks  ') = 'bunch o blanks  ' AS "bunch o blanks  ";
@@ -51,20 +55,46 @@ SELECT TRIM(TRAILING FROM '  bunch o blanks  ') = '  bunch o blanks' AS "  bunch
  
  SELECT TRIM(BOTH 'x' FROM 'xxxxxsome Xsxxxxx') = 'some Xs' AS "some Xs";
  
+-- E021-06 substring expression
  SELECT SUBSTRING('1234567890' FROM 3) = '34567890' AS "34567890";
  
  SELECT SUBSTRING('1234567890' FROM 4 FOR 3) = '456' AS "456";
  
+-- T581 regular expression substring
+SELECT SUBSTRING('abcdefg' FROM '(b|f).*(d)' FOR '#') AS "bcd";
+
+-- No match should return NULL
+SELECT SUBSTRING('abcdefg' FROM '(1|2|3)' FOR '#') IS NULL AS "True";
+
+-- Null inputs should return NULL
+SELECT SUBSTRING('abcdefg' FROM '(b|c)' FOR NULL) IS NULL AS "True";
+SELECT SUBSTRING(NULL FROM '(b|c)' FOR '#') IS NULL AS "True";
+SELECT SUBSTRING('abcdefg' FROM NULL FOR '#') IS NULL AS "True";
+
+-- PostgreSQL extention to allow omitting the escape character
+SELECT SUBSTRING('abcdefg' FROM '(c|d).e') AS "cde";
+
+-- E021-11 position expression
  SELECT POSITION('4' IN '1234567890') = '4' AS "4";
  
  SELECT POSITION(5 IN '1234567890') = '5' AS "5";
  
+-- T312 character overlay function
+SELECT OVERLAY('abcdef' PLACING '45' FROM 4) AS "abc45f";
+
+SELECT OVERLAY('yabadoo' PLACING 'daba' FROM 5) AS "yabadaba";
+
+SELECT OVERLAY('yabadoo' PLACING 'daba' FROM 5 FOR 0) AS "yabadabadoo";
+
+SELECT OVERLAY('babosa' PLACING 'ubb' FROM 2 FOR 4) AS "bubba";
+
  --
  -- test LIKE
  -- Be sure to form every test as a LIKE/NOT LIKE pair.
  --
  
  -- simplest examples
+-- E061-04 like predicate
  SELECT 'hawkeye' LIKE 'h%' AS "true";
  SELECT 'hawkeye' NOT LIKE 'h%' AS "false";
  
@@ -94,6 +124,7 @@ SELECT 'indio' LIKE 'ind_o' ESCAPE '$' AS "true";
  SELECT 'indio' NOT LIKE 'ind_o' ESCAPE '$' AS "false";
  
  -- escape character
+-- E061-05 like predicate with escape clause
  SELECT 'h%' LIKE 'h#%' ESCAPE '#' AS "true";
  SELECT 'h%' NOT LIKE 'h#%' ESCAPE '#' AS "false";
  
@@ -156,6 +187,7 @@ SELECT 'Hawkeye' NOT ILIKE 'h%' AS "false";
  -- test implicit type conversion
  --
  
+-- E021-07 character concatenation
  SELECT 'unknown' || ' and unknown' AS "Concat unknown types";
  
  SELECT text 'text' || ' and unknown' AS "Concat text to unknown type";
@@ -165,4 +197,3 @@ SELECT char(20) 'characters' || 'and text' AS "Concat char to unknown type";
  SELECT text 'text' || char(20) ' and characters' AS "Concat text to char";
  
  SELECT text 'text' || varchar ' and varchar' AS "Concat text to varchar";
-
author	Thomas G. Lockhart <lockhart@alumni.caltech.edu>
	Tue, 11 Jun 2002 15:44:38 +0000 (15:44 +0000)
committer	Thomas G. Lockhart <lockhart@alumni.caltech.edu>
	Tue, 11 Jun 2002 15:44:38 +0000 (15:44 +0000)
doc/src/sgml/ref/set.sgml		patch \| blob \| blame \| history
src/backend/parser/gram.y		patch \| blob \| blame \| history
src/backend/parser/keywords.c		patch \| blob \| blame \| history
src/backend/parser/scan.l		patch \| blob \| blame \| history
src/backend/regex/regcomp.c		patch \| blob \| blame \| history
src/backend/regex/regerror.c		patch \| blob \| blame \| history
src/backend/regex/regexec.c		patch \| blob \| blame \| history
src/backend/regex/regfree.c		patch \| blob \| blame \| history
src/backend/regex/retest.c		patch \| blob \| blame \| history
src/backend/utils/adt/regexp.c		patch \| blob \| blame \| history
src/include/catalog/catversion.h		patch \| blob \| blame \| history
src/include/catalog/pg_proc.h		patch \| blob \| blame \| history
src/include/regex/regex.h		patch \| blob \| blame \| history
src/include/utils/builtins.h		patch \| blob \| blame \| history
src/test/regress/expected/strings.out		patch \| blob \| blame \| history
src/test/regress/sql/strings.sql		patch \| blob \| blame \| history