Fix documentation of regular expression character-entry escapes.

author Tom Lane

Wed, 16 Sep 2015 18:50:12 +0000 (14:50 -0400)

committer Tom Lane

Wed, 16 Sep 2015 18:50:38 +0000 (14:50 -0400)
author Tom Lane
Wed, 16 Sep 2015 18:50:12 +0000 (14:50 -0400)
committer Tom Lane
Wed, 16 Sep 2015 18:50:38 +0000 (14:50 -0400)
diff --git a/doc/src/sgml/func.sgml b/doc/src/sgml/func.sgml

index 1dbc7d6410197273018954fe8ca80c6378adf9b5..ab92e243d1c1b9ae63f3b9a70f43dbb9cf7cf8ae 100644 (file)
--- a/doc/src/sgml/func.sgml
+++ b/doc/src/sgml/func.sgml
@@ -4636,7 +4636,7 @@ SELECT foo FROM regexp_split_to_table('the quick brown fox', E'\\s*') AS foo;
          \e 
          the character whose collating-sequence name
         is ESC,
-       or failing that, the character with octal value 033 
+       or failing that, the character with octal value 033 
         
  
         
@@ -4662,15 +4662,17 @@ SELECT foo FROM regexp_split_to_table('the quick brown fox', E'\\s*') AS foo;
         
          \uwxyz 
          (where wxyz is exactly four hexadecimal digits)
-       the UTF16 (Unicode, 16-bit) character U+wxyz
-       in the local byte ordering 
+       the character whose hexadecimal value is
+       0xwxyz
+       
         
  
         
          \Ustuvwxyz 
          (where stuvwxyz is exactly eight hexadecimal
         digits)
-       reserved for a hypothetical Unicode extension to 32 bits
+       the character whose hexadecimal value is
+       0xstuvwxyz
         
         
  
@@ -4719,6 +4721,17 @@ SELECT foo FROM regexp_split_to_table('the quick brown fox', E'\\s*') AS foo;
      Octal digits are 0-7.
     
  
+   
+    Numeric character-entry escapes specifying values outside the ASCII range
+    (0-127) have meanings dependent on the database encoding.  When the
+    encoding is UTF-8, escape values are equivalent to Unicode code points,
+    for example \u1234 means the character U+1234.
+    For other multibyte encodings, character-entry escapes usually just
+    specify the concatenation of the byte values for the character.  If the
+    escape value does not correspond to any legal character in the database
+    encoding, no error will be raised, but it will never match any data.
+   
+
     
      The character-entry escapes are always taken as ordinary characters.
      For example, \135 is ] in ASCII, but
author	Tom Lane
	Wed, 16 Sep 2015 18:50:12 +0000 (14:50 -0400)
committer	Tom Lane
	Wed, 16 Sep 2015 18:50:38 +0000 (14:50 -0400)