Don't downcase non-ASCII identifier characters in multi-byte encodings.

author Andrew Dunstan <andrew@dunslane.net>

Sat, 8 Jun 2013 14:20:37 +0000 (10:20 -0400)

committer Andrew Dunstan <andrew@dunslane.net>

Sat, 8 Jun 2013 14:20:37 +0000 (10:20 -0400)
author Andrew Dunstan <andrew@dunslane.net>
Sat, 8 Jun 2013 14:20:37 +0000 (10:20 -0400)
committer Andrew Dunstan <andrew@dunslane.net>
Sat, 8 Jun 2013 14:20:37 +0000 (10:20 -0400)
diff --git a/src/backend/parser/scansup.c b/src/backend/parser/scansup.c

index f1bb4370fe99873b92daf2181a5406c450afb652..c440b7b51e97b8658d2d99fee37e2e1733873cf6 100644 (file)
--- a/src/backend/parser/scansup.c
+++ b/src/backend/parser/scansup.c
@@ -130,8 +130,10 @@ downcase_truncate_identifier(const char *ident, int len, bool warn)
  {
         char       *result;
         int                     i;
+       bool        enc_is_single_byte;
  
         result = palloc(len + 1);
+       enc_is_single_byte = pg_database_encoding_max_length() == 1;
  
         /*
          * SQL99 specifies Unicode-aware case normalization, which we don't yet
@@ -139,8 +141,8 @@ downcase_truncate_identifier(const char *ident, int len, bool warn)
          * locale-aware translation.  However, there are some locales where this
          * is not right either (eg, Turkish may do strange things with 'i' and
          * 'I').  Our current compromise is to use tolower() for characters with
-        * the high bit set, and use an ASCII-only downcasing for 7-bit
-        * characters.
+        * the high bit set, as long as they aren't part of a multi-byte character,
+        * and use an ASCII-only downcasing for 7-bit characters.
          */
         for (i = 0; i < len; i++)
         {
@@ -148,7 +150,7 @@ downcase_truncate_identifier(const char *ident, int len, bool warn)
  
                 if (ch >= 'A' && ch <= 'Z')
                         ch += 'a' - 'A';
-               else if (IS_HIGHBIT_SET(ch) && isupper(ch))
+               else if (enc_is_single_byte && IS_HIGHBIT_SET(ch) && isupper(ch))
                         ch = tolower(ch);
                 result[i] = (char) ch;
         }
author	Andrew Dunstan <andrew@dunslane.net>
	Sat, 8 Jun 2013 14:20:37 +0000 (10:20 -0400)
committer	Andrew Dunstan <andrew@dunslane.net>
	Sat, 8 Jun 2013 14:20:37 +0000 (10:20 -0400)