Improve context display for failures during COPY IN, as recently ...

author Tom Lane <tgl@sss.pgh.pa.us>

Mon, 29 Sep 2003 22:06:40 +0000 (22:06 +0000)

committer Tom Lane <tgl@sss.pgh.pa.us>

Mon, 29 Sep 2003 22:06:40 +0000 (22:06 +0000)
author Tom Lane <tgl@sss.pgh.pa.us>
Mon, 29 Sep 2003 22:06:40 +0000 (22:06 +0000)
committer Tom Lane <tgl@sss.pgh.pa.us>
Mon, 29 Sep 2003 22:06:40 +0000 (22:06 +0000)
diff --git a/src/backend/commands/copy.c b/src/backend/commands/copy.c

index faf982167bb1adf4a479b0c123543ee5c6addac7..aac9f3c1d4fa850baf1a2a2b913dfec628583a1e 100644 (file)
--- a/src/backend/commands/copy.c
+++ b/src/backend/commands/copy.c
@@ -8,7 +8,7 @@
   *
   *
   * IDENTIFICATION
- *   $Header: /cvsroot/pgsql/src/backend/commands/copy.c,v 1.211 2003/09/25 06:57:58 petere Exp $
+ *   $Header: /cvsroot/pgsql/src/backend/commands/copy.c,v 1.212 2003/09/29 22:06:40 tgl Exp $
   *
   *-------------------------------------------------------------------------
   */
@@ -59,22 +59,21 @@
  typedef enum CopyDest
  {
     COPY_FILE,                  /* to/from file */
-   COPY_OLD_FE,                /* to/from frontend (old protocol) */
-   COPY_NEW_FE                 /* to/from frontend (new protocol) */
+   COPY_OLD_FE,                /* to/from frontend (2.0 protocol) */
+   COPY_NEW_FE                 /* to/from frontend (3.0 protocol) */
  } CopyDest;
  
  /*
- * Represents the type of data returned by CopyReadAttribute()
+ * State indicator showing what stopped CopyReadAttribute()
   */
  typedef enum CopyReadResult
  {
     NORMAL_ATTR,
-   END_OF_LINE,
-   END_OF_FILE
+   END_OF_LINE
  } CopyReadResult;
  
  /*
- * Represents the end-of-line terminator of the input
+ * Represents the end-of-line terminator type of the input
   */
  typedef enum EolType
  {
@@ -85,17 +84,6 @@ typedef enum EolType
  } EolType;
  
  
-/* non-export function prototypes */
-static void CopyTo(Relation rel, List *attnumlist, bool binary, bool oids,
-      char *delim, char *null_print);
-static void CopyFrom(Relation rel, List *attnumlist, bool binary, bool oids,
-        char *delim, char *null_print);
-static char *CopyReadAttribute(const char *delim, CopyReadResult *result);
-static Datum CopyReadBinaryAttribute(int column_no, FmgrInfo *flinfo,
-                       Oid typelem, bool *isnull);
-static void CopyAttributeOut(char *string, char *delim);
-static List *CopyGetAttnums(Relation rel, List *attnamelist);
-
  static const char BinarySignature[11] = "PGCOPY\n\377\r\n\0";
  
  /*
@@ -103,11 +91,18 @@ static const char BinarySignature[11] = "PGCOPY\n\377\r\n\0";
   * never been reentrant...
   */
  static CopyDest copy_dest;
-static FILE *copy_file;            /* if copy_dest == COPY_FILE */
-static StringInfo copy_msgbuf; /* if copy_dest == COPY_NEW_FE */
+static FILE *copy_file;            /* used if copy_dest == COPY_FILE */
+static StringInfo copy_msgbuf; /* used if copy_dest == COPY_NEW_FE */
  static bool fe_eof;                /* true if detected end of copy data */
  static EolType eol_type;       /* EOL type of input */
+static int client_encoding;    /* remote side's character encoding */
+static int server_encoding;    /* local encoding */
+
+/* these are just for error messages, see copy_in_error_callback */
+static bool copy_binary;       /* is it a binary copy? */
+static const char *copy_relname;   /* table name for error messages */
  static int copy_lineno;        /* line number for error messages */
+static const char *copy_attname;   /* current att for error messages */
  
  
  /*
@@ -117,16 +112,34 @@ static int    copy_lineno;        /* line number for error messages */
   * grow to a suitable size, and then we will avoid palloc/pfree overhead
   * for subsequent attributes.  Note that CopyReadAttribute returns a pointer
   * to attribute_buf's data buffer!
- * encoding, if needed, can be set once at the start of the copy operation.
   */
  static StringInfoData attribute_buf;
  
-static int client_encoding;
-static int server_encoding;
-
  /*
- * Internal communications functions
+ * Similarly, line_buf holds the whole input line being processed (its
+ * cursor field points to the next character to be read by CopyReadAttribute).
+ * The input cycle is first to read the whole line into line_buf, convert it
+ * to server encoding, and then extract individual attribute fields into
+ * attribute_buf.  (We used to have CopyReadAttribute read the input source
+ * directly, but that caused a lot of encoding issues and unnecessary logic
+ * complexity).
   */
+static StringInfoData line_buf;
+static bool line_buf_converted;
+
+/* non-export function prototypes */
+static void CopyTo(Relation rel, List *attnumlist, bool binary, bool oids,
+      char *delim, char *null_print);
+static void CopyFrom(Relation rel, List *attnumlist, bool binary, bool oids,
+        char *delim, char *null_print);
+static bool CopyReadLine(void);
+static char *CopyReadAttribute(const char *delim, CopyReadResult *result);
+static Datum CopyReadBinaryAttribute(int column_no, FmgrInfo *flinfo,
+                       Oid typelem, bool *isnull);
+static void CopyAttributeOut(char *string, char *delim);
+static List *CopyGetAttnums(Relation rel, List *attnamelist);
+
+/* Internal communications functions */
  static void SendCopyBegin(bool binary, int natts);
  static void ReceiveCopyBegin(bool binary, int natts);
  static void SendCopyEnd(bool binary);
@@ -145,6 +158,7 @@ static int32 CopyGetInt32(void);
  static void CopySendInt16(int16 val);
  static int16 CopyGetInt16(void);
  
+
  /*
   * Send copy start/stop messages for frontend copies.  These have changed
   * in past protocol redesigns.
@@ -780,6 +794,8 @@ DoCopy(const CopyStmt *stmt)
      * Set up variables to avoid per-attribute overhead.
      */
     initStringInfo(&attribute_buf);
+   initStringInfo(&line_buf);
+   line_buf_converted = false;
  
     client_encoding = pg_get_client_encoding();
     server_encoding = GetDatabaseEncoding();
@@ -907,6 +923,7 @@ DoCopy(const CopyStmt *stmt)
     else if (IsUnderPostmaster && !is_from)
         SendCopyEnd(binary);
     pfree(attribute_buf.data);
+   pfree(line_buf.data);
  
     /*
      * Close the relation.  If reading, we can release the AccessShareLock
@@ -1111,7 +1128,55 @@ CopyTo(Relation rel, List *attnumlist, bool binary, bool oids,
  static void
  copy_in_error_callback(void *arg)
  {
-   errcontext("COPY FROM, line %d", copy_lineno);
+#define MAX_COPY_DATA_DISPLAY 100
+
+   if (copy_binary)
+   {
+       /* can't usefully display the data */
+       if (copy_attname)
+           errcontext("COPY %s, line %d, column %s",
+                      copy_relname, copy_lineno, copy_attname);
+       else
+           errcontext("COPY %s, line %d", copy_relname, copy_lineno);
+   }
+   else
+   {
+       if (copy_attname)
+       {
+           /* error is relevant to a particular column */
+           errcontext("COPY %s, line %d, column %s: \"%.*s%s\"",
+                      copy_relname, copy_lineno, copy_attname,
+                      MAX_COPY_DATA_DISPLAY, attribute_buf.data,
+                      (attribute_buf.len > MAX_COPY_DATA_DISPLAY) ? "..." : "");
+       }
+       else
+       {
+           /* error is relevant to a particular line */
+           if (!line_buf_converted)
+           {
+               /* didn't convert the encoding yet... */
+               if (client_encoding != server_encoding)
+               {
+                   char       *cvt;
+
+                   cvt = (char *) pg_client_to_server((unsigned char *) line_buf.data,
+                                                      line_buf.len);
+                   if (cvt != line_buf.data)
+                   {
+                       /* transfer converted data back to line_buf */
+                       line_buf.len = 0;
+                       line_buf.data[0] = '\0';
+                       appendBinaryStringInfo(&line_buf, cvt, strlen(cvt));
+                   }
+               }
+               line_buf_converted = true;
+           }
+           errcontext("COPY %s, line %d: \"%.*s%s\"",
+                      copy_relname, copy_lineno,
+                      MAX_COPY_DATA_DISPLAY, line_buf.data,
+                      (line_buf.len > MAX_COPY_DATA_DISPLAY) ? "..." : "");
+       }
+   }
  }
  
  
@@ -1327,7 +1392,10 @@ CopyFrom(Relation rel, List *attnumlist, bool binary, bool oids,
     /* Initialize static variables */
     fe_eof = false;
     eol_type = EOL_UNKNOWN;
+   copy_binary = binary;
+   copy_relname = RelationGetRelationName(rel);
     copy_lineno = 0;
+   copy_attname = NULL;
  
     /* Set up callback to identify error line number */
     errcontext.callback = copy_in_error_callback;
@@ -1359,29 +1427,36 @@ CopyFrom(Relation rel, List *attnumlist, bool binary, bool oids,
             CopyReadResult result = NORMAL_ATTR;
             char       *string;
  
+           /* Actually read the line into memory here */
+           done = CopyReadLine();
+
+           /*
+            * EOF at start of line means we're done.  If we see EOF
+            * after some characters, we act as though it was newline
+            * followed by EOF, ie, process the line and then exit loop
+            * on next iteration.
+            */
+           if (done && line_buf.len == 0)
+               break;
+
             if (file_has_oids)
             {
                 string = CopyReadAttribute(delim, &result);
  
-               if (result == END_OF_FILE && *string == '\0')
-               {
-                   /* EOF at start of line: all is well */
-                   done = true;
-                   break;
-               }
-
                 if (strcmp(string, null_print) == 0)
                     ereport(ERROR,
                             (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
                              errmsg("null OID in COPY data")));
                 else
                 {
+                   copy_attname = "oid";
                     loaded_oid = DatumGetObjectId(DirectFunctionCall1(oidin,
                                                CStringGetDatum(string)));
                     if (loaded_oid == InvalidOid)
                         ereport(ERROR,
                                 (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
                                  errmsg("invalid OID in COPY data")));
+                   copy_attname = NULL;
                 }
             }
  
@@ -1394,7 +1469,7 @@ CopyFrom(Relation rel, List *attnumlist, bool binary, bool oids,
                 int         m = attnum - 1;
  
                 /*
-                * If prior attr on this line was ended by newline or EOF,
+                * If prior attr on this line was ended by newline,
                  * complain.
                  */
                 if (result != NORMAL_ATTR)
@@ -1405,68 +1480,33 @@ CopyFrom(Relation rel, List *attnumlist, bool binary, bool oids,
  
                 string = CopyReadAttribute(delim, &result);
  
-               if (result == END_OF_FILE && *string == '\0' &&
-                   cur == attnumlist && !file_has_oids)
-               {
-                   /* EOF at start of line: all is well */
-                   done = true;
-                   break;      /* out of per-attr loop */
-               }
-
                 if (strcmp(string, null_print) == 0)
                 {
                     /* we read an SQL NULL, no need to do anything */
                 }
                 else
                 {
+                   copy_attname = NameStr(attr[m]->attname);
                     values[m] = FunctionCall3(&in_functions[m],
                                               CStringGetDatum(string),
                                            ObjectIdGetDatum(elements[m]),
                                       Int32GetDatum(attr[m]->atttypmod));
                     nulls[m] = ' ';
+                   copy_attname = NULL;
                 }
             }
  
-           if (done)
-               break;          /* out of per-row loop */
-
             /*
              * Complain if there are more fields on the input line.
              *
              * Special case: if we're reading a zero-column table, we won't
-            * yet have called CopyReadAttribute() at all; so do that and
-            * check we have an empty line.  Fortunately we can keep that
-            * silly corner case out of the main line of execution.
-            */
-           if (result == NORMAL_ATTR)
-           {
-               if (attnumlist == NIL && !file_has_oids)
-               {
-                   string = CopyReadAttribute(delim, &result);
-                   if (result == NORMAL_ATTR || *string != '\0')
-                       ereport(ERROR,
-                               (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
-                       errmsg("extra data after last expected column")));
-                   if (result == END_OF_FILE)
-                   {
-                       /* EOF at start of line: all is well */
-                       done = true;
-                       break;
-                   }
-               }
-               else
-                   ereport(ERROR,
-                           (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
-                      errmsg("extra data after last expected column")));
-           }
-
-           /*
-            * If we got some data on the line, but it was ended by EOF,
-            * process the line normally but set flag to exit the loop
-            * when we return to the top.
+            * yet have called CopyReadAttribute() at all; so no error if
+            * line is empty.
              */
-           if (result == END_OF_FILE)
-               done = true;
+           if (result == NORMAL_ATTR && line_buf.len != 0)
+               ereport(ERROR,
+                       (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
+                        errmsg("extra data after last expected column")));
         }
         else
         {
@@ -1488,6 +1528,7 @@ CopyFrom(Relation rel, List *attnumlist, bool binary, bool oids,
  
             if (file_has_oids)
             {
+               copy_attname = "oid";
                 loaded_oid =
                     DatumGetObjectId(CopyReadBinaryAttribute(0,
                                                         &oid_in_function,
@@ -1497,6 +1538,7 @@ CopyFrom(Relation rel, List *attnumlist, bool binary, bool oids,
                     ereport(ERROR,
                             (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
                              errmsg("invalid OID in COPY data")));
+               copy_attname = NULL;
             }
  
             i = 0;
@@ -1505,12 +1547,14 @@ CopyFrom(Relation rel, List *attnumlist, bool binary, bool oids,
                 int         attnum = lfirsti(cur);
                 int         m = attnum - 1;
  
+               copy_attname = NameStr(attr[m]->attname);
                 i++;
                 values[m] = CopyReadBinaryAttribute(i,
                                                     &in_functions[m],
                                                     elements[m],
                                                     &isnull);
                 nulls[m] = isnull ? 'n' : ' ';
+               copy_attname = NULL;
             }
         }
  
@@ -1642,46 +1686,53 @@ CopyFrom(Relation rel, List *attnumlist, bool binary, bool oids,
  
  
  /*
- * Read the value of a single attribute.
- *
- * *result is set to indicate what terminated the read:
- *     NORMAL_ATTR:    column delimiter
- *     END_OF_LINE:    newline
- *     END_OF_FILE:    EOF indicator
- * In all cases, the string read up to the terminator is returned.
+ * Read the next input line and stash it in line_buf, with conversion to
+ * server encoding.
   *
- * Note: This function does not care about SQL NULL values -- it
- * is the caller's responsibility to check if the returned string
- * matches what the user specified for the SQL NULL value.
- *
- * delim is the column delimiter string.
+ * Result is true if read was terminated by EOF, false if terminated
+ * by newline.
   */
-static char *
-CopyReadAttribute(const char *delim, CopyReadResult *result)
+static bool
+CopyReadLine(void)
  {
+   bool        result;
+   bool        change_encoding = (client_encoding != server_encoding);
     int         c;
-   int         delimc = (unsigned char) delim[0];
     int         mblen;
+   int         j;
     unsigned char s[2];
     char       *cvt;
-   int         j;
  
     s[1] = 0;
  
-   /* reset attribute_buf to empty */
-   attribute_buf.len = 0;
-   attribute_buf.data[0] = '\0';
+   /* reset line_buf to empty */
+   line_buf.len = 0;
+   line_buf.data[0] = '\0';
+   line_buf.cursor = 0;
+
+   /* mark that encoding conversion hasn't occurred yet */
+   line_buf_converted = false;
  
     /* set default status */
-   *result = NORMAL_ATTR;
+   result = false;
  
+   /*
+    * In this loop we only care for detecting newlines (\r and/or \n)
+    * and the end-of-copy marker (\.).  For backwards compatibility
+    * we allow backslashes to escape newline characters.  Backslashes
+    * other than the end marker get put into the line_buf, since
+    * CopyReadAttribute does its own escape processing.  These four
+    * characters, and only these four, are assumed the same in frontend
+    * and backend encodings.  We do not assume that second and later bytes
+    * of a frontend multibyte character couldn't look like ASCII characters.
+    */
     for (;;)
     {
         c = CopyGetChar();
         if (c == EOF)
         {
-           *result = END_OF_FILE;
-           goto copy_eof;
+           result = true;
+           break;
         }
         if (c == '\r')
         {
@@ -1691,7 +1742,7 @@ CopyReadAttribute(const char *delim, CopyReadResult *result)
                          errmsg("literal carriage return found in data"),
                   errhint("Use \"\\r\" to represent carriage return.")));
             /* Check for \r\n on first line, _and_ handle \r\n. */
-           if (copy_lineno == 1 || eol_type == EOL_CRNL)
+           if (eol_type == EOL_UNKNOWN || eol_type == EOL_CRNL)
             {
                 int         c2 = CopyPeekChar();
  
@@ -1717,7 +1768,6 @@ CopyReadAttribute(const char *delim, CopyReadResult *result)
                     eol_type = EOL_CR;
                 }
             }
-           *result = END_OF_LINE;
             break;
         }
         if (c == '\n')
@@ -1728,19 +1778,150 @@ CopyReadAttribute(const char *delim, CopyReadResult *result)
                          errmsg("literal newline found in data"),
                          errhint("Use \"\\n\" to represent newline.")));
             eol_type = EOL_NL;
-           *result = END_OF_LINE;
             break;
         }
-       if (c == delimc)
-           break;
         if (c == '\\')
         {
             c = CopyGetChar();
             if (c == EOF)
             {
-               *result = END_OF_FILE;
-               goto copy_eof;
+               result = true;
+               break;
+           }
+           if (c == '.')
+           {
+               if (eol_type == EOL_CRNL)
+               {
+                   c = CopyGetChar();
+                   if (c == '\n')
+                       ereport(ERROR,
+                               (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
+                                errmsg("end-of-copy marker does not match previous newline style")));
+                   if (c != '\r')
+                       ereport(ERROR,
+                               (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
+                                errmsg("end-of-copy marker corrupt")));
+               }
+               c = CopyGetChar();
+               if (c != '\r' && c != '\n')
+                   ereport(ERROR,
+                           (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
+                            errmsg("end-of-copy marker corrupt")));
+               if ((eol_type == EOL_NL && c != '\n') ||
+                   (eol_type == EOL_CRNL && c != '\n') ||
+                   (eol_type == EOL_CR && c != '\r'))
+                   ereport(ERROR,
+                           (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
+                            errmsg("end-of-copy marker does not match previous newline style")));
+
+               /*
+                * In protocol version 3, we should ignore anything
+                * after \. up to the protocol end of copy data.  (XXX
+                * maybe better not to treat \. as special?)
+                */
+               if (copy_dest == COPY_NEW_FE)
+               {
+                   while (c != EOF)
+                       c = CopyGetChar();
+               }
+               result = true;  /* report EOF */
+               break;
+           }
+           /* not EOF mark, so emit \ and following char literally */
+           appendStringInfoCharMacro(&line_buf, '\\');
+       }
+
+       appendStringInfoCharMacro(&line_buf, c);
+
+       /*
+        * When client encoding != server, must be careful to read the
+        * extra bytes of a multibyte character exactly, since the encoding
+        * might not ensure they don't look like ASCII.  When the encodings
+        * are the same, we need not do this, since no server encoding we
+        * use has ASCII-like following bytes.
+        */
+       if (change_encoding)
+       {
+           s[0] = c;
+           mblen = pg_encoding_mblen(client_encoding, s);
+           for (j = 1; j < mblen; j++)
+           {
+               c = CopyGetChar();
+               if (c == EOF)
+               {
+                   result = true;
+                   break;
+               }
+               appendStringInfoCharMacro(&line_buf, c);
             }
+           if (result)
+               break;          /* out of outer loop */
+       }
+   } /* end of outer loop */
+
+   /*
+    * Done reading the line.  Convert it to server encoding.
+    */
+   if (change_encoding)
+   {
+       cvt = (char *) pg_client_to_server((unsigned char *) line_buf.data,
+                                          line_buf.len);
+       if (cvt != line_buf.data)
+       {
+           /* transfer converted data back to line_buf */
+           line_buf.len = 0;
+           line_buf.data[0] = '\0';
+           appendBinaryStringInfo(&line_buf, cvt, strlen(cvt));
+       }
+   }
+
+   line_buf_converted = true;
+
+   return result;
+}
+
+/*
+ * Read the value of a single attribute, performing de-escaping as needed.
+ *
+ * *result is set to indicate what terminated the read:
+ *     NORMAL_ATTR:    column delimiter
+ *     END_OF_LINE:    end of line
+ * In either case, the string read up to the terminator is returned.
+ *
+ * Note: This function does not care about SQL NULL values -- it
+ * is the caller's responsibility to check if the returned string
+ * matches what the user specified for the SQL NULL value.
+ *
+ * delim is the column delimiter string.
+ */
+static char *
+CopyReadAttribute(const char *delim, CopyReadResult *result)
+{
+   char        c;
+   char        delimc = delim[0];
+
+   /* reset attribute_buf to empty */
+   attribute_buf.len = 0;
+   attribute_buf.data[0] = '\0';
+
+   /* set default status */
+   *result = END_OF_LINE;
+
+   for (;;)
+   {
+       if (line_buf.cursor >= line_buf.len)
+           break;
+       c = line_buf.data[line_buf.cursor++];
+       if (c == delimc)
+       {
+           *result = NORMAL_ATTR;
+           break;
+       }
+       if (c == '\\')
+       {
+           if (line_buf.cursor >= line_buf.len)
+               break;
+           c = line_buf.data[line_buf.cursor++];
             switch (c)
             {
                 case '0':
@@ -1755,36 +1936,24 @@ CopyReadAttribute(const char *delim, CopyReadResult *result)
                         int         val;
  
                         val = OCTVALUE(c);
-                       c = CopyPeekChar();
-                       if (ISOCTAL(c))
+                       if (line_buf.cursor < line_buf.len)
                         {
-                           val = (val << 3) + OCTVALUE(c);
-                           CopyDonePeek(c, true /* pick up */ );
-                           c = CopyPeekChar();
+                           c = line_buf.data[line_buf.cursor];
                             if (ISOCTAL(c))
                             {
+                               line_buf.cursor++;
                                 val = (val << 3) + OCTVALUE(c);
-                               CopyDonePeek(c, true /* pick up */ );
-                           }
-                           else
-                           {
-                               if (c == EOF)
+                               if (line_buf.cursor < line_buf.len)
                                 {
-                                   *result = END_OF_FILE;
-                                   goto copy_eof;
+                                   c = line_buf.data[line_buf.cursor];
+                                   if (ISOCTAL(c))
+                                   {
+                                       line_buf.cursor++;
+                                       val = (val << 3) + OCTVALUE(c);
+                                   }
                                 }
-                               CopyDonePeek(c, false /* put back */ );
                             }
                         }
-                       else
-                       {
-                           if (c == EOF)
-                           {
-                               *result = END_OF_FILE;
-                               goto copy_eof;
-                           }
-                           CopyDonePeek(c, false /* put back */ );
-                       }
                         c = val & 0377;
                     }
                     break;
@@ -1816,79 +1985,12 @@ CopyReadAttribute(const char *delim, CopyReadResult *result)
                 case 'v':
                     c = '\v';
                     break;
-               case '.':
-                   if (eol_type == EOL_CRNL)
-                   {
-                       c = CopyGetChar();
-                       if (c == '\n')
-                           ereport(ERROR,
-                                 (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
-                                  errmsg("end-of-copy marker does not match previous newline style")));
-                       if (c != '\r')
-                           ereport(ERROR,
-                                 (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
-                                  errmsg("end-of-copy marker corrupt")));
-                   }
-                   c = CopyGetChar();
-                   if (c != '\r' && c != '\n')
-                       ereport(ERROR,
-                               (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
-                                errmsg("end-of-copy marker corrupt")));
-                   if ((eol_type == EOL_NL && c != '\n') ||
-                       (eol_type == EOL_CRNL && c != '\n') ||
-                       (eol_type == EOL_CR && c != '\r'))
-                       ereport(ERROR,
-                               (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
-                                errmsg("end-of-copy marker does not match previous newline style")));
-
-                   /*
-                    * In protocol version 3, we should ignore anything
-                    * after \. up to the protocol end of copy data.  (XXX
-                    * maybe better not to treat \. as special?)
-                    */
-                   if (copy_dest == COPY_NEW_FE)
-                   {
-                       while (c != EOF)
-                           c = CopyGetChar();
-                   }
-                   *result = END_OF_FILE;
-                   goto copy_eof;
+               /*
+                * in all other cases, take the char after '\' literally
+                */
             }
         }
         appendStringInfoCharMacro(&attribute_buf, c);
-
-       /* XXX shouldn't this be done even when encoding is the same? */
-       if (client_encoding != server_encoding)
-       {
-           /* get additional bytes of the char, if any */
-           s[0] = c;
-           mblen = pg_encoding_mblen(client_encoding, s);
-           for (j = 1; j < mblen; j++)
-           {
-               c = CopyGetChar();
-               if (c == EOF)
-               {
-                   *result = END_OF_FILE;
-                   goto copy_eof;
-               }
-               appendStringInfoCharMacro(&attribute_buf, c);
-           }
-       }
-   }
-
-copy_eof:
-
-   if (client_encoding != server_encoding)
-   {
-       cvt = (char *) pg_client_to_server((unsigned char *) attribute_buf.data,
-                                          attribute_buf.len);
-       if (cvt != attribute_buf.data)
-       {
-           /* transfer converted data back to attribute_buf */
-           attribute_buf.len = 0;
-           attribute_buf.data[0] = '\0';
-           appendBinaryStringInfo(&attribute_buf, cvt, strlen(cvt));
-       }
     }
  
     return attribute_buf.data;
@@ -1917,7 +2019,7 @@ CopyReadBinaryAttribute(int column_no, FmgrInfo *flinfo, Oid typelem,
     if (fld_size < 0)
         ereport(ERROR,
                 (errcode(ERRCODE_BAD_COPY_FILE_FORMAT),
-                errmsg("invalid size for field %d", column_no)));
+                errmsg("invalid field size")));
  
     /* reset attribute_buf to empty, and load raw data in it */
     attribute_buf.len = 0;
@@ -1944,8 +2046,7 @@ CopyReadBinaryAttribute(int column_no, FmgrInfo *flinfo, Oid typelem,
     if (attribute_buf.cursor != attribute_buf.len)
         ereport(ERROR,
                 (errcode(ERRCODE_INVALID_BINARY_REPRESENTATION),
-                errmsg("incorrect binary data format in field %d",
-                       column_no)));
+                errmsg("incorrect binary data format")));
  
     *isnull = false;
     return result;
diff --git a/src/test/regress/expected/alter_table.out b/src/test/regress/expected/alter_table.out

index 42b3e03f80b6d791b8bd2a04fa204ed2287fcd12..0fb90a5e475af06daff36116556ecf4021fadaf1 100644 (file)
--- a/src/test/regress/expected/alter_table.out
+++ b/src/test/regress/expected/alter_table.out
@@ -998,7 +998,7 @@ copy test("........pg.dropped.1........") to stdout;
  ERROR:  column "........pg.dropped.1........" of relation "test" does not exist
  copy test from stdin;
  ERROR:  extra data after last expected column
-CONTEXT:  COPY FROM, line 1
+CONTEXT:  COPY test, line 1: "10   11  12"
  select * from test;
   b | c 
  ---+---
diff --git a/src/test/regress/expected/copy2.out b/src/test/regress/expected/copy2.out

index a6e9ae27e2817f10483aa03130a0c350a14d3151..df08fcd45a6e6c57fcdc92531a8dffc5a1093fa8 100644 (file)
--- a/src/test/regress/expected/copy2.out
+++ b/src/test/regress/expected/copy2.out
@@ -35,17 +35,17 @@ ERROR:  column "d" specified more than once
  -- missing data: should fail
  COPY x from stdin;
  ERROR:  invalid input syntax for integer: ""
-CONTEXT:  COPY FROM, line 1
+CONTEXT:  COPY x, line 1, column a: ""
  COPY x from stdin;
  ERROR:  missing data for column "e"
-CONTEXT:  COPY FROM, line 1
+CONTEXT:  COPY x, line 1: "2000    230 23  23"
  COPY x from stdin;
  ERROR:  missing data for column "e"
-CONTEXT:  COPY FROM, line 1
+CONTEXT:  COPY x, line 1: "2001    231 \N  \N"
  -- extra data: should fail
  COPY x from stdin;
  ERROR:  extra data after last expected column
-CONTEXT:  COPY FROM, line 1
+CONTEXT:  COPY x, line 1: "2002    232 40  50  60  70  80"
  -- various COPY options: delimiters, oids, NULL string
  COPY x (b, c, d, e) from stdin with oids delimiter ',' null 'x';
  -- check results of copy in
diff --git a/src/test/regress/expected/domain.out b/src/test/regress/expected/domain.out

index 87a941e003c454ebe1e44a3611dee56586bb1e38..b23e84e7288a5ee1ecc160b67eab13c0f6257582 100644 (file)
--- a/src/test/regress/expected/domain.out
+++ b/src/test/regress/expected/domain.out
@@ -40,7 +40,7 @@ INSERT INTO basictest values ('88', 'haha', 'short', '123.1212');    -- Truncate
  -- Test copy
  COPY basictest (testvarchar) FROM stdin; -- fail
  ERROR:  value too long for type character varying(5)
-CONTEXT:  COPY FROM, line 1
+CONTEXT:  COPY basictest, line 1: "notsoshorttext"
  COPY basictest (testvarchar) FROM stdin;
  select * from basictest;
   testint4 | testtext | testvarchar | testnumeric 
@@ -127,11 +127,11 @@ INSERT INTO nulltest values ('a', 'b', 'c', NULL, 'd'); -- Good
  -- Test copy
  COPY nulltest FROM stdin; --fail
  ERROR:  domain dcheck does not allow null values
-CONTEXT:  COPY FROM, line 1
+CONTEXT:  COPY nulltest, line 1: "a    b   \N  d   \N"
  -- Last row is bad
  COPY nulltest FROM stdin;
  ERROR:  new row for relation "nulltest" violates check constraint "nulltest_col5"
-CONTEXT:  COPY FROM, line 3
+CONTEXT:  COPY nulltest, line 3: "a    b   c   \N  a"
  select * from nulltest;
   col1 | col2 | col3 | col4 | col5 
  ------+------+------+------+------
diff --git a/src/test/regress/output/constraints.source b/src/test/regress/output/constraints.source

index 48b75f8d8b15f04732aa10f78b21d20230b37f4a..7c1ac5e12d20c3908e1eb96aee0e5948038fd1a7 100644 (file)
--- a/src/test/regress/output/constraints.source
+++ b/src/test/regress/output/constraints.source
@@ -274,7 +274,7 @@ SELECT '' AS two, * FROM COPY_TBL;
  
  COPY COPY_TBL FROM '@abs_srcdir@/data/constrf.data';
  ERROR:  new row for relation "copy_tbl" violates check constraint "copy_con"
-CONTEXT:  COPY FROM, line 2
+CONTEXT:  COPY copy_tbl, line 2: "7    check failed    6"
  SELECT * FROM COPY_TBL;
   x |       y       | z 
  ---+---------------+---
author	Tom Lane <tgl@sss.pgh.pa.us>
	Mon, 29 Sep 2003 22:06:40 +0000 (22:06 +0000)
committer	Tom Lane <tgl@sss.pgh.pa.us>
	Mon, 29 Sep 2003 22:06:40 +0000 (22:06 +0000)
src/backend/commands/copy.c		patch \| blob \| blame \| history
src/test/regress/expected/alter_table.out		patch \| blob \| blame \| history
src/test/regress/expected/copy2.out		patch \| blob \| blame \| history
src/test/regress/expected/domain.out		patch \| blob \| blame \| history
src/test/regress/output/constraints.source		patch \| blob \| blame \| history