2018-03-22 18:38 GMT+01:00 Fabien COELHO <coe...@cri.ensmp.fr>: > > Hello Pavel, > > Using \pset format csv means overwriting field sep every time - nobody uses >> | >> > > Yep. The alternative is to have a csv-specific separator variable, which > does not seem very useful, must be remembered, but this is indeed debatable. > > I think so dependency on order of psql arguments is significant problem >> > > This is intentional, and this issue/feature already exists, the last > argument overwrite previous settings thus will win, eg: > > psql --pset=format=troff --html -c 'SELECT 1' > > Will output in html, not in troff. >
Can we introduce some format-specific default separators, if we do not want to introduce a csv_field_sep option? It should not be hard. All formats can have '|' as now, and csv can have ',' - then if the field separator is not set explicitly, the format's default field separator is used; otherwise the specified field separator is used. You can see my idea in the attached patch. Regards Pavel postgres=# \pset format csv Output format is csv. postgres=# select * from foo; a,b,c 1,2,Hello 3,4,Nazdar postgres=# \pset fieldsep ; Field separator is ";". postgres=# select * from foo; a;b;c 1;2;Hello 3;4;Nazdar > > -- > Fabien. > 
diff --git a/doc/src/sgml/ref/psql-ref.sgml b/doc/src/sgml/ref/psql-ref.sgml index bfdf859731..4d3e3b59f3 100644 --- a/doc/src/sgml/ref/psql-ref.sgml +++ b/doc/src/sgml/ref/psql-ref.sgml @@ -151,6 +151,16 @@ EOF </listitem> </varlistentry> + <varlistentry> + <term><option>--csv</option></term> + <listitem> + <para> + Switches to csv output mode. This is equivalent to <command>\pset format + csv</command> followed by <command>\pset fieldsep ','</command>. + </para> + </listitem> + </varlistentry> + <varlistentry> <term><option>-d <replaceable class="parameter">dbname</replaceable></option></term> <term><option>--dbname=<replaceable class="parameter">dbname</replaceable></option></term> @@ -246,7 +256,7 @@ EOF <listitem> <para> Use <replaceable class="parameter">separator</replaceable> as the - field separator for unaligned output. This is equivalent to + field separator for unaligned and csv outputs. This is equivalent to <command>\pset fieldsep</command> or <command>\f</command>. </para> </listitem> @@ -382,7 +392,7 @@ EOF <listitem> <para> Use <replaceable class="parameter">separator</replaceable> as the - record separator for unaligned output. This is equivalent to + record separator for unaligned and csv outputs. This is equivalent to <command>\pset recordsep</command>. </para> </listitem> @@ -558,7 +568,7 @@ EOF <listitem> <para> Set the field separator for unaligned output to a zero byte. This is - equvalent to <command>\pset fieldsep_zero</command>. + equivalent to <command>\pset fieldsep_zero</command>. </para> </listitem> </varlistentry> @@ -1937,9 +1947,9 @@ Tue Oct 26 21:40:57 CEST 1999 <listitem> <para> - Sets the field separator for unaligned query output. The default - is the vertical bar (<literal>|</literal>). It is equivalent to - <command>\pset fieldsep</command>. + Sets the field separator for unaligned and csv query outputs. The + default is the vertical bar (<literal>|</literal>). It is equivalent + to <command>\pset fieldsep</command>. 
</para> </listitem> </varlistentry> @@ -2546,8 +2556,8 @@ lo_import 152801 <term><literal>fieldsep</literal></term> <listitem> <para> - Specifies the field separator to be used in unaligned output - format. That way one can create, for example, tab- or + Specifies the field separator to be used in unaligned and csv output + formats. That way one can create, for example, tab- or comma-separated output, which other programs might prefer. To set a tab as field separator, type <literal>\pset fieldsep '\t'</literal>. The default field separator is @@ -2584,9 +2594,13 @@ lo_import 152801 <term><literal>format</literal></term> <listitem> <para> - Sets the output format to one of <literal>unaligned</literal>, - <literal>aligned</literal>, <literal>wrapped</literal>, - <literal>html</literal>, <literal>asciidoc</literal>, + Sets the output format to one of + <literal>unaligned</literal>, + <literal>aligned</literal>, + <literal>csv</literal>, + <literal>wrapped</literal>, + <literal>html</literal>, + <literal>asciidoc</literal>, <literal>latex</literal> (uses <literal>tabular</literal>), <literal>latex-longtable</literal>, or <literal>troff-ms</literal>. @@ -2601,6 +2615,15 @@ lo_import 152801 format). </para> + <para><literal>csv</literal> format writes columns separated + by <literal>fieldsep</literal>, applying the CSV quoting rules + described in RFC-4180 and compatible with the CSV format + of the <command>COPY</command> command. + The header with column names is output unless the + <literal>tuples_only</literal> parameter is <literal>on</literal>. + Title and footers are not printed. + </para> + <para><literal>aligned</literal> format is the standard, human-readable, nicely formatted text output; this is the default. </para> @@ -2747,8 +2770,8 @@ lo_import 152801 <term><literal>recordsep</literal></term> <listitem> <para> - Specifies the record (line) separator to use in unaligned - output format. The default is a newline character. 
+ Specifies the record (line) separator to use in unaligned or + csv output formats. The default is a newline character. </para> </listitem> </varlistentry> diff --git a/src/bin/psql/command.c b/src/bin/psql/command.c index 3560318749..1cd8a3856e 100644 --- a/src/bin/psql/command.c +++ b/src/bin/psql/command.c @@ -1222,6 +1222,10 @@ exec_command_f(PsqlScanState scan_state, bool active_branch) OT_NORMAL, NULL, false); success = do_pset("fieldsep", fname, &pset.popt, pset.quiet); + + if (success) + pset.popt.topt.fieldSep.is_explicit = true; + free(fname); } else @@ -3603,6 +3607,9 @@ _align2string(enum printFormat in) case PRINT_TROFF_MS: return "troff-ms"; break; + case PRINT_CSV: + return "csv"; + break; } return "unknown"; } @@ -3658,25 +3665,27 @@ do_pset(const char *param, const char *value, printQueryOpt *popt, bool quiet) { if (!value) ; - else if (pg_strncasecmp("unaligned", value, vallen) == 0) - popt->topt.format = PRINT_UNALIGNED; else if (pg_strncasecmp("aligned", value, vallen) == 0) popt->topt.format = PRINT_ALIGNED; - else if (pg_strncasecmp("wrapped", value, vallen) == 0) - popt->topt.format = PRINT_WRAPPED; - else if (pg_strncasecmp("html", value, vallen) == 0) - popt->topt.format = PRINT_HTML; else if (pg_strncasecmp("asciidoc", value, vallen) == 0) popt->topt.format = PRINT_ASCIIDOC; + else if (pg_strncasecmp("csv", value, vallen) == 0) + popt->topt.format = PRINT_CSV; + else if (pg_strncasecmp("html", value, vallen) == 0) + popt->topt.format = PRINT_HTML; else if (pg_strncasecmp("latex", value, vallen) == 0) popt->topt.format = PRINT_LATEX; else if (pg_strncasecmp("latex-longtable", value, vallen) == 0) popt->topt.format = PRINT_LATEX_LONGTABLE; else if (pg_strncasecmp("troff-ms", value, vallen) == 0) popt->topt.format = PRINT_TROFF_MS; + else if (pg_strncasecmp("unaligned", value, vallen) == 0) + popt->topt.format = PRINT_UNALIGNED; + else if (pg_strncasecmp("wrapped", value, vallen) == 0) + popt->topt.format = PRINT_WRAPPED; else { - 
psql_error("\\pset: allowed formats are unaligned, aligned, wrapped, html, asciidoc, latex, latex-longtable, troff-ms\n"); + psql_error("\\pset: allowed formats are aligned, asciidoc, csv, html, latex, latex-longtable, troff-ms, unaligned, wrapped\n"); return false; } } @@ -3800,6 +3809,7 @@ do_pset(const char *param, const char *value, printQueryOpt *popt, bool quiet) { free(popt->topt.fieldSep.separator); popt->topt.fieldSep.separator = pg_strdup(value); + popt->topt.fieldSep.is_explicit = true; popt->topt.fieldSep.separator_zero = false; } } diff --git a/src/bin/psql/help.c b/src/bin/psql/help.c index 702e742af4..338b27524c 100644 --- a/src/bin/psql/help.c +++ b/src/bin/psql/help.c @@ -108,13 +108,14 @@ usage(unsigned short int pager) fprintf(output, _("\nOutput format options:\n")); fprintf(output, _(" -A, --no-align unaligned table output mode\n")); + fprintf(output, _(" --csv Comma-Separated-Values output mode\n")); fprintf(output, _(" -F, --field-separator=STRING\n" - " field separator for unaligned output (default: \"%s\")\n"), + " field separator for unaligned or csv output (default: \"%s\")\n"), DEFAULT_FIELD_SEP); fprintf(output, _(" -H, --html HTML table output mode\n")); fprintf(output, _(" -P, --pset=VAR[=ARG] set printing option VAR to ARG (see \\pset command)\n")); fprintf(output, _(" -R, --record-separator=STRING\n" - " record separator for unaligned output (default: newline)\n")); + " record separator for unaligned or csv output (default: newline)\n")); fprintf(output, _(" -t, --tuples-only print rows only\n")); fprintf(output, _(" -T, --table-attr=TEXT set HTML table tag attributes (e.g., width, border)\n")); fprintf(output, _(" -x, --expanded turn on expanded table output\n")); @@ -426,7 +427,7 @@ helpVariables(unsigned short int pager) fprintf(output, _(" expanded (or x)\n" " expanded output [on, off, auto]\n")); fprintf(output, _(" fieldsep\n" - " field separator for unaligned output (default \"%s\")\n"), + " field separator for unaligned and 
csv output (default \"%s\")\n"), DEFAULT_FIELD_SEP); fprintf(output, _(" fieldsep_zero\n" " set field separator for unaligned output to a zero byte\n")); @@ -443,7 +444,7 @@ helpVariables(unsigned short int pager) fprintf(output, _(" pager\n" " control when an external pager is used [yes, no, always]\n")); fprintf(output, _(" recordsep\n" - " record (line) separator for unaligned output\n")); + " record (line) separator for unaligned and csv output\n")); fprintf(output, _(" recordsep_zero\n" " set record separator for unaligned output to a zero byte\n")); fprintf(output, _(" tableattr (or T)\n" diff --git a/src/bin/psql/settings.h b/src/bin/psql/settings.h index 69e617e6b5..93d0b957f5 100644 --- a/src/bin/psql/settings.h +++ b/src/bin/psql/settings.h @@ -13,6 +13,7 @@ #include "fe_utils/print.h" #define DEFAULT_FIELD_SEP "|" +#define DEFAULT_FIELD_SEP_CSV "," #define DEFAULT_RECORD_SEP "\n" #if defined(WIN32) || defined(__CYGWIN__) diff --git a/src/bin/psql/startup.c b/src/bin/psql/startup.c index be57574cd3..f2df82d4ca 100644 --- a/src/bin/psql/startup.c +++ b/src/bin/psql/startup.c @@ -148,6 +148,8 @@ main(int argc, char *argv[]) pset.popt.topt.unicode_column_linestyle = UNICODE_LINESTYLE_SINGLE; pset.popt.topt.unicode_header_linestyle = UNICODE_LINESTYLE_SINGLE; + pset.popt.topt.fieldSep.is_explicit = false; + refresh_utf8format(&(pset.popt.topt)); /* We must get COLUMNS here before readline() sets it */ @@ -436,6 +438,7 @@ parse_psql_options(int argc, char *argv[], struct adhoc_opts *options) {"echo-all", no_argument, NULL, 'a'}, {"no-align", no_argument, NULL, 'A'}, {"command", required_argument, NULL, 'c'}, + {"csv", no_argument, NULL, 2}, /* no single-letter (leave -C for future use) */ {"dbname", required_argument, NULL, 'd'}, {"echo-queries", no_argument, NULL, 'e'}, {"echo-errors", no_argument, NULL, 'b'}, @@ -516,6 +519,7 @@ parse_psql_options(int argc, char *argv[], struct adhoc_opts *options) break; case 'F': pset.popt.topt.fieldSep.separator = 
pg_strdup(optarg); + pset.popt.topt.fieldSep.is_explicit = true; pset.popt.topt.fieldSep.separator_zero = false; break; case 'h': @@ -658,6 +662,12 @@ parse_psql_options(int argc, char *argv[], struct adhoc_opts *options) exit(EXIT_SUCCESS); } break; + case 2: + /* --csv: set both format and field separator */ + pset.popt.topt.format = PRINT_CSV; +// pset.popt.topt.fieldSep.separator = pg_strdup(DEFAULT_FIELD_SEP_CSV); + pset.popt.topt.fieldSep.separator_zero = false; + break; default: unknown_option: fprintf(stderr, _("Try \"%s --help\" for more information.\n"), diff --git a/src/bin/psql/tab-complete.c b/src/bin/psql/tab-complete.c index 08d8ef09a4..b9fc423526 100644 --- a/src/bin/psql/tab-complete.c +++ b/src/bin/psql/tab-complete.c @@ -3753,8 +3753,8 @@ psql_completion(const char *text, int start, int end) if (TailMatchesCS1("format")) { static const char *const my_list[] = - {"unaligned", "aligned", "wrapped", "html", "asciidoc", - "latex", "latex-longtable", "troff-ms", NULL}; + {"unaligned", "aligned", "csv", "wrapped", "html", "asciidoc", + "latex", "latex-longtable", "troff-ms", NULL}; COMPLETE_WITH_LIST_CS(my_list); } diff --git a/src/fe_utils/print.c b/src/fe_utils/print.c index ec5ad45a30..542b5413e2 100644 --- a/src/fe_utils/print.c +++ b/src/fe_utils/print.c @@ -35,6 +35,8 @@ #include "catalog/pg_type.h" #include "fe_utils/mbprint.h" +#define DEFAULT_FIELD_SEP_CSV "," + /* * If the calling program doesn't have any mechanism for setting @@ -2783,6 +2785,114 @@ print_troff_ms_vertical(const printTableContent *cont, FILE *fout) } } +/*************************/ +/* CSV */ +/*************************/ +static void +csv_escaped_print(const char *text, FILE *fout) +{ + const char *p; + + fputc('"', fout); + for (p = text; *p; p++) + { + if (*p == '"') + fputc('"', fout); /* double quotes are doubled */ + fputc(*p, fout); + } + fputc('"', fout); +} + +static void +csv_print_field(const char *text, FILE *fout, const char *sep) +{ + /* + * Enclose and escape 
field contents when one of these conditions is + * met: + * - the field separator is found in the contents + * - the field contains a CR or LF + * - the field contains a double quote + */ + if ((sep != NULL && *sep != '\0' && strstr(text, sep) != NULL) || + strcspn(text, "\r\n\"") != strlen(text)) + { + csv_escaped_print(text, fout); + } + else + fputs(text, fout); +} + +static void +print_csv_text(const printTableContent *cont, FILE *fout) +{ + const char *const *ptr; + const char* fieldsep; + const char* const recordsep = cont->opt->recordSep.separator; + int i; + + if (cancel_pressed) + return; + + if (cont->opt->fieldSep.is_explicit) + fieldsep = cont->opt->fieldSep.separator; + else + fieldsep = DEFAULT_FIELD_SEP_CSV; + + /* + * The title and footer are never printed in csv format. + * The header is printed if opt_tuples_only is false. + */ + + if (cont->opt->start_table && !cont->opt->tuples_only) + { + /* print headers */ + for (ptr = cont->headers; *ptr; ptr++) + { + if (ptr != cont->headers) + fputs(fieldsep, fout); + csv_print_field(*ptr, fout, fieldsep); + } + fputs(recordsep, fout); + } + + /* print cells */ + for (i = 0, ptr = cont->cells; *ptr; i++, ptr++) + { + if (cancel_pressed) + break; + + csv_print_field(*ptr, fout, fieldsep); + + if ((i + 1) % cont->ncolumns) + fputs(fieldsep, fout); + else + fputs(recordsep, fout); + } +} + +static void +print_csv_vertical(const printTableContent *cont, FILE *fout) +{ + unsigned int i; + const char *const *ptr; + + /* Print records */ + for (i = 0, ptr = cont->cells; *ptr; i++, ptr++) + { + if (cancel_pressed) + break; + + /* Field name */ + csv_print_field(cont->headers[i % cont->ncolumns], fout, + cont->opt->fieldSep.separator); + fputs(cont->opt->fieldSep.separator, fout); + + /* Field value followed by record separator */ + csv_print_field(*ptr, fout, cont->opt->fieldSep.separator); + fputs(cont->opt->recordSep.separator, fout); + } +} + /********************************/ /* Public functions */ @@ -3234,6 
+3344,12 @@ printTable(const printTableContent *cont, else print_aligned_text(cont, fout, is_pager); break; + case PRINT_CSV: + if (cont->opt->expanded == 1) + print_csv_vertical(cont, fout); + else + print_csv_text(cont, fout); + break; case PRINT_HTML: if (cont->opt->expanded == 1) print_html_vertical(cont, fout); diff --git a/src/include/fe_utils/print.h b/src/include/fe_utils/print.h index 83320d06bd..bdb0c65434 100644 --- a/src/include/fe_utils/print.h +++ b/src/include/fe_utils/print.h @@ -33,7 +33,8 @@ enum printFormat PRINT_ASCIIDOC, PRINT_LATEX, PRINT_LATEX_LONGTABLE, - PRINT_TROFF_MS + PRINT_TROFF_MS, + PRINT_CSV /* add your favourite output format here ... */ }; @@ -91,6 +92,7 @@ struct separator { char *separator; bool separator_zero; + bool is_explicit; }; typedef struct printTableOpt @@ -158,8 +160,8 @@ typedef struct printTableContent char *aligns; /* Array of alignment specifiers; 'l' or 'r', * one per column */ char *align; /* Pointer to the last added alignment */ -} printTableContent; +} printTableContent; typedef struct printQueryOpt { printTableOpt topt; /* the options above */ diff --git a/src/test/regress/expected/psql.out b/src/test/regress/expected/psql.out index 3818cfea7e..0bdfa4d505 100644 --- a/src/test/regress/expected/psql.out +++ b/src/test/regress/expected/psql.out @@ -3243,3 +3243,106 @@ last error message: division by zero \echo 'last error code:' :LAST_ERROR_SQLSTATE last error code: 22012 \unset FETCH_COUNT +-- test csv format +prepare q as select 'ab,cd' as col1, 'ab' as "col,2", E'a\tb' as col3, '"' as col4, + '""' as col5, 'a"b' as "col""6", E'a\nb' as col7, NULL as col8, 'ab' as "col + 9", array['ab', E'cd\nef'] as col10, + '{"a":"a,b", "a,b":null, "c":"a,\"b"}'::json as col11 + from generate_series(1,2); +\pset format csv +\pset fieldsep ',' +\pset expanded off +\t off +execute q; +col1,"col,2",col3,col4,col5,"col""6",col7,col8,"col + 9",col10,col11 +"ab,cd",ab,a b,"""","""""","a""b","a +b",,ab,"{ab,""cd 
+ef""}","{""a"":""a,b"", ""a,b"":null, ""c"":""a,\""b""}" +"ab,cd",ab,a b,"""","""""","a""b","a +b",,ab,"{ab,""cd +ef""}","{""a"":""a,b"", ""a,b"":null, ""c"":""a,\""b""}" +\pset fieldsep '\t' +execute q; +col1 col,2 col3 col4 col5 "col""6" col7 col8 "col + 9" col10 col11 +ab,cd ab "a b" """" """""" "a""b" "a +b" ab "{ab,""cd +ef""}" "{""a"":""a,b"", ""a,b"":null, ""c"":""a,\""b""}" +ab,cd ab "a b" """" """""" "a""b" "a +b" ab "{ab,""cd +ef""}" "{""a"":""a,b"", ""a,b"":null, ""c"":""a,\""b""}" +\t on +execute q; +ab,cd ab "a b" """" """""" "a""b" "a +b" ab "{ab,""cd +ef""}" "{""a"":""a,b"", ""a,b"":null, ""c"":""a,\""b""}" +ab,cd ab "a b" """" """""" "a""b" "a +b" ab "{ab,""cd +ef""}" "{""a"":""a,b"", ""a,b"":null, ""c"":""a,\""b""}" +\t off +\pset expanded on +execute q; +col1 ab,cd +col,2 ab +col3 "a b" +col4 """" +col5 """""" +"col""6" "a""b" +col7 "a +b" +col8 +"col + 9" ab +col10 "{ab,""cd +ef""}" +col11 "{""a"":""a,b"", ""a,b"":null, ""c"":""a,\""b""}" +col1 ab,cd +col,2 ab +col3 "a b" +col4 """" +col5 """""" +"col""6" "a""b" +col7 "a +b" +col8 +"col + 9" ab +col10 "{ab,""cd +ef""}" +col11 "{""a"":""a,b"", ""a,b"":null, ""c"":""a,\""b""}" +\pset fieldsep ',' +execute q; +col1,"ab,cd" +"col,2",ab +col3,a b +col4,"""" +col5,"""""" +"col""6","a""b" +col7,"a +b" +col8, +"col + 9",ab +col10,"{ab,""cd +ef""}" +col11,"{""a"":""a,b"", ""a,b"":null, ""c"":""a,\""b""}" +col1,"ab,cd" +"col,2",ab +col3,a b +col4,"""" +col5,"""""" +"col""6","a""b" +col7,"a +b" +col8, +"col + 9",ab +col10,"{ab,""cd +ef""}" +col11,"{""a"":""a,b"", ""a,b"":null, ""c"":""a,\""b""}" +deallocate q; +\pset format aligned +\pset expanded off +\pset fieldsep '|' +\t off diff --git a/src/test/regress/sql/psql.sql b/src/test/regress/sql/psql.sql index b45da9bb8d..6891a9b54c 100644 --- a/src/test/regress/sql/psql.sql +++ b/src/test/regress/sql/psql.sql @@ -688,3 +688,31 @@ select 1/(15-unique2) from tenk1 order by unique2 limit 19; \echo 'last error code:' :LAST_ERROR_SQLSTATE \unset FETCH_COUNT + 
+-- test csv format +prepare q as select 'ab,cd' as col1, 'ab' as "col,2", E'a\tb' as col3, '"' as col4, + '""' as col5, 'a"b' as "col""6", E'a\nb' as col7, NULL as col8, 'ab' as "col + 9", array['ab', E'cd\nef'] as col10, + '{"a":"a,b", "a,b":null, "c":"a,\"b"}'::json as col11 + from generate_series(1,2); + +\pset format csv +\pset fieldsep ',' +\pset expanded off +\t off +execute q; +\pset fieldsep '\t' +execute q; +\t on +execute q; +\t off +\pset expanded on +execute q; +\pset fieldsep ',' +execute q; + +deallocate q; +\pset format aligned +\pset expanded off +\pset fieldsep '|' +\t off