1 /* PSPP - a program for statistical analysis.
2 Copyright (C) 2010, 2011, 2013, 2016 Free Software Foundation, Inc.
4 This program is free software: you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation, either version 3 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program. If not, see <http://www.gnu.org/licenses/>. */
21 #include "data/case-map.h"
22 #include "data/casereader.h"
23 #include "data/casewriter.h"
24 #include "data/csv-file-writer.h"
25 #include "data/dataset.h"
26 #include "data/dictionary.h"
27 #include "data/file-name.h"
28 #include "data/format.h"
29 #include "data/settings.h"
30 #include "language/command.h"
31 #include "language/data-io/file-handle.h"
32 #include "language/data-io/trim.h"
33 #include "language/lexer/lexer.h"
34 #include "libpspp/message.h"
/* Message-translation helpers.
   _(MSGID) expands to a gettext() call on MSGID.
   N_(MSGID) expands to MSGID itself, unchanged. */
39 #define _(msgid) gettext (msgid)
40 #define N_(msgid) (msgid)
/* Command handler (presumably for SAVE TRANSLATE, judging by its name):
   parses slash-introduced subcommands from LEXER, then writes the cases of
   dataset DS through a CSV writer to the file named on OUTFILE.

   Returns CMD_SUCCESS if both closing the writer and committing the
   procedure succeed, otherwise CMD_CASCADING_FAILURE.

   NOTE(review): this excerpt does not show every line of the function.
   The declarations of `decimal', `delimiter', `qualifier', `replace',
   `map' and `ok', the bodies of some branches, and the error-exit label
   are not visible here; confirm against the full file before relying on
   the comments below. */
43 cmd_save_translate (struct lexer *lexer, struct dataset *ds)
/* Kind of output file.  TAB_FILE makes a tab the default delimiter when
   csv_opts.delimiter is computed further down. */
45 enum { CSV_FILE = 1, TAB_FILE } type;
47 struct dictionary *dict;
48 struct case_map_stage *stage;
50 struct casewriter *writer;
51 struct file_handle *handle;
53 struct csv_writer_options csv_opts;
/* Settings collected from the subcommands.  retain_unselected is passed
   (negated) to proc_open_filtering(); the others are copied into
   csv_opts. */
57 bool retain_unselected;
58 bool recode_user_missing;
59 bool include_var_names;
60 bool use_value_labels;
61 bool use_print_formats;
/* Operate on a clone of the dataset's dictionary. */
70 dict = dict_clone (dataset_dict (ds));
/* NOTE(review): presumably relaxes the rule that variable names in the
   clone must be valid identifiers -- confirm in data/dictionary.h. */
71 dict_set_names_must_be_ids (dict, false);
/* Defaults used when the corresponding subcommand is not given. */
78 retain_unselected = true;
79 recode_user_missing = false;
80 include_var_names = false;
81 use_value_labels = false;
82 use_print_formats = false;
83 decimal = settings_get_decimal_char (FMT_F);
/* The stage is created from the dictionary before scratch variables are
   deleted and before any subcommand is parsed; it is converted into a case
   map after parsing.  NOTE(review): presumably it records the original
   layout so that the later changes can be mapped -- confirm in
   data/case-map.h. */
87 stage = case_map_stage_create (dict);
88 dict_delete_scratch_vars (dict);
/* Parse subcommands until the end of the command.  Each one must be
   introduced by a slash. */
90 while (lex_token (lexer) != T_ENDCMD)
92 if (!lex_force_match (lexer, T_SLASH))
/* OUTFILE: parse the file handle to write to (FH_REF_FILE).  The
   lex_sbc_only_once() call reports a repeated subcommand; the test that
   guards it is not visible in this excerpt. */
95 if (lex_match_id (lexer, "OUTFILE"))
99 lex_sbc_only_once ("OUTFILE");
103 lex_match (lexer, T_EQUALS);
105 handle = fh_parse (lexer, FH_REF_FILE, NULL);
/* TYPE: accepts CSV or TAB; anything else is a syntax error. */
109 else if (lex_match_id (lexer, "TYPE"))
113 lex_sbc_only_once ("TYPE");
117 lex_match (lexer, T_EQUALS);
118 if (lex_match_id (lexer, "CSV"))
120 else if (lex_match_id (lexer, "TAB"))
124 lex_error_expecting (lexer, "CSV", "TAB");
/* REPLACE: its action is not visible in this excerpt; presumably it sets
   `replace', which is tested before an existing file is overwritten. */
128 else if (lex_match_id (lexer, "REPLACE"))
/* FIELDNAMES: turns on include_var_names. */
130 else if (lex_match_id (lexer, "FIELDNAMES"))
131 include_var_names = true;
/* MISSING: IGNORE clears and RECODE sets recode_user_missing. */
132 else if (lex_match_id (lexer, "MISSING"))
134 lex_match (lexer, T_EQUALS);
135 if (lex_match_id (lexer, "IGNORE"))
136 recode_user_missing = false;
137 else if (lex_match_id (lexer, "RECODE"))
138 recode_user_missing = true;
141 lex_error_expecting (lexer, "IGNORE", "RECODE");
/* CELLS: VALUES clears and LABELS sets use_value_labels. */
145 else if (lex_match_id (lexer, "CELLS"))
147 lex_match (lexer, T_EQUALS);
148 if (lex_match_id (lexer, "VALUES"))
149 use_value_labels = false;
150 else if (lex_match_id (lexer, "LABELS"))
151 use_value_labels = true;
154 lex_error_expecting (lexer, "VALUES", "LABELS");
/* TEXTOPTIONS: accepts the DELIMITER, QUALIFIER, DECIMAL and FORMAT
   settings handled below. */
158 else if (lex_match_id (lexer, "TEXTOPTIONS"))
160 lex_match (lexer, T_EQUALS);
/* DELIMITER: a string token whose length must be exactly 1; its first
   byte becomes the delimiter. */
163 if (lex_match_id (lexer, "DELIMITER"))
165 lex_match (lexer, T_EQUALS);
166 if (!lex_force_string (lexer))
168 /* XXX should support multibyte UTF-8 delimiters */
169 if (ss_length (lex_tokss (lexer)) != 1)
171 msg (SE, _("The %s string must contain exactly one "
172 "character."), "DELIMITER");
175 delimiter = ss_first (lex_tokss (lexer));
/* QUALIFIER: same single-byte restriction as DELIMITER. */
178 else if (lex_match_id (lexer, "QUALIFIER"))
180 lex_match (lexer, T_EQUALS);
181 if (!lex_force_string (lexer))
183 /* XXX should support multibyte UTF-8 qualifiers */
184 if (ss_length (lex_tokss (lexer)) != 1)
186 msg (SE, _("The %s string must contain exactly one "
187 "character."), "QUALIFIER");
190 qualifier = ss_first (lex_tokss (lexer));
/* DECIMAL: accepts DOT or COMMA.  The assignments themselves are not
   visible in this excerpt; presumably they set `decimal'. */
193 else if (lex_match_id (lexer, "DECIMAL"))
195 lex_match (lexer, T_EQUALS);
196 if (lex_match_id (lexer, "DOT"))
198 else if (lex_match_id (lexer, "COMMA"))
202 lex_error_expecting (lexer, "DOT", "COMMA");
/* FORMAT: PLAIN clears and VARIABLE sets use_print_formats. */
206 else if (lex_match_id (lexer, "FORMAT"))
208 lex_match (lexer, T_EQUALS);
209 if (lex_match_id (lexer, "PLAIN"))
210 use_print_formats = false;
211 else if (lex_match_id (lexer, "VARIABLE"))
212 use_print_formats = true;
215 lex_error_expecting (lexer, "PLAIN", "VARIABLE");
/* UNSELECTED: RETAIN sets and DELETE clears retain_unselected. */
223 else if (lex_match_id (lexer, "UNSELECTED"))
225 lex_match (lexer, T_EQUALS);
226 if (lex_match_id (lexer, "RETAIN"))
227 retain_unselected = true;
228 else if (lex_match_id (lexer, "DELETE"))
229 retain_unselected = false;
232 lex_error_expecting (lexer, "RETAIN", "DELETE");
/* Any other subcommand is handed to parse_dict_trim() together with the
   dictionary clone; a false return is treated as failure. */
236 else if (!parse_dict_trim (lexer, dict))
/* Post-parse validation: a missing TYPE or OUTFILE is reported.  The test
   guarding the TYPE message is not visible in this excerpt. */
242 lex_sbc_missing ("TYPE");
245 else if (handle == NULL)
247 lex_sbc_missing ("OUTFILE");
/* Refuse to write over an existing output file unless `replace' is set. */
250 else if (!replace && fn_exists (handle))
252 msg (SE, _("Output file `%s' exists but %s was not specified."),
253 fh_get_file_name (handle), "REPLACE");
/* Finalize the dictionary clone before it is given to the writer. */
257 dict_delete_scratch_vars (dict);
258 dict_compact_values (dict);
/* Copy the parsed settings into the CSV writer options. */
260 csv_opts.recode_user_missing = recode_user_missing;
261 csv_opts.include_var_names = include_var_names;
262 csv_opts.use_value_labels = use_value_labels;
263 csv_opts.use_print_formats = use_print_formats;
264 csv_opts.decimal = decimal;
/* Delimiter precedence: an explicit nonzero delimiter wins; otherwise a
   tab for TAB_FILE; otherwise a comma when the decimal point is '.'.  The
   final alternative is not visible in this excerpt. */
265 csv_opts.delimiter = (delimiter ? delimiter
266 : type == TAB_FILE ? '\t'
267 : decimal == '.' ? ','
269 csv_opts.qualifier = qualifier;
271 writer = csv_writer_open (handle, dict, &csv_opts);
/* Turn the stage into a case map, release the stage, and wrap the CSV
   writer in an output translator built from that map. */
276 map = case_map_stage_get_case_map (stage);
277 case_map_stage_destroy (stage);
279 writer = case_map_create_output_translator (map, writer);
/* Transfer the cases read from the procedure to the writer.  The
   filtering argument is the negation of retain_unselected. */
282 casereader_transfer (proc_open_filtering (ds, !retain_unselected), writer);
/* Success requires both casewriter_destroy() and proc_commit() to report
   success; proc_commit() is called regardless of the first result. */
283 ok = casewriter_destroy (writer);
284 ok = proc_commit (ds) && ok;
286 return ok ? CMD_SUCCESS : CMD_CASCADING_FAILURE;
/* Cleanup after the successful return above.  NOTE(review): presumably
   the error-exit path; its label, any further cleanup and the failure
   return are not visible in this excerpt. */
289 case_map_stage_destroy (stage);
292 case_map_destroy (map);