1 /* PSPPIRE - a graphical user interface for PSPP.
2 Copyright (C) 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation
4 This program is free software: you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation, either version 3 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program. If not, see <http://www.gnu.org/licenses/>. */
19 #include "ui/gui/text-data-import-dialog.h"
23 #include <gtk-contrib/psppire-sheet.h>
29 #include "data/data-in.h"
30 #include "data/data-out.h"
31 #include "data/format-guesser.h"
32 #include "data/value-labels.h"
33 #include "language/data-io/data-parser.h"
34 #include "language/lexer/lexer.h"
35 #include "libpspp/assertion.h"
36 #include "libpspp/i18n.h"
37 #include "libpspp/line-reader.h"
38 #include "libpspp/message.h"
39 #include "ui/gui/checkbox-treeview.h"
40 #include "ui/gui/dialog-common.h"
41 #include "ui/gui/executor.h"
42 #include "ui/gui/helper.h"
43 #include "ui/gui/builder-wrapper.h"
44 #include "ui/gui/psppire-data-window.h"
45 #include "ui/gui/psppire-dialog.h"
46 #include "ui/gui/psppire-encoding-selector.h"
47 #include "ui/gui/psppire-empty-list-store.h"
48 #include "ui/gui/psppire-var-sheet.h"
49 #include "ui/gui/psppire-var-store.h"
50 #include "ui/gui/psppire-scanf.h"
51 #include "ui/syntax-gen.h"
54 #include "gl/intprops.h"
55 #include "gl/xalloc.h"
58 #define _(msgid) gettext (msgid)
59 #define N_(msgid) msgid
/* Forward declarations for the type and the static helpers that are
   used before their definitions further down. */
61 struct import_assistant;
63 static void apply_dict (const struct dictionary *, struct string *);
64 static char *generate_syntax (const struct import_assistant *);
/* NOTE(review): the parameter list of the next prototype is cut off in
   this view; the definition further down takes a GtkTreeView * as its
   second parameter. */
66 static void add_line_number_column (const struct import_assistant *,
68 /* Pops up the Text Data Import assistant. */
/* Entry point of the import assistant for data window DW: builds the
   assistant pages, runs a nested main loop until the assistant is
   finished, acts on the response and tears the pages down again. */
70 text_data_import_assistant (PsppireDataWindow *dw)
72 GtkWindow *parent_window = GTK_WINDOW (dw);
73 struct import_assistant *ia;
/* State for the whole assistant; xzalloc presumably returns zero-filled
   memory (gnulib) -- confirm. */
75 ia = xzalloc (sizeof *ia);
/* The handling of a failed init_file() is not visible in this view. */
76 if (!init_file (ia, parent_window))
/* NOTE(review): this looks like leftover debugging output; it prints the
   chosen file name to stdout on every run and should probably go. */
82 printf ("%s:%d %s\n", __FILE__, __LINE__, ia->file.file_name);
84 init_assistant (ia, parent_window);
/* Text files get the first-line and separators pages.
   NOTE(review): init_sheet_spec_page() is presumably the alternative
   branch for non-text files; the branch structure is not visible. */
85 if ( ia->file.type == FTYPE_TEXT)
88 init_first_line_page (ia);
89 init_separators_page (ia);
93 init_sheet_spec_page (ia);
96 init_formats_page (ia);
98 gtk_widget_show_all (GTK_WIDGET (ia->asst.assistant));
/* Run a private main loop; it blocks here until something calls
   g_main_loop_quit() on it (the caller of that is not in this view). */
100 ia->asst.main_loop = g_main_loop_new (NULL, false);
101 g_main_loop_run (ia->asst.main_loop);
102 g_main_loop_unref (ia->asst.main_loop);
/* Act on how the assistant was closed.  In both visible cases the
   syntax is generated, handed to a helper, and the helper's return
   value is passed to free(). */
104 switch (ia->asst.response)
106 case GTK_RESPONSE_APPLY:
107 free (execute_syntax_string (dw, generate_syntax (ia)));
109 case PSPPIRE_RESPONSE_PASTE:
110 free (paste_syntax_to_window (generate_syntax (ia)));
/* Tear down the pages, then the assistant itself. */
116 if ( ia->file.type == FTYPE_TEXT)
118 destroy_formats_page (ia);
119 destroy_separators_page (ia);
122 destroy_assistant (ia);
127 /* Emits PSPP syntax to S that applies the dictionary attributes
128 (such as missing values and value labels) of the variables in DICT. */
// Appends to S, for every variable in DICT, the syntax commands handled
// below: MISSING VALUES, VALUE LABELS, VARIABLE LABELS, VARIABLE LEVEL,
// VARIABLE ALIGNMENT and VARIABLE WIDTH.
131 apply_dict (const struct dictionary *dict, struct string *s)
133 size_t var_cnt = dict_get_var_cnt (dict);
136 for (i = 0; i < var_cnt; i++)
138 struct variable *var = dict_get_var (dict, i);
139 const char *name = var_get_name (var);
140 enum val_type type = var_get_type (var);
141 int width = var_get_width (var);
142 enum measure measure = var_get_measure (var);
143 enum alignment alignment = var_get_alignment (var);
144 const struct fmt_spec *format = var_get_print_format (var);
// Missing values: the discrete values come first, then the range (if
// any), all inside one parenthesized, comma-separated list.
146 if (var_has_missing_values (var))
148 const struct missing_values *mv = var_get_missing_values (var);
151 syntax_gen_pspp (s, "MISSING VALUES %ss (", name);
152 for (j = 0; j < mv_n_values (mv); j++)
155 ds_put_cstr (s, ", ");
156 syntax_gen_value (s, mv_get_value (mv, j), width, format);
159 if (mv_has_range (mv))
// A separator is written before the range when mv_has_value() is true,
// presumably meaning discrete values were emitted above.
162 if (mv_has_value (mv))
163 ds_put_cstr (s, ", ");
164 mv_get_range (mv, &low, &high);
165 syntax_gen_num_range (s, low, high, format);
167 ds_put_cstr (s, ").\n");
// Value labels: one "value label" pair per line, in the order given by
// val_labs_sorted().
169 if (var_has_value_labels (var))
171 const struct val_labs *vls = var_get_value_labels (var);
// NOTE(review): the release of the array returned by val_labs_sorted()
// is not visible in this view -- confirm it is freed after the loop.
172 const struct val_lab **labels = val_labs_sorted (vls);
173 size_t n_labels = val_labs_count (vls);
176 syntax_gen_pspp (s, "VALUE LABELS %ss", name);
// NOTE(review): this loop uses the name `i`, the same as the counter of
// the enclosing per-variable loop.  No inner declaration is visible in
// this view; confirm a block-local `size_t i` exists here, otherwise the
// outer loop counter is clobbered.
177 for (i = 0; i < n_labels; i++)
179 const struct val_lab *vl = labels[i];
180 ds_put_cstr (s, "\n ");
181 syntax_gen_value (s, &vl->value, width, format);
182 ds_put_byte (s, ' ');
183 syntax_gen_string (s, ss_cstr (val_lab_get_escaped_label (vl)));
186 ds_put_cstr (s, ".\n");
188 if (var_has_label (var))
189 syntax_gen_pspp (s, "VARIABLE LABELS %ss %sq.\n",
190 name, var_get_label (var));
// Level, alignment and display width are only written when they differ
// from the defaults reported by the var_default_* helpers.
191 if (measure != var_default_measure (type))
192 syntax_gen_pspp (s, "VARIABLE LEVEL %ss (%ss).\n",
194 (measure == MEASURE_NOMINAL ? "NOMINAL"
195 : measure == MEASURE_ORDINAL ? "ORDINAL"
197 if (alignment != var_default_alignment (type))
198 syntax_gen_pspp (s, "VARIABLE ALIGNMENT %ss (%ss).\n",
200 (alignment == ALIGN_LEFT ? "LEFT"
201 : alignment == ALIGN_CENTRE ? "CENTER"
203 if (var_get_display_width (var) != var_default_display_width (width))
204 syntax_gen_pspp (s, "VARIABLE WIDTH %ss (%d).\n",
205 name, var_get_display_width (var));
209 /* Generates and returns PSPP syntax to execute the import
210 operation described by IA. The caller must free the syntax. */
// Builds the import syntax for IA in a dynamic string.  For text files
// the visible subcommands are ENCODING, IMPORTCASES, ARRANGEMENT,
// FIRSTCASE, DELIMITERS, QUALIFIER, ESCAPE and VARIABLES, followed by
// the per-variable commands produced by apply_dict().  The command name
// itself and the handling of other file types are not visible here.
213 generate_syntax (const struct import_assistant *ia)
215 struct string s = DS_EMPTY_INITIALIZER;
217 if (ia->file.type == FTYPE_TEXT)
// The encoding is written unless it is unset or the literal "Auto".
226 if (ia->file.encoding && strcmp (ia->file.encoding, "Auto"))
227 syntax_gen_pspp (&s, " /ENCODING=%sq\n", ia->file.encoding);
// IMPORTCASES follows whichever button is active on the intro page:
// first N cases, a percentage, or everything.
228 if (gtk_toggle_button_get_active (GTK_TOGGLE_BUTTON (
229 ia->intro.n_cases_button)))
230 ds_put_format (&s, " /IMPORTCASES=FIRST %d\n",
231 gtk_spin_button_get_value_as_int (
232 GTK_SPIN_BUTTON (ia->intro.n_cases_spin)));
233 else if (gtk_toggle_button_get_active (GTK_TOGGLE_BUTTON (
234 ia->intro.percent_button)))
235 ds_put_format (&s, " /IMPORTCASES=PERCENT %d\n",
236 gtk_spin_button_get_value_as_int (
237 GTK_SPIN_BUTTON (ia->intro.percent_spin)));
239 ds_put_cstr (&s, " /IMPORTCASES=ALL\n");
241 " /ARRANGEMENT=DELIMITED\n"
// FIRSTCASE is one past the number of skipped lines.
243 if (ia->first_line.skip_lines > 0)
244 ds_put_format (&s, " /FIRSTCASE=%d\n", ia->first_line.skip_lines + 1);
// DELIMITERS: tab and backslash are written first as the two-character
// escapes \t and \\, then the remaining separators one by one.
245 ds_put_cstr (&s, " /DELIMITERS=\"");
246 if (ds_find_byte (&ia->separators.separators, '\t') != SIZE_MAX)
247 ds_put_cstr (&s, "\\t");
248 if (ds_find_byte (&ia->separators.separators, '\\') != SIZE_MAX)
249 ds_put_cstr (&s, "\\\\");
250 for (i = 0; i < ds_length (&ia->separators.separators); i++)
252 char c = ds_at (&ia->separators.separators, i);
// NOTE(review): the condition guarding the doubled quote below is not
// visible; presumably it tests for a double-quote separator -- confirm.
254 ds_put_cstr (&s, "\"\"");
// Tab and backslash were already handled above, so they are skipped.
255 else if (c != '\t' && c != '\\')
258 ds_put_cstr (&s, "\"\n");
// QUALIFIER needs a non-empty quote set; ESCAPE additionally needs the
// escape flag.
259 if (!ds_is_empty (&ia->separators.quotes))
260 syntax_gen_pspp (&s, " /QUALIFIER=%sq\n", ds_cstr (&ia->separators.quotes));
261 if (!ds_is_empty (&ia->separators.quotes) && ia->separators.escape)
262 ds_put_cstr (&s, " /ESCAPE\n");
263 ds_put_cstr (&s, " /VARIABLES=\n");
// One "name format" line per variable; the last line also carries the
// command-terminating period.
265 var_cnt = dict_get_var_cnt (ia->formats.dict);
266 for (i = 0; i < var_cnt; i++)
268 struct variable *var = dict_get_var (ia->formats.dict, i);
269 char format_string[FMT_STRING_LEN_MAX + 1];
270 fmt_to_string (var_get_print_format (var), format_string);
271 ds_put_format (&s, " %s %s%s\n",
272 var_get_name (var), format_string,
273 i == var_cnt - 1 ? "." : "");
276 apply_dict (ia->formats.dict, &s);
// Forward declarations of the cell renderer and tooltip callbacks for
// the fields preview; both prototypes are only partly visible here.
293 static void render_input_cell (GtkTreeViewColumn *tree_column,
294 GtkCellRenderer *cell,
295 GtkTreeModel *model, GtkTreeIter *iter,
298 static gboolean on_query_input_tooltip (GtkWidget *widget, gint wx, gint wy,
299 gboolean keyboard_mode UNUSED,
301 struct import_assistant *);
305 /* Called to render one of the cells in the fields preview tree view. */
// Cell data function: shows the raw text of one input field, or marks
// the cell via "background-set" when the line has no such field.
308 render_input_cell (GtkTreeViewColumn *tree_column, GtkCellRenderer *cell,
309 GtkTreeModel *model, GtkTreeIter *iter,
312 struct import_assistant *ia = ia_;
313 struct substring field;
// The column index is stored as object data on the tree column (the key
// is not visible in this view).
317 column = GPOINTER_TO_INT (g_object_get_data (G_OBJECT (tree_column),
// Model rows start after the skipped lines, so add the offset back to
// index the stored contents.
319 row = empty_list_store_iter_to_row (iter) + ia->first_line.skip_lines;
320 field = ia->separators.columns[column].contents[row];
// A null string pointer marks a field that is absent from this line.
321 if (field.string != NULL)
// g_value_take_string() takes ownership of the freshly allocated copy,
// which g_value_unset() releases.
324 g_value_init (&text, G_TYPE_STRING);
325 g_value_take_string (&text, ss_xstrdup (field));
326 g_object_set_property (G_OBJECT (cell), "text", &text);
327 g_value_unset (&text);
328 g_object_set (cell, "background-set", FALSE, (void *) NULL);
// Remaining branch (only partly visible): turns the background on.
334 "background-set", TRUE,
// Forward declaration: the definition appears further down, among the
// shared utility functions.
339 get_tooltip_location (GtkWidget *widget, gint wx, gint wy,
340 const struct import_assistant *ia,
341 size_t *row, size_t *column);
344 /* Called to render a tooltip on one of the cells in the fields
345 preview tree view. */
/* "query-tooltip" handler for the fields preview.  The only tooltip it
   sets explains that the line has too few separators for this field. */
347 on_query_input_tooltip (GtkWidget *widget, gint wx, gint wy,
348 gboolean keyboard_mode UNUSED,
349 GtkTooltip *tooltip, struct import_assistant *ia)
/* Map the pointer position to a (row, column) pair; the action taken
   when that fails is not visible in this view. */
353 if (!get_tooltip_location (widget, wx, wy, ia, &row, &column))
/* NOTE(review): presumably returns without a tooltip when the field has
   contents; the statement under this test is not visible. */
356 if (ia->separators.columns[column].contents[row].string != NULL)
359 gtk_tooltip_set_text (tooltip,
360 _("This input line has too few separators "
361 "to fill in this field."));
366 /* Parses the contents of the field at (ROW,COLUMN) according to
367 its variable format. If OUTPUTP is non-null, then *OUTPUTP
368 receives the formatted output for that field (which must be
369 freed with free). If TOOLTIPP is non-null, then *TOOLTIPP
370 receives a message suitable for use in a tooltip, if one is
371 needed, or a null pointer otherwise. Returns true if the field
372 was parsed without problems (no tooltip message is needed), otherwise false. */
/* Runs the raw field at (ROW, COLUMN) through data_in() using the
   variable's format, then formats the resulting value with data_out(). */
374 parse_field (struct import_assistant *ia,
375 size_t row, size_t column,
376 char **outputp, char **tooltipp)
378 struct substring field;
380 struct variable *var;
381 const struct fmt_spec *in;
386 field = ia->separators.columns[column].contents[row];
387 var = dict_get_var (ia->formats.dict, column);
388 value_init (&val, var_get_width (var));
/* The variable's print format serves as the input format; the output
   format is derived from it. */
389 in = var_get_print_format (var);
390 out = fmt_for_output_from_input (in);
/* A null string pointer marks a field that is absent from this line. */
392 if (field.string != NULL)
/* The field text is passed to data_in() as UTF-8. */
396 error = data_in (field, "UTF-8", in->type, &val, var_get_width (var),
397 dict_get_encoding (ia->formats.dict));
/* NOTE(review): presumably only reached when data_in() reported an
   error; the guarding test is not visible in this view. */
400 tooltip = xasprintf (_("Cannot parse field content `%.*s' as "
402 (int) field.length, field.string,
403 fmt_name (in->type), error);
/* Absent field: explain why and use the missing value instead. */
409 tooltip = xstrdup (_("This input line has too few separators "
410 "to fill in this field."));
411 value_set_missing (&val, var_get_width (var));
/* NOTE(review): presumably guarded by a null check on OUTPUTP, since one
   visible caller passes NULL -- confirm. */
415 *outputp = data_out (&val, dict_get_encoding (ia->formats.dict), &out);
417 value_destroy (&val, var_get_width (var));
/* `ok' is true exactly when no tooltip message was produced. */
419 ok = tooltip == NULL;
420 if (tooltipp != NULL)
427 /* Called to render one of the cells in the data preview tree view. */
// Cell data function: shows the field as parse_field() formats it and
// sets "background-set" on the cell (FALSE in one branch, TRUE in the
// other; the branch conditions are not visible in this view).
430 render_output_cell (GtkTreeViewColumn *tree_column,
431 GtkCellRenderer *cell,
436 struct import_assistant *ia = ia_;
438 GValue gvalue = { 0, };
// Row: model row plus the skipped lines.  Column: the index stored as
// object data on the tree column.
441 ok = parse_field (ia,
442 (empty_list_store_iter_to_row (iter)
443 + ia->first_line.skip_lines),
444 GPOINTER_TO_INT (g_object_get_data (G_OBJECT (tree_column),
// g_value_take_string() takes ownership of `output', which
// g_value_unset() then releases.
448 g_value_init (&gvalue, G_TYPE_STRING);
449 g_value_take_string (&gvalue, output);
450 g_object_set_property (G_OBJECT (cell), "text", &gvalue);
451 g_value_unset (&gvalue);
454 g_object_set (cell, "background-set", FALSE, (void *) NULL);
458 "background-set", TRUE,
462 /* Called to render a tooltip for one of the cells in the data
463 preview tree view. */
/* "query-tooltip" handler for the data preview: re-parses the field
   under the pointer and shows the message that parse_field() produced. */
465 on_query_output_tooltip (GtkWidget *widget, gint wx, gint wy,
466 gboolean keyboard_mode UNUSED,
467 GtkTooltip *tooltip, struct import_assistant *ia)
472 if (!get_tooltip_location (widget, wx, wy, ia, &row, &column))
/* No formatted output is requested (NULL); only the tooltip text is.
   NOTE(review): presumably returns without a tooltip when parse_field()
   reports success; the statement under this test is not visible. */
475 if (parse_field (ia, row, column, NULL, &text))
478 gtk_tooltip_set_text (tooltip, text);
483 /* Utility functions used by multiple pages of the assistant. */
/* Translates widget coordinates (WX, WY) in tree view WIDGET into a data
   position: *COLUMN receives the column index stored on the tree column,
   *ROW the model row plus the number of skipped lines. */
486 get_tooltip_location (GtkWidget *widget, gint wx, gint wy,
487 const struct import_assistant *ia,
488 size_t *row, size_t *column)
490 GtkTreeView *tree_view = GTK_TREE_VIEW (widget);
494 GtkTreeViewColumn *tree_column;
495 GtkTreeModel *tree_model;
498 /* Check that WIDGET is really visible on the screen before we
499 do anything else. This is a bug fix for a sticky situation:
500 when text_data_import_assistant() returns, it frees the data
501 necessary to compose the tool tip message, but there may be
502 a tool tip under preparation at that point (even if there is
503 no visible tool tip) that will call back into us a little
504 bit later. Perhaps the correct solution to this problem is
505 to make the data related to the tool tips part of a GObject
506 that only gets destroyed when all references are released,
507 but this solution appears to be effective too. */
508 if (!gtk_widget_get_mapped (widget))
/* Path lookup works in bin-window coordinates, so convert first. */
511 gtk_tree_view_convert_widget_to_bin_window_coords (tree_view,
513 if (!gtk_tree_view_get_path_at_pos (tree_view, bx, by,
514 &path, &tree_column, NULL, NULL))
517 *column = GPOINTER_TO_INT (g_object_get_data (G_OBJECT (tree_column),
/* Turn the path into an iterator; the path is freed here whether or not
   the lookup succeeded. */
520 tree_model = gtk_tree_view_get_model (tree_view);
521 ok = gtk_tree_model_get_iter (tree_model, &iter, path);
522 gtk_tree_path_free (path);
526 *row = empty_list_store_iter_to_row (&iter) + ia->first_line.skip_lines;
/* Creates a tree view in *TREE_VIEW backed by an empty list store with
   one row per file line from `first_line' onward, and gives it a line
   number column. */
531 make_tree_view (const struct import_assistant *ia,
533 GtkTreeView **tree_view)
537 *tree_view = GTK_TREE_VIEW (gtk_tree_view_new ());
538 model = GTK_TREE_MODEL (psppire_empty_list_store_new (
539 ia->file.line_cnt - first_line));
/* Attach the line array (offset to the first shown line) and the offset
   itself as object data on the model. */
540 g_object_set_data (G_OBJECT (model), "lines", ia->file.lines + first_line);
541 g_object_set_data (G_OBJECT (model), "first-line",
542 GINT_TO_POINTER (first_line));
/* Drop the local reference once the model is set on the view. */
543 gtk_tree_view_set_model (*tree_view, model);
544 g_object_unref (model);
546 add_line_number_column (ia, *tree_view);
/* Cell data function for the line number column: shows the model row
   plus the offset read from the model's object data. */
550 render_line_number (GtkTreeViewColumn *tree_column,
551 GtkCellRenderer *cell,
552 GtkTreeModel *tree_model,
556 gint row = empty_list_store_iter_to_row (iter);
/* INT_BUFSIZE_BOUND comes from gnulib's intprops.h; presumably it sizes
   the buffer for any `int' printed in decimal plus the terminator. */
557 char s[INT_BUFSIZE_BOUND (int)];
560 first_line = GPOINTER_TO_INT (g_object_get_data (G_OBJECT (tree_model),
562 sprintf (s, "%d", first_line + row);
563 g_object_set (cell, "text", s, NULL);
/* Appends a resizable, fixed-size "Line" column to TREEVIEW, rendered
   through render_line_number() with the assistant's proportional
   renderer. */
567 add_line_number_column (const struct import_assistant *ia,
568 GtkTreeView *treeview)
570 GtkTreeViewColumn *column;
572 column = gtk_tree_view_column_new_with_attributes (
573 _("Line"), ia->asst.prop_renderer, (void *) NULL);
574 gtk_tree_view_column_set_sizing (column, GTK_TREE_VIEW_COLUMN_FIXED);
/* The initial width is the one measured for a count of 5. */
575 gtk_tree_view_column_set_fixed_width (
576 column, get_monospace_width (treeview, ia->asst.prop_renderer, 5));
577 gtk_tree_view_column_set_resizable (column, TRUE);
578 gtk_tree_view_column_set_cell_data_func (column, ia->asst.prop_renderer,
579 render_line_number, NULL, NULL);
580 gtk_tree_view_append_column (treeview, column);
/* Measures the width RENDERER needs in TREEVIEW for a sample string made
   of `char_cnt' '0' characters followed by one space.  The rest of the
   parameter list is not visible in this view. */
584 get_monospace_width (GtkTreeView *treeview, GtkCellRenderer *renderer,
591 ds_put_byte_multiple (&s, '0', char_cnt);
592 ds_put_byte (&s, ' ');
593 width = get_string_width (treeview, renderer, ds_cstr (&s));
/* Measures the width RENDERER needs in TREEVIEW to show `string'.  Note
   the side effect: the renderer's "text" property is left set to that
   string. */
600 get_string_width (GtkTreeView *treeview, GtkCellRenderer *renderer,
604 g_object_set (G_OBJECT (renderer), "text", string, (void *) NULL);
/* Only the width is requested; every other output argument is NULL. */
605 gtk_cell_renderer_get_size (renderer, GTK_WIDGET (treeview),
606 NULL, NULL, NULL, &width, NULL);
/* Builds the tree view column for field or variable number DICT_IDX.
   With INPUT true the column shows raw fields (title and width from the
   separators page); otherwise it shows parsed values (title and width
   from the dictionary variable). */
611 make_data_column (struct import_assistant *ia, GtkTreeView *tree_view,
612 bool input, gint dict_idx)
614 struct variable *var = NULL;
615 struct column *column = NULL;
617 gint content_width, header_width;
618 GtkTreeViewColumn *tree_column;
/* NOTE(review): the next two assignments are presumably the two arms of
   a test on INPUT, since only one of `column'/`var' is used for a given
   INPUT below; the test itself is not visible. */
622 column = &ia->separators.columns[dict_idx];
624 var = dict_get_var (ia->formats.dict, dict_idx);
626 name = escape_underscores (input ? column->name : var_get_name (var));
627 char_cnt = input ? column->width : var_get_print_format (var)->w;
/* Contents are measured with the fixed renderer, the header with the
   proportional one. */
628 content_width = get_monospace_width (tree_view, ia->asst.fixed_renderer,
630 header_width = get_string_width (tree_view, ia->asst.prop_renderer,
633 tree_column = gtk_tree_view_column_new ();
/* Store the index on the column so the render and tooltip callbacks can
   recover it. */
634 g_object_set_data (G_OBJECT (tree_column), "column-number",
635 GINT_TO_POINTER (dict_idx));
636 gtk_tree_view_column_set_title (tree_column, name);
637 gtk_tree_view_column_pack_start (tree_column, ia->asst.fixed_renderer,
639 gtk_tree_view_column_set_cell_data_func (
640 tree_column, ia->asst.fixed_renderer,
641 input ? render_input_cell : render_output_cell, ia, NULL);
642 gtk_tree_view_column_set_sizing (tree_column, GTK_TREE_VIEW_COLUMN_FIXED);
643 gtk_tree_view_column_set_fixed_width (tree_column, MAX (content_width,
/* Creates a preview tree view, adds it to PARENT and shows it.  INPUT
   selects between the raw-field and the parsed-value callbacks for both
   cell rendering and tooltips. */
652 create_data_tree_view (bool input, GtkContainer *parent,
653 struct import_assistant *ia)
655 GtkTreeView *tree_view;
/* Rows start after the lines the user chose to skip. */
658 make_tree_view (ia, ia->first_line.skip_lines, &tree_view);
659 gtk_tree_selection_set_mode (gtk_tree_view_get_selection (tree_view),
/* One data column per column found on the separators page. */
662 for (i = 0; i < ia->separators.column_cnt; i++)
663 gtk_tree_view_append_column (tree_view,
664 make_data_column (ia, tree_view, input, i));
666 g_object_set (G_OBJECT (tree_view), "has-tooltip", TRUE, (void *) NULL);
667 g_signal_connect (tree_view, "query-tooltip",
668 G_CALLBACK (input ? on_query_input_tooltip
669 : on_query_output_tooltip), ia);
670 gtk_tree_view_set_fixed_height_mode (tree_view, true);
672 gtk_container_add (parent, GTK_WIDGET (tree_view));
673 gtk_widget_show (GTK_WIDGET (tree_view));
678 /* Increments the "watch cursor" level, setting the cursor for
679 the assistant window to a watch face to indicate to the user
680 that the ongoing operation may take some time. */
/* Bumps the nesting counter; only the transition from 0 to 1 actually
   changes the cursor. */
682 push_watch_cursor (struct import_assistant *ia)
684 if (++ia->asst.watch_cursor == 1)
686 GtkWidget *widget = GTK_WIDGET (ia->asst.assistant);
687 GdkDisplay *display = gtk_widget_get_display (widget);
688 GdkCursor *cursor = gdk_cursor_new_for_display (display, GDK_WATCH);
/* NOTE(review): `widget->window' reads the GtkWidget struct field
   directly; gtk_widget_get_window() is the accessor for it, and this
   file already uses an accessor of that kind (gtk_widget_get_mapped). */
689 gdk_window_set_cursor (widget->window, cursor);
/* The local cursor reference is dropped right after it is set. */
690 gdk_cursor_unref (cursor);
/* Flush the display; presumably so the cursor change shows up before
   the long-running work starts. */
691 gdk_display_flush (display);
695 /* Decrements the "watch cursor" level. If the level reaches
696 zero, the cursor is reset to its default shape. */
/* Drops the nesting counter; only the transition back to 0 changes the
   cursor. */
698 pop_watch_cursor (struct import_assistant *ia)
700 if (--ia->asst.watch_cursor == 0)
702 GtkWidget *widget = GTK_WIDGET (ia->asst.assistant);
/* A NULL cursor is passed to reset the window's cursor.
   NOTE(review): `widget->window' reads the GtkWidget struct field
   directly; gtk_widget_get_window() is the accessor for it. */
703 gdk_window_set_cursor (widget->window, NULL);