1 /* PSPP - a program for statistical analysis.
2 Copyright (C) 1997-9, 2000, 2007, 2009, 2010 Free Software Foundation, Inc.
4 This program is free software: you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation, either version 3 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program. If not, see <http://www.gnu.org/licenses/>. */
25 #include <data/dictionary.h>
26 #include <data/procedure.h>
27 #include <data/settings.h>
28 #include <libpspp/getl.h>
29 #include <language/command.h>
30 #include <language/lexer/lexer.h>
31 #include <language/lexer/variable-parser.h>
32 #include <libpspp/cast.h>
33 #include <libpspp/ll.h>
34 #include <libpspp/message.h>
35 #include <libpspp/misc.h>
36 #include <libpspp/pool.h>
37 #include <libpspp/str.h>
38 #include <data/variable.h>
44 #define _(msgid) gettext (msgid)
46 /* A line repeated by DO REPEAT. */
49 struct ll ll; /* In struct repeat_block line_list. */
50 const char *file_name; /* File name. */
51 int line_number; /* Line number. */
52 struct substring text; /* Contents. */
/* The kind of replacement text that a DO REPEAT macro expands to. */
enum repeat_macro_type
  {
    VAR_NAMES,          /* Replacements are variable names. */
    OTHER               /* Replacements are numbers or strings. */
  };
62 /* Describes one DO REPEAT macro. */
65 struct ll ll; /* In struct repeat_block macros. */
66 enum repeat_macro_type type; /* Types of replacements. */
67 struct substring name; /* Macro name. */
68 struct substring *replacements; /* Macro replacement. */
71 /* A DO REPEAT...END REPEAT block. */
74 struct getl_interface parent;
76 struct pool *pool; /* Pool used for storage. */
77 struct dataset *ds; /* The dataset for this block */
79 struct ll_list lines; /* Lines in buffer. */
80 struct ll *cur_line; /* Last line output. */
81 int loop_cnt; /* Number of loops. */
82 int loop_idx; /* Number of loops so far. */
84 struct ll_list macros; /* Table of macros. */
86 bool print; /* Print lines as executed? */
/* Command parsing. */
static bool parse_specification (struct lexer *, struct repeat_block *);
static bool parse_lines (struct lexer *, struct repeat_block *);
static void create_vars (struct repeat_block *);

/* Macro lookup. */
static struct repeat_macro *find_macro (struct repeat_block *,
                                        struct substring name);

/* Parsers for each kind of replacement list. */
static int parse_ids (struct lexer *, const struct dictionary *dict,
                      struct repeat_macro *, struct pool *);
static int parse_numbers (struct lexer *, struct repeat_macro *,
                          struct pool *);
static int parse_strings (struct lexer *, struct repeat_macro *,
                          struct pool *);

/* Callbacks installed in the block's struct getl_interface. */
static void do_repeat_filter (struct getl_interface *,
                              struct string *);
static bool do_repeat_read (struct getl_interface *,
                            struct string *);
static void do_repeat_close (struct getl_interface *);
static bool always_false (const struct getl_interface *);
static const char *do_repeat_name (const struct getl_interface *);
static int do_repeat_location (const struct getl_interface *);
115 cmd_do_repeat (struct lexer *lexer, struct dataset *ds)
117 struct repeat_block *block;
119 block = pool_create_container (struct repeat_block, pool);
121 ll_init (&block->lines);
122 block->cur_line = ll_null (&block->lines);
124 ll_init (&block->macros);
126 if (!parse_specification (lexer, block) || !parse_lines (lexer, block))
131 block->parent.read = do_repeat_read;
132 block->parent.close = do_repeat_close;
133 block->parent.filter = do_repeat_filter;
134 block->parent.interactive = always_false;
135 block->parent.name = do_repeat_name;
136 block->parent.location = do_repeat_location;
138 if (!ll_is_empty (&block->lines))
139 getl_include_source (lex_get_source_stream (lexer),
141 lex_current_syntax_mode (lexer),
142 lex_current_error_mode (lexer)
145 pool_destroy (block->pool);
150 pool_destroy (block->pool);
151 return CMD_CASCADING_FAILURE;
154 /* Parses the whole DO REPEAT command specification.
157 parse_specification (struct lexer *lexer, struct repeat_block *block)
159 struct substring first_name;
164 struct repeat_macro *macro;
165 struct dictionary *dict = dataset_dict (block->ds);
168 /* Get a stand-in variable name and make sure it's unique. */
169 if (!lex_force_id (lexer))
171 if (dict_lookup_var (dict, lex_tokcstr (lexer)))
172 msg (SW, _("Dummy variable name `%s' hides dictionary variable `%s'."),
173 lex_tokcstr (lexer), lex_tokcstr (lexer));
174 if (find_macro (block, lex_tokss (lexer)))
176 msg (SE, _("Dummy variable name `%s' is given twice."),
177 lex_tokcstr (lexer));
181 /* Make a new macro. */
182 macro = pool_alloc (block->pool, sizeof *macro);
183 ss_alloc_substring_pool (¯o->name, lex_tokss (lexer), block->pool);
184 ll_push_tail (&block->macros, ¯o->ll);
186 /* Skip equals sign. */
188 if (!lex_force_match (lexer, T_EQUALS))
191 /* Get the details of the variable's possible values. */
192 if (lex_token (lexer) == T_ID)
193 count = parse_ids (lexer, dict, macro, block->pool);
194 else if (lex_is_number (lexer))
195 count = parse_numbers (lexer, macro, block->pool);
196 else if (lex_is_string (lexer))
197 count = parse_strings (lexer, macro, block->pool);
200 lex_error (lexer, NULL);
205 if (lex_token (lexer) != T_SLASH && lex_token (lexer) != T_ENDCMD)
207 lex_error (lexer, NULL);
211 /* If this is the first variable then it defines how many
212 replacements there must be; otherwise enforce this number of
214 if (block->loop_cnt == 0)
216 block->loop_cnt = count;
217 first_name = macro->name;
219 else if (block->loop_cnt != count)
221 msg (SE, _("Dummy variable `%.*s' had %d "
222 "substitutions, so `%.*s' must also, but %d "
224 (int) ss_length (first_name), ss_data (first_name),
226 (int) ss_length (macro->name), ss_data (macro->name),
231 lex_match (lexer, T_SLASH);
233 while (lex_token (lexer) != T_ENDCMD);
238 /* Finds and returns a DO REPEAT macro with the given NAME, or
239 NULL if there is none */
240 static struct repeat_macro *
241 find_macro (struct repeat_block *block, struct substring name)
243 struct repeat_macro *macro;
245 ll_for_each (macro, struct repeat_macro, ll, &block->macros)
246 if (ss_equals (macro->name, name))
252 /* Advances LINE past white space and an identifier, if present.
253 Returns true if KEYWORD matches the identifer, false
256 recognize_keyword (struct substring *line, const char *keyword)
259 ss_ltrim (line, ss_cstr (CC_SPACES));
260 ss_get_bytes (line, lex_id_get_length (*line), &id);
261 return lex_id_match (ss_cstr (keyword), id);
264 /* Returns true if LINE contains a DO REPEAT command, false
267 recognize_do_repeat (struct substring line)
269 return (recognize_keyword (&line, "do")
270 && recognize_keyword (&line, "repeat"));
273 /* Returns true if LINE contains an END REPEAT command, false
274 otherwise. Sets *PRINT to true for END REPEAT PRINT, false
277 recognize_end_repeat (struct substring line, bool *print)
279 if (!recognize_keyword (&line, "end")
280 || !recognize_keyword (&line, "repeat"))
283 *print = recognize_keyword (&line, "print");
287 /* Read all the lines we are going to substitute, inside the DO
288 REPEAT...END REPEAT block. */
290 parse_lines (struct lexer *lexer, struct repeat_block *block)
292 char *previous_file_name;
295 previous_file_name = NULL;
300 const char *cur_file_name;
301 struct repeat_line *line;
303 bool command_ends_before_line, command_ends_after_line;
305 /* Retrieve an input line and make a copy of it. */
306 if (!lex_get_line_raw (lexer))
308 msg (SE, _("DO REPEAT without END REPEAT."));
311 ds_init_string (&text, lex_entire_line_ds (lexer));
313 /* Record file name. */
314 cur_file_name = getl_source_name (lex_get_source_stream (lexer));
315 if (cur_file_name != NULL &&
316 (previous_file_name == NULL
317 || !strcmp (cur_file_name, previous_file_name)))
318 previous_file_name = pool_strdup (block->pool, cur_file_name);
320 /* Create a line structure. */
321 line = pool_alloc (block->pool, sizeof *line);
322 line->file_name = previous_file_name;
323 line->line_number = getl_source_location (lex_get_source_stream (lexer));
324 ss_alloc_substring_pool (&line->text, ds_ss (&text), block->pool);
327 /* Check whether the line contains a DO REPEAT or END
329 lex_preprocess_line (&text,
330 lex_current_syntax_mode (lexer),
331 &command_ends_before_line,
332 &command_ends_after_line);
333 if (recognize_do_repeat (ds_ss (&text)))
335 if (settings_get_syntax () == COMPATIBLE)
336 msg (SE, _("DO REPEAT may not nest in compatibility mode."));
340 else if (recognize_end_repeat (ds_ss (&text), &block->print)
341 && nesting_level-- == 0)
343 lex_discard_line (lexer);
349 /* Add the line to the list. */
350 ll_push_tail (&block->lines, &line->ll);
354 /* Creates variables for the given DO REPEAT. */
356 create_vars (struct repeat_block *block)
358 struct repeat_macro *macro;
360 ll_for_each (macro, struct repeat_macro, ll, &block->macros)
361 if (macro->type == VAR_NAMES)
365 for (i = 0; i < block->loop_cnt; i++)
367 /* Ignore return value: if the variable already
368 exists there is no harm done. */
369 char *var_name = ss_xstrdup (macro->replacements[i]);
370 dict_create_var (dataset_dict (block->ds), var_name, 0);
376 /* Parses a set of ids for DO REPEAT. */
378 parse_ids (struct lexer *lexer, const struct dictionary *dict,
379 struct repeat_macro *macro, struct pool *pool)
384 macro->type = VAR_NAMES;
385 if (!parse_mixed_vars_pool (lexer, dict, pool, &replacements, &n, PV_NONE))
388 macro->replacements = pool_nalloc (pool, n, sizeof *macro->replacements);
389 for (i = 0; i < n; i++)
390 macro->replacements[i] = ss_cstr (replacements[i]);
394 /* Adds REPLACEMENT to MACRO's list of replacements, which has
395 *USED elements and has room for *ALLOCATED. Allocates memory
398 add_replacement (struct substring replacement,
399 struct repeat_macro *macro, struct pool *pool,
400 size_t *used, size_t *allocated)
402 if (*used == *allocated)
403 macro->replacements = pool_2nrealloc (pool, macro->replacements, allocated,
404 sizeof *macro->replacements);
405 macro->replacements[(*used)++] = replacement;
408 /* Parses a list or range of numbers for DO REPEAT. */
410 parse_numbers (struct lexer *lexer, struct repeat_macro *macro,
414 size_t allocated = 0;
417 macro->replacements = NULL;
421 bool integer_value_seen;
424 /* Parse A TO B into a, b. */
425 if (!lex_force_num (lexer))
428 if ( (integer_value_seen = lex_is_integer (lexer) ) )
429 a = lex_integer (lexer);
431 a = lex_number (lexer);
434 if (lex_token (lexer) == T_TO)
436 if ( !integer_value_seen )
438 msg (SE, _("Ranges may only have integer bounds"));
442 if (!lex_force_int (lexer))
444 b = lex_integer (lexer);
447 msg (SE, _("%g TO %g is an invalid range."), a, b);
455 for (i = a; i <= b; i++)
456 add_replacement (ss_cstr (pool_asprintf (pool, "%g", i)),
457 macro, pool, &used, &allocated);
459 lex_match (lexer, T_COMMA);
461 while (lex_token (lexer) != T_SLASH && lex_token (lexer) != T_ENDCMD);
466 /* Parses a list of strings for DO REPEAT. */
468 parse_strings (struct lexer *lexer, struct repeat_macro *macro, struct pool *pool)
471 size_t allocated = 0;
474 macro->replacements = NULL;
480 if (!lex_force_string (lexer))
482 msg (SE, _("String expected."));
486 string = lex_token_representation (lexer);
487 pool_register (pool, free, string);
488 add_replacement (ss_cstr (string), macro, pool, &used, &allocated);
491 lex_match (lexer, T_COMMA);
493 while (lex_token (lexer) != T_SLASH && lex_token (lexer) != T_ENDCMD);
499 cmd_end_repeat (struct lexer *lexer UNUSED, struct dataset *ds UNUSED)
501 msg (SE, _("No matching DO REPEAT."));
502 return CMD_CASCADING_FAILURE;
505 /* Finds a DO REPEAT macro with the given NAME and returns the
506 appropriate substitution if found, or NAME otherwise. */
507 static struct substring
508 find_substitution (struct repeat_block *block, struct substring name)
510 struct repeat_macro *macro = find_macro (block, name);
511 return macro ? macro->replacements[block->loop_idx] : name;
514 /* Makes appropriate DO REPEAT macro substitutions within the
517 do_repeat_filter (struct getl_interface *interface, struct string *line)
519 struct repeat_block *block
520 = UP_CAST (interface, struct repeat_block, parent);
521 bool in_apos, in_quote, dot;
522 struct substring input;
523 struct string output;
526 ds_init_empty (&output);
528 /* Strip trailing whitespace, check for & remove terminal dot. */
529 ds_rtrim (line, ss_cstr (CC_SPACES));
530 dot = ds_chomp (line, settings_get_endcmd ());
531 input = ds_ss (line);
532 in_apos = in_quote = false;
533 while ((c = ss_first (input)) != EOF)
535 if (c == '\'' && !in_quote)
537 else if (c == '"' && !in_apos)
538 in_quote = !in_quote;
540 if (in_quote || in_apos || !lex_is_id1 (c))
542 ds_put_byte (&output, c);
543 ss_advance (&input, 1);
548 ss_get_bytes (&input, lex_id_get_length (input), &id);
549 ds_put_substring (&output, find_substitution (block, id));
553 ds_put_byte (&output, settings_get_endcmd ());
555 ds_swap (line, &output);
556 ds_destroy (&output);
559 static struct repeat_line *
560 current_line (const struct getl_interface *interface)
562 struct repeat_block *block
563 = UP_CAST (interface, struct repeat_block, parent);
564 return (block->cur_line != ll_null (&block->lines)
565 ? ll_data (block->cur_line, struct repeat_line, ll)
569 /* Function called by getl to read a line. Puts the line in
570 OUTPUT and its syntax mode in *SYNTAX. Returns true if a line
571 was obtained, false if the source is exhausted. */
573 do_repeat_read (struct getl_interface *interface,
574 struct string *output)
576 struct repeat_block *block
577 = UP_CAST (interface, struct repeat_block, parent);
578 struct repeat_line *line;
580 block->cur_line = ll_next (block->cur_line);
581 if (block->cur_line == ll_null (&block->lines))
584 if (block->loop_idx >= block->loop_cnt)
587 block->cur_line = ll_head (&block->lines);
590 line = current_line (interface);
591 ds_assign_substring (output, line->text);
595 /* Frees a DO REPEAT block.
596 Called by getl to close out the DO REPEAT block. */
598 do_repeat_close (struct getl_interface *interface)
600 struct repeat_block *block
601 = UP_CAST (interface, struct repeat_block, parent);
602 pool_destroy (block->pool);
607 always_false (const struct getl_interface *i UNUSED)
612 /* Returns the name of the source file from which the previous
613 line was originally obtained, or a null pointer if none. */
615 do_repeat_name (const struct getl_interface *interface)
617 struct repeat_line *line = current_line (interface);
618 return line ? line->file_name : NULL;
621 /* Returns the line number in the source file from which the
622 previous line was originally obtained, or 0 if none. */
624 do_repeat_location (const struct getl_interface *interface)
626 struct repeat_line *line = current_line (interface);
627 return line ? line->line_number : 0;