X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=src%2Flanguage%2Fdictionary%2Fmissing-values.c;h=a369c2ea6999a802f00b9d8b723f244d2f4a2ffe;hb=480832dcecdf63fa6f115ba3a09a1befd511f290;hp=e37fa987deddfb3dd642b777d8582a1fd3070d75;hpb=81fff61a96bece351e381ad3fef8ab1248a952ba;p=pspp diff --git a/src/language/dictionary/missing-values.c b/src/language/dictionary/missing-values.c index e37fa987de..a369c2ea69 100644 --- a/src/language/dictionary/missing-values.c +++ b/src/language/dictionary/missing-values.c @@ -1,156 +1,168 @@ -/* PSPP - computes sample statistics. - Copyright (C) 1997-9, 2000 Free Software Foundation, Inc. - Written by Ben Pfaff . +/* PSPP - a program for statistical analysis. + Copyright (C) 1997-9, 2000, 2006, 2009, 2010, 2011, 2013 Free Software Foundation, Inc. - This program is free software; you can redistribute it and/or - modify it under the terms of the GNU General Public License as - published by the Free Software Foundation; either version 2 of the - License, or (at your option) any later version. + This program is free software: you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation, either version 3 of the License, or + (at your option) any later version. - This program is distributed in the hope that it will be useful, but - WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU - General Public License for more details. + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. You should have received a copy of the GNU General Public License - along with this program; if not, write to the Free Software - Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA - 02110-1301, USA. */ + along with this program. If not, see . */ #include #include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include +#include "data/data-in.h" +#include "data/dictionary.h" +#include "data/dataset.h" +#include "data/format.h" +#include "data/missing-values.h" +#include "data/value.h" +#include "data/variable.h" +#include "language/command.h" +#include "language/lexer/lexer.h" +#include "language/lexer/value-parser.h" +#include "language/lexer/variable-parser.h" +#include "libpspp/i18n.h" +#include "libpspp/message.h" +#include "libpspp/str.h" #include "gettext.h" #define _(msgid) gettext (msgid) int -cmd_missing_values (void) +cmd_missing_values (struct lexer *lexer, struct dataset *ds) { - struct variable **v; + struct dictionary *dict = dataset_dict (ds); + struct variable **v = NULL; size_t nv; - int retval = CMD_FAILURE; - bool deferred_errors = false; + bool ok = true; - while (token != '.') + while (lex_token (lexer) != T_ENDCMD) { size_t i; - if (!parse_variables (default_dict, &v, &nv, PV_NONE)) - goto done; + if (!parse_variables (lexer, dict, &v, &nv, PV_NONE)) + goto error; - if (!lex_match ('(')) - { - lex_error (_("expecting `('")); - goto done; - } + if (!lex_force_match (lexer, T_LPAREN)) + goto error; for (i = 0; i < nv; i++) - mv_init (&v[i]->miss, v[i]->width); + var_clear_missing_values (v[i]); - if (!lex_match (')')) + if (!lex_match (lexer, T_RPAREN)) { struct missing_values mv; for (i = 0; i < nv; i++) - if (v[i]->type != v[0]->type) + if (var_get_type (v[i]) != var_get_type (v[0])) { - const struct variable *n = v[0]->type == NUMERIC ? v[0] : v[i]; - const struct variable *s = v[0]->type == NUMERIC ? v[i] : v[0]; + const struct variable *n = var_is_numeric (v[0]) ? v[0] : v[i]; + const struct variable *s = var_is_numeric (v[0]) ? v[i] : v[0]; msg (SE, _("Cannot mix numeric variables (e.g. %s) and " "string variables (e.g. %s) within a single list."), - n->name, s->name); - goto done; + var_get_name (n), var_get_name (s)); + goto error; } - if (v[0]->type == NUMERIC) + if (var_is_numeric (v[0])) { mv_init (&mv, 0); - while (!lex_match (')')) + while (!lex_match (lexer, T_RPAREN)) { + enum fmt_type type = var_get_print_format (v[0])->type; double x, y; bool ok; - if (!parse_num_range (&x, &y, &v[0]->print)) - goto done; - + if (!parse_num_range (lexer, &x, &y, &type)) + goto error; + ok = (x == y ? mv_add_num (&mv, x) - : mv_add_num_range (&mv, x, y)); + : mv_add_range (&mv, x, y)); if (!ok) - deferred_errors = true; + ok = false; - lex_match (','); + lex_match (lexer, T_COMMA); } } - else + else { - mv_init (&mv, MAX_SHORT_STRING); - while (!lex_match (')')) + const char *encoding = dict_get_encoding (dict); + + mv_init (&mv, MV_MAX_STRING); + while (!lex_match (lexer, T_RPAREN)) { - if (!lex_force_string ()) - { - deferred_errors = true; - break; - } + const char *utf8_s; + size_t utf8_trunc_len; + size_t utf8_len; - if (ds_length (&tokstr) > MAX_SHORT_STRING) + char *raw_s; + + if (!lex_force_string (lexer)) { - ds_truncate (&tokstr, MAX_SHORT_STRING); - msg (SE, _("Truncating missing value to short string " - "length (%d characters)."), - MAX_SHORT_STRING); + ok = false; + break; } - else - ds_rpad (&tokstr, MAX_SHORT_STRING, ' '); - if (!mv_add_str (&mv, ds_data (&tokstr))) - deferred_errors = true; - - lex_get (); - lex_match (','); + /* Truncate the string to fit in 8 bytes in the dictionary + encoding. */ + utf8_s = lex_tokcstr (lexer); + utf8_len = ss_length (lex_tokss (lexer)); + utf8_trunc_len = utf8_encoding_trunc_len (utf8_s, encoding, + MV_MAX_STRING); + if (utf8_trunc_len < utf8_len) + msg (SE, _("Truncating missing value to maximum " + "acceptable length (%d bytes)."), + MV_MAX_STRING); + + /* Recode to dictionary encoding and add. */ + raw_s = recode_string (encoding, "UTF-8", + utf8_s, utf8_trunc_len); + if (!mv_add_str (&mv, CHAR_CAST (const uint8_t *, raw_s), + strlen (raw_s))) + ok = false; + free (raw_s); + + lex_get (lexer); + lex_match (lexer, T_COMMA); } } - - for (i = 0; i < nv; i++) + + for (i = 0; i < nv; i++) { - if (!mv_is_resizable (&mv, v[i]->width)) + if (mv_is_resizable (&mv, var_get_width (v[i]))) + var_set_missing_values (v[i], &mv); + else { msg (SE, _("Missing values provided are too long to assign " "to variable of width %d."), - v[i]->width); - deferred_errors = true; - } - else - { - mv_copy (&v[i]->miss, &mv); - mv_resize (&v[i]->miss, v[i]->width); + var_get_width (v[i])); + ok = false; } } + + mv_destroy (&mv); } - lex_match ('/'); + lex_match (lexer, T_SLASH); free (v); v = NULL; } - retval = lex_end_of_command (); - - done: + + free (v); + return ok ? CMD_SUCCESS : CMD_FAILURE; + +error: free (v); - if (deferred_errors) - retval = CMD_FAILURE; - return retval; + return CMD_FAILURE; }