X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=src%2Flanguage%2Fstats%2Foneway.q;h=9b45119f8664f1ae948a5bfc838479fa8115f921;hb=f4810d3c8656b3b3ab26303d2dae70fc361db7fb;hp=9837d4ceb7ad6c5ec06c82014c8051829d034f37;hpb=8444d8d47de5e5f8d076b6f43f73c2c29494031e;p=pspp diff --git a/src/language/stats/oneway.q b/src/language/stats/oneway.q index 9837d4ceb7..9b45119f86 100644 --- a/src/language/stats/oneway.q +++ b/src/language/stats/oneway.q @@ -1,7 +1,6 @@ /* PSPP - One way ANOVA. -*-c-*- -Copyright (C) 1997-9, 2000 Free Software Foundation, Inc. -Author: John Darrington 2004 +Copyright (C) 1997-9, 2000, 2007 Free Software Foundation, Inc. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as @@ -19,31 +18,36 @@ Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */ #include + #include -#include +#include #include #include -#include -#include -#include + #include +#include #include +#include +#include +#include +#include #include -#include +#include #include -#include +#include +#include +#include #include +#include +#include #include -#include -#include -#include -#include -#include -#include -#include +#include #include #include #include +#include +#include +#include "sort-criteria.h" #include "gettext.h" #define _(msgid) gettext (msgid) @@ -53,29 +57,27 @@ Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA /* (specification) "ONEWAY" (oneway_): *^variables=custom; - +missing=miss:!analysis/listwise, - incl:include/!exclude; - contrast= double list; - statistics[st_]=descriptives,homogeneity. + missing=miss:!analysis/listwise, + incl:include/!exclude; + +contrast= double list; + +statistics[st_]=descriptives,homogeneity. */ /* (declarations) */ /* (functions) */ - - -static int bad_weight_warn = 1; +static bool bad_weight_warn = true; static struct cmd_oneway cmd; /* The independent variable */ -static struct variable *indep_var; +static const struct variable *indep_var; /* Number of dependent variables */ static size_t n_vars; /* The dependent variables */ -static struct variable **vars; +static const struct variable **vars; /* A hash table containing all the distinct values of the independent @@ -84,14 +86,12 @@ static struct hsh_table *global_group_hash ; /* The number of distinct values of the independent variable, when all missing values are disregarded */ -static int ostensible_number_of_groups=-1; - +static int ostensible_number_of_groups = -1; -/* Function to use for testing for missing values */ -static is_missing_func *value_is_missing; - -static bool run_oneway(const struct casefile *cf, void *_mode); +static bool run_oneway(const struct ccase *first, + const struct casefile *cf, + void *_mode, const struct dataset *); /* Routines to show the output tables */ @@ -111,20 +111,14 @@ void output_oneway(void); int -cmd_oneway(void) +cmd_oneway (struct lexer *lexer, struct dataset *ds) { int i; bool ok; - if ( !parse_oneway(&cmd) ) + if ( !parse_oneway (lexer, ds, &cmd, NULL) ) return CMD_FAILURE; - /* If /MISSING=INCLUDE is set, then user missing values are ignored */ - if (cmd.incl == ONEWAY_INCLUDE ) - value_is_missing = mv_is_value_system_missing; - else - value_is_missing = mv_is_value_missing; - /* What statistics were requested */ if ( cmd.sbc_statistics ) { @@ -144,7 +138,7 @@ cmd_oneway(void) } } - ok = multipass_procedure_with_splits (run_oneway, &cmd); + ok = multipass_procedure_with_splits (ds, run_oneway, &cmd); free (vars); free_oneway (&cmd); @@ -181,7 +175,8 @@ output_oneway(void) sum += subc_list_double_at(&cmd.dl_contrast[i],j); if ( sum != 0.0 ) - msg(SW,_("Coefficients for contrast %d do not total zero"),i + 1); + msg(SW,_("Coefficients for contrast %d do not total zero"), + (int) i + 1); } if ( stat_tables & STAT_DESC ) @@ -218,17 +213,19 @@ output_oneway(void) /* Parser for the variables sub command */ static int -oneway_custom_variables(struct cmd_oneway *cmd UNUSED) +oneway_custom_variables (struct lexer *lexer, + struct dataset *ds, struct cmd_oneway *cmd UNUSED, + void *aux UNUSED) { + struct dictionary *dict = dataset_dict (ds); - lex_match('='); + lex_match (lexer, '='); - if ((token != T_ID || dict_lookup_var (default_dict, tokid) == NULL) - && token != T_ALL) + if ((lex_token (lexer) != T_ID || dict_lookup_var (dict, lex_tokid (lexer)) == NULL) + && lex_token (lexer) != T_ALL) return 2; - - if (!parse_variables (default_dict, &vars, &n_vars, + if (!parse_variables_const (lexer, dict, &vars, &n_vars, PV_DUPLICATE | PV_NUMERIC | PV_NO_SCRATCH) ) { @@ -238,19 +235,17 @@ oneway_custom_variables(struct cmd_oneway *cmd UNUSED) assert(n_vars); - if ( ! lex_match(T_BY)) + if ( ! lex_match (lexer, T_BY)) return 2; - - indep_var = parse_variable(); + indep_var = parse_variable (lexer, dict); if ( !indep_var ) { - msg(SE,_("`%s' is not a variable name"),tokid); + msg(SE,_("`%s' is not a variable name"),lex_tokid (lexer)); return 0; } - return 1; } @@ -357,10 +352,9 @@ show_anova_table(void) tab_title (t, _("ANOVA")); tab_submit (t); - - } + /* Show the descriptives table */ static void show_descriptives(void) @@ -428,7 +422,8 @@ show_descriptives(void) const char *s = var_to_string(vars[v]); - struct group_statistics *const *gs_array = hsh_sort(gp->group_hash); + struct group_statistics *const *gs_array = + (struct group_statistics *const *) hsh_sort(gp->group_hash); int count = 0; tab_text (t, 0, row, TAB_LEFT | TAT_TITLE, s); @@ -440,7 +435,8 @@ show_descriptives(void) gs = gs_array[count]; tab_text (t, 1, row + count, - TAB_LEFT | TAT_TITLE ,value_to_string(&gs->id,indep_var)); + TAB_LEFT | TAT_TITLE, var_get_value_name(indep_var, + &gs->id)); /* Now fill in the numbers ... */ @@ -566,14 +562,12 @@ show_homogeneity(void) } tab_submit (t); - - } /* Show the contrast coefficients table */ static void -show_contrast_coeffs(short *bad_contrast) +show_contrast_coeffs (short *bad_contrast) { int n_cols = 2 + ostensible_number_of_groups; int n_rows = 2 + cmd.sbc_contrast; @@ -628,7 +622,7 @@ show_contrast_coeffs(short *bad_contrast) group_value = group_values[count]; tab_text (t, count + 2, 1, TAB_CENTER | TAT_TITLE, - value_to_string(group_value, indep_var)); + var_get_value_name (indep_var, group_value)); for (i = 0 ; i < cmd.sbc_contrast ; ++i ) { @@ -874,7 +868,7 @@ precalc ( struct cmd_oneway *cmd UNUSED ) (hsh_compare_func *) compare_group, (hsh_hash_func *) hash_group, (hsh_free_func *) free_group, - (void *) indep_var->width ); + (void *) var_get_width (indep_var) ); totals->sum=0; @@ -886,53 +880,56 @@ precalc ( struct cmd_oneway *cmd UNUSED ) } } +static void +free_value (void *value_, const void *aux UNUSED) +{ + union value *value = value_; + free (value); +} static bool -run_oneway(const struct casefile *cf, void *cmd_) +run_oneway(const struct ccase *first, const struct casefile *cf, + void *cmd_, const struct dataset *ds) { struct casereader *r; struct ccase c; + struct casefilter *filter = NULL; struct cmd_oneway *cmd = (struct cmd_oneway *) cmd_; + output_split_file_values (ds, first); + global_group_hash = hsh_create(4, (hsh_compare_func *) compare_values, (hsh_hash_func *) hash_value, - 0, - (void *) indep_var->width ); + free_value, + (void *) var_get_width (indep_var) ); + precalc(cmd); - for(r = casefile_get_reader (cf); + filter = casefilter_create ( (cmd->incl != ONEWAY_INCLUDE + ? MV_ANY : MV_SYSTEM), + vars, n_vars ); + + for(r = casefile_get_reader (cf, filter); casereader_read (r, &c) ; case_destroy (&c)) { size_t i; const double weight = - dict_get_case_weight(default_dict,&c,&bad_weight_warn); - - const union value *indep_val = case_data (&c, indep_var->fv); + dict_get_case_weight (dataset_dict (ds), &c, &bad_weight_warn); - /* Deal with missing values */ - if ( value_is_missing(&indep_var->miss, indep_val) ) + const union value *indep_val; + void **p; + + if ( casefilter_variable_missing (filter, &c, indep_var)) continue; - /* Skip the entire case if /MISSING=LISTWISE is set */ - if ( cmd->miss == ONEWAY_LISTWISE ) - { - for(i = 0; i < n_vars ; ++i) - { - const struct variable *v = vars[i]; - const union value *val = case_data (&c, v->fv); - - if (value_is_missing(&v->miss, val) ) - break; - } - if ( i != n_vars ) - continue; - - } - + indep_val = case_data (&c, indep_var); + p = hsh_probe (global_group_hash, indep_val); + if (*p == NULL) + *p = value_dup (indep_val, var_get_width (indep_var)); hsh_insert ( global_group_hash, (void *) indep_val ); @@ -940,7 +937,7 @@ run_oneway(const struct casefile *cf, void *cmd_) { const struct variable *v = vars[i]; - const union value *val = case_data (&c, v->fv); + const union value *val = case_data (&c, v); struct group_proc *gp = group_proc_get (vars[i]); struct hsh_table *group_hash = gp->group_hash; @@ -962,8 +959,8 @@ run_oneway(const struct casefile *cf, void *cmd_) hsh_insert ( group_hash, (void *) gs ); } - - if (! value_is_missing(&v->miss, val) ) + + if (! casefilter_variable_missing (filter, &c, v)) { struct group_statistics *totals = &gp->ugs; @@ -992,15 +989,17 @@ run_oneway(const struct casefile *cf, void *cmd_) } } + casereader_destroy (r); postcalc(cmd); if ( stat_tables & STAT_HOMO ) - levene(cf, indep_var, n_vars, vars, - (cmd->miss == ONEWAY_LISTWISE) ? LEV_LISTWISE : LEV_ANALYSIS , - value_is_missing); + levene (dataset_dict (ds), cf, indep_var, n_vars, vars, + filter); + + casefilter_destroy (filter); ostensible_number_of_groups = hsh_count (global_group_hash);