X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=src%2Flanguage%2Fstats%2Foneway.q;h=ed0add5835e62691ab1009b286b864f2c90d51f9;hb=4f2f805c653f0dc901924944ea4c55309ff14d32;hp=9cdb7db5a098bb868fa72c8d89ed961956687d37;hpb=dcf9b154cbcaa35c3d8459a201b77eec8bcb30bd;p=pspp diff --git a/src/language/stats/oneway.q b/src/language/stats/oneway.q index 9cdb7db5a0..ed0add5835 100644 --- a/src/language/stats/oneway.q +++ b/src/language/stats/oneway.q @@ -1,7 +1,6 @@ /* PSPP - One way ANOVA. -*-c-*- Copyright (C) 1997-9, 2000 Free Software Foundation, Inc. -Author: John Darrington 2004 This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as @@ -19,30 +18,36 @@ Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */ #include + #include -#include "message.h" +#include #include #include -#include -#include "alloc.h" -#include "str.h" -#include "case.h" -#include "dictionary.h" -#include "command.h" -#include "lexer.h" -#include "message.h" -#include "magic.h" -#include "misc.h" -#include "table.h" -#include "manager.h" -#include "value-labels.h" -#include "variable.h" -#include "procedure.h" -#include "hash.h" -#include "casefile.h" -#include "group-proc.h" -#include "group.h" -#include "levene.h" + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include "sort-criteria.h" #include "gettext.h" #define _(msgid) gettext (msgid) @@ -52,17 +57,15 @@ Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA /* (specification) "ONEWAY" (oneway_): *^variables=custom; - +missing=miss:!analysis/listwise, - incl:include/!exclude; - contrast= double list; - statistics[st_]=descriptives,homogeneity. + missing=miss:!analysis/listwise, + incl:include/!exclude; + +contrast= double list; + +statistics[st_]=descriptives,homogeneity. */ /* (declarations) */ /* (functions) */ - - -static int bad_weight_warn = 1; +static bool bad_weight_warn = true; static struct cmd_oneway cmd; @@ -83,14 +86,12 @@ static struct hsh_table *global_group_hash ; /* The number of distinct values of the independent variable, when all missing values are disregarded */ -static int ostensible_number_of_groups=-1; - - -/* Function to use for testing for missing values */ -static is_missing_func *value_is_missing; +static int ostensible_number_of_groups = -1; -static bool run_oneway(const struct casefile *cf, void *_mode); +static bool run_oneway(const struct ccase *first, + const struct casefile *cf, + void *_mode, const struct dataset *); /* Routines to show the output tables */ @@ -110,20 +111,14 @@ void output_oneway(void); int -cmd_oneway(void) +cmd_oneway (struct lexer *lexer, struct dataset *ds) { int i; bool ok; - if ( !parse_oneway(&cmd) ) + if ( !parse_oneway (lexer, ds, &cmd, NULL) ) return CMD_FAILURE; - /* If /MISSING=INCLUDE is set, then user missing values are ignored */ - if (cmd.incl == ONEWAY_INCLUDE ) - value_is_missing = mv_is_value_system_missing; - else - value_is_missing = mv_is_value_missing; - /* What statistics were requested */ if ( cmd.sbc_statistics ) { @@ -143,7 +138,7 @@ cmd_oneway(void) } } - ok = multipass_procedure_with_splits (run_oneway, &cmd); + ok = multipass_procedure_with_splits (ds, run_oneway, &cmd); free (vars); free_oneway (&cmd); @@ -217,17 +212,19 @@ output_oneway(void) /* Parser for the variables sub command */ static int -oneway_custom_variables(struct cmd_oneway *cmd UNUSED) +oneway_custom_variables (struct lexer *lexer, + struct dataset *ds, struct cmd_oneway *cmd UNUSED, + void *aux UNUSED) { + struct dictionary *dict = dataset_dict (ds); - lex_match('='); + lex_match (lexer, '='); - if ((token != T_ID || dict_lookup_var (default_dict, tokid) == NULL) - && token != T_ALL) + if ((lex_token (lexer) != T_ID || dict_lookup_var (dict, lex_tokid (lexer)) == NULL) + && lex_token (lexer) != T_ALL) return 2; - - if (!parse_variables (default_dict, &vars, &n_vars, + if (!parse_variables (lexer, dict, &vars, &n_vars, PV_DUPLICATE | PV_NUMERIC | PV_NO_SCRATCH) ) { @@ -237,19 +234,17 @@ oneway_custom_variables(struct cmd_oneway *cmd UNUSED) assert(n_vars); - if ( ! lex_match(T_BY)) + if ( ! lex_match (lexer, T_BY)) return 2; - - indep_var = parse_variable(); + indep_var = parse_variable (lexer, dict); if ( !indep_var ) { - msg(SE,_("`%s' is not a variable name"),tokid); + msg(SE,_("`%s' is not a variable name"),lex_tokid (lexer)); return 0; } - return 1; } @@ -354,12 +349,11 @@ show_anova_table(void) } - tab_title (t, 0, _("ANOVA")); + tab_title (t, _("ANOVA")); tab_submit (t); - - } + /* Show the descriptives table */ static void show_descriptives(void) @@ -411,7 +405,7 @@ show_descriptives(void) tab_text (t, 9, 1, TAB_CENTER | TAT_TITLE, _("Maximum")); - tab_title (t, 0, _("Descriptives")); + tab_title (t, _("Descriptives")); row = 2; @@ -427,7 +421,8 @@ show_descriptives(void) const char *s = var_to_string(vars[v]); - struct group_statistics *const *gs_array = hsh_sort(gp->group_hash); + struct group_statistics *const *gs_array = + (struct group_statistics *const *) hsh_sort(gp->group_hash); int count = 0; tab_text (t, 0, row, TAB_LEFT | TAT_TITLE, s); @@ -439,7 +434,8 @@ show_descriptives(void) gs = gs_array[count]; tab_text (t, 1, row + count, - TAB_LEFT | TAT_TITLE ,value_to_string(&gs->id,indep_var)); + TAB_LEFT | TAT_TITLE, var_get_value_name(indep_var, + &gs->id)); /* Now fill in the numbers ... */ @@ -540,7 +536,7 @@ show_homogeneity(void) tab_text (t, 4, 0, TAB_CENTER | TAT_TITLE, _("Significance")); - tab_title (t, 0, _("Test of Homogeneity of Variances")); + tab_title (t, _("Test of Homogeneity of Variances")); for ( v=0 ; v < n_vars ; ++v ) { @@ -565,14 +561,12 @@ show_homogeneity(void) } tab_submit (t); - - } /* Show the contrast coefficients table */ static void -show_contrast_coeffs(short *bad_contrast) +show_contrast_coeffs (short *bad_contrast) { int n_cols = 2 + ostensible_number_of_groups; int n_rows = 2 + cmd.sbc_contrast; @@ -610,7 +604,7 @@ show_contrast_coeffs(short *bad_contrast) tab_vline(t, TAL_2, 2, 0, n_rows - 1); - tab_title (t, 0, _("Contrast Coefficients")); + tab_title (t, _("Contrast Coefficients")); tab_text (t, 0, 2, TAB_LEFT | TAT_TITLE, _("Contrast")); @@ -627,7 +621,7 @@ show_contrast_coeffs(short *bad_contrast) group_value = group_values[count]; tab_text (t, count + 2, 1, TAB_CENTER | TAT_TITLE, - value_to_string(group_value, indep_var)); + var_get_value_name (indep_var, group_value)); for (i = 0 ; i < cmd.sbc_contrast ; ++i ) { @@ -677,7 +671,7 @@ show_contrast_tests(short *bad_contrast) tab_vline(t, TAL_2, 3, 0, n_rows - 1); - tab_title (t, 0, _("Contrast Tests")); + tab_title (t, _("Contrast Tests")); tab_text (t, 2, 0, TAB_CENTER | TAT_TITLE, _("Contrast")); tab_text (t, 3, 0, TAB_CENTER | TAT_TITLE, _("Value of Contrast")); @@ -873,7 +867,7 @@ precalc ( struct cmd_oneway *cmd UNUSED ) (hsh_compare_func *) compare_group, (hsh_hash_func *) hash_group, (hsh_free_func *) free_group, - (void *) indep_var->width ); + (void *) var_get_width (indep_var) ); totals->sum=0; @@ -887,51 +881,43 @@ precalc ( struct cmd_oneway *cmd UNUSED ) static bool -run_oneway(const struct casefile *cf, void *cmd_) +run_oneway(const struct ccase *first, const struct casefile *cf, + void *cmd_, const struct dataset *ds) { struct casereader *r; struct ccase c; + struct casefilter *filter = NULL; struct cmd_oneway *cmd = (struct cmd_oneway *) cmd_; + output_split_file_values (ds, first); + global_group_hash = hsh_create(4, (hsh_compare_func *) compare_values, (hsh_hash_func *) hash_value, 0, - (void *) indep_var->width ); + (void *) var_get_width (indep_var) ); + precalc(cmd); - for(r = casefile_get_reader (cf); + filter = casefilter_create ( (cmd->incl != ONEWAY_INCLUDE), + vars, n_vars ); + + for(r = casefile_get_reader (cf, filter); casereader_read (r, &c) ; case_destroy (&c)) { size_t i; const double weight = - dict_get_case_weight(default_dict,&c,&bad_weight_warn); + dict_get_case_weight (dataset_dict (ds), &c, &bad_weight_warn); - const union value *indep_val = case_data (&c, indep_var->fv); + const union value *indep_val; - /* Deal with missing values */ - if ( value_is_missing(&indep_var->miss, indep_val) ) + if ( casefilter_variable_missing (filter, &c, indep_var)) continue; - /* Skip the entire case if /MISSING=LISTWISE is set */ - if ( cmd->miss == ONEWAY_LISTWISE ) - { - for(i = 0; i < n_vars ; ++i) - { - const struct variable *v = vars[i]; - const union value *val = case_data (&c, v->fv); - - if (value_is_missing(&v->miss, val) ) - break; - } - if ( i != n_vars ) - continue; - - } - + indep_val = case_data (&c, indep_var); hsh_insert ( global_group_hash, (void *) indep_val ); @@ -939,7 +925,7 @@ run_oneway(const struct casefile *cf, void *cmd_) { const struct variable *v = vars[i]; - const union value *val = case_data (&c, v->fv); + const union value *val = case_data (&c, v); struct group_proc *gp = group_proc_get (vars[i]); struct hsh_table *group_hash = gp->group_hash; @@ -961,8 +947,8 @@ run_oneway(const struct casefile *cf, void *cmd_) hsh_insert ( group_hash, (void *) gs ); } - - if (! value_is_missing(&v->miss, val) ) + + if (! casefilter_variable_missing (filter, &c, v)) { struct group_statistics *totals = &gp->ugs; @@ -991,15 +977,17 @@ run_oneway(const struct casefile *cf, void *cmd_) } } + casereader_destroy (r); postcalc(cmd); if ( stat_tables & STAT_HOMO ) - levene(cf, indep_var, n_vars, vars, - (cmd->miss == ONEWAY_LISTWISE) ? LEV_LISTWISE : LEV_ANALYSIS , - value_is_missing); + levene (dataset_dict (ds), cf, indep_var, n_vars, vars, + filter); + + casefilter_destroy (filter); ostensible_number_of_groups = hsh_count (global_group_hash);