X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=src%2Flanguage%2Fstats%2Ffriedman.c;h=55e42489f4e3a420790c7184c432b1968d5f17af;hb=ee254a81d976fae12a67e799a4aedee47c6b0bed;hp=319648527df41386af33587e0b546db1a32c46c5;hpb=2c327bbf83aee01efec9a44157521888e34f81f5;p=pspp diff --git a/src/language/stats/friedman.c b/src/language/stats/friedman.c index 319648527d..55e42489f4 100644 --- a/src/language/stats/friedman.c +++ b/src/language/stats/friedman.c @@ -1,5 +1,5 @@ /* PSPP - a program for statistical analysis. -*-c-*- - Copyright (C) 2010 Free Software Foundation, Inc. + Copyright (C) 2010, 2011 Free Software Foundation, Inc. This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by @@ -17,22 +17,22 @@ #include -#include "friedman.h" +#include "language/stats/friedman.h" #include #include -#include - -#include -#include -#include -#include -#include -#include - +#include "data/casereader.h" +#include "data/dataset.h" +#include "data/dictionary.h" +#include "data/format.h" +#include "data/variable.h" +#include "libpspp/message.h" +#include "libpspp/misc.h" +#include "output/pivot-table.h" #include "gettext.h" +#define N_(msgid) msgid #define _(msgid) gettext (msgid) @@ -41,16 +41,16 @@ struct friedman double *rank_sum; double cc; double chi_sq; + double w; const struct dictionary *dict; }; -static void show_ranks_box (const struct one_sample_test *ost, +static void show_ranks_box (const struct one_sample_test *ost, const struct friedman *fr); static void show_sig_box (const struct one_sample_test *ost, const struct friedman *fr); - struct datum { long posn; @@ -65,7 +65,7 @@ cmp_x (const void *a_, const void *b_) if (a->x < b->x) return -1; - + return (a->x > b->x); } @@ -77,17 +77,17 @@ cmp_posn (const void *a_, const void *b_) if (a->posn < b->posn) return -1; - + return (a->posn > b->posn); } void friedman_execute (const struct dataset *ds, - struct casereader *input, - enum mv_class exclude, - const struct npar_test *test, - bool exact UNUSED, - double timer UNUSED) + struct casereader *input, + enum mv_class exclude, + const struct npar_test *test, + bool exact UNUSED, + double timer UNUSED) { double numerator = 0.0; double denominator = 0.0; @@ -96,45 +96,50 @@ friedman_execute (const struct dataset *ds, const struct dictionary *dict = dataset_dict (ds); const struct variable *weight = dict_get_weight (dict); - struct one_sample_test *ft = UP_CAST (test, struct one_sample_test, parent); + struct one_sample_test *ost = UP_CAST (test, struct one_sample_test, parent); + struct friedman_test *ft = UP_CAST (ost, struct friedman_test, parent); bool warn = true; - double sigma_t = 0.0; - struct datum *row = xcalloc (ft->n_vars, sizeof *row); - + double sigma_t = 0.0; + struct datum *row = XCALLOC (ost->n_vars, struct datum); + double rsq; struct friedman fr; - fr.rank_sum = xcalloc (ft->n_vars, sizeof *fr.rank_sum); + fr.rank_sum = xcalloc (ost->n_vars, sizeof *fr.rank_sum); fr.cc = 0.0; fr.dict = dict; - for (v = 0; v < ft->n_vars; ++v) + for (v = 0; v < ost->n_vars; ++v) { row[v].posn = v; fr.rank_sum[v] = 0.0; } input = casereader_create_filter_weight (input, dict, &warn, NULL); + input = casereader_create_filter_missing (input, + ost->vars, ost->n_vars, + exclude, 0, 0); + for (; (c = casereader_read (input)); case_unref (c)) { double prev_x = SYSMIS; int run_length = 0; - const double w = weight ? case_data (c, weight)->f: 1.0; + const double w = weight ? case_num (c, weight) : 1.0; fr.cc += w; - for (v = 0; v < ft->n_vars; ++v) + for (v = 0; v < ost->n_vars; ++v) { - const struct variable *var = ft->vars[v]; + const struct variable *var = ost->vars[v]; const union value *val = case_data (c, var); row[v].x = val->f; } - qsort (row, ft->n_vars, sizeof *row, cmp_x); - for (v = 0; v < ft->n_vars; ++v) + qsort (row, ost->n_vars, sizeof *row, cmp_x); + for (v = 0; v < ost->n_vars; ++v) { double x = row[v].x; /* Replace value by the Rank */ - if ( prev_x == x) + if (prev_x == x) { /* Deal with ties */ int i; @@ -150,144 +155,121 @@ friedman_execute (const struct dataset *ds, else { row[v].x = v + 1; - if ( run_length > 0) + if (run_length > 0) { double t = run_length + 1; - sigma_t += pow3 (t) - t; + sigma_t += w * (pow3 (t) - t); } run_length = 0; } prev_x = x; } - if ( run_length > 0) + if (run_length > 0) { double t = run_length + 1; - sigma_t += pow3 (t) - t; + sigma_t += w * (pow3 (t) - t); } - qsort (row, ft->n_vars, sizeof *row, cmp_posn); - - for (v = 0; v < ft->n_vars; ++v) - fr.rank_sum[v] += row[v].x; + qsort (row, ost->n_vars, sizeof *row, cmp_posn); + for (v = 0; v < ost->n_vars; ++v) + fr.rank_sum[v] += row[v].x * w; } casereader_destroy (input); free (row); - for (v = 0; v < ft->n_vars; ++v) + for (v = 0; v < ost->n_vars; ++v) { numerator += pow2 (fr.rank_sum[v]); } - numerator *= 12.0 / (fr.cc * ft->n_vars * ( ft->n_vars + 1)); - numerator -= 3 * fr.cc * ( ft->n_vars + 1); + rsq = numerator; + + numerator *= 12.0 / (fr.cc * ost->n_vars * (ost->n_vars + 1)); + numerator -= 3 * fr.cc * (ost->n_vars + 1); - denominator = 1 - sigma_t / ( fr.cc * ft->n_vars * ( pow2 (ft->n_vars) - 1)); + denominator = 1 - sigma_t / (fr.cc * ost->n_vars * (pow2 (ost->n_vars) - 1)); fr.chi_sq = numerator / denominator; - show_ranks_box (ft, &fr); + if (ft->kendalls_w) + { + fr.w = 12 * rsq ; + fr.w -= 3 * pow2 (fr.cc) * + ost->n_vars * pow2 (ost->n_vars + 1); + + fr.w /= pow2 (fr.cc) * (pow3 (ost->n_vars) - ost->n_vars) + - fr.cc * sigma_t; + } + else + fr.w = SYSMIS; - show_sig_box (ft, &fr); + show_ranks_box (ost, &fr); + show_sig_box (ost, &fr); free (fr.rank_sum); } -#include static void show_ranks_box (const struct one_sample_test *ost, const struct friedman *fr) { - const struct variable *weight = dict_get_weight (fr->dict); - const struct fmt_spec *wfmt = weight ? var_get_print_format (weight) : &F_8_0; - - int i; - const int row_headers = 1; - const int column_headers = 1; - struct tab_table *table = - tab_create (row_headers + 1, column_headers + ost->n_vars); - - tab_headers (table, row_headers, 0, column_headers, 0); - - tab_title (table, _("Ranks")); - - /* Vertical lines inside the box */ - tab_box (table, 1, 0, -1, TAL_1, - row_headers, 0, tab_nc (table) - 1, tab_nr (table) - 1 ); - - /* Box around the table */ - tab_box (table, TAL_2, TAL_2, -1, -1, - 0, 0, tab_nc (table) - 1, tab_nr (table) - 1 ); + struct pivot_table *table = pivot_table_create (N_("Ranks")); + pivot_dimension_create (table, PIVOT_AXIS_COLUMN, N_("Mean Rank"), + N_("Mean Rank"), PIVOT_RC_OTHER); - tab_text (table, 1, 0, 0, _("Mean Rank")); + struct pivot_dimension *variables = pivot_dimension_create ( + table, PIVOT_AXIS_ROW, N_("Variable")); - tab_hline (table, TAL_2, 0, tab_nc (table) - 1, column_headers); - tab_vline (table, TAL_2, row_headers, 0, tab_nr (table) - 1); - - for (i = 0 ; i < ost->n_vars ; ++i) + for (size_t i = 0 ; i < ost->n_vars ; ++i) { - tab_text (table, 0, row_headers + i, - TAB_LEFT, var_to_string (ost->vars[i])); + int row = pivot_category_create_leaf ( + variables->root, pivot_value_new_variable (ost->vars[i])); - tab_double (table, 1, row_headers + i, - 0, fr->rank_sum[i] / fr->cc, wfmt); + pivot_table_put2 (table, 0, row, + pivot_value_new_number (fr->rank_sum[i] / fr->cc)); } - tab_submit (table); + pivot_table_submit (table); } static void show_sig_box (const struct one_sample_test *ost, const struct friedman *fr) { - const struct variable *weight = dict_get_weight (fr->dict); - const struct fmt_spec *wfmt = weight ? var_get_print_format (weight) : &F_8_0; - - const int row_headers = 1; - const int column_headers = 0; - struct tab_table *table = - tab_create (row_headers + 1, column_headers + 4); - - tab_headers (table, row_headers, 0, column_headers, 0); - - tab_title (table, _("Test Statistics")); - - tab_text (table, 0, column_headers, - TAT_TITLE | TAB_LEFT , _("N")); - - tab_text (table, 0, 1 + column_headers, - TAT_TITLE | TAB_LEFT , _("Chi-Square")); - - tab_text (table, 0, 2 + column_headers, - TAT_TITLE | TAB_LEFT, _("df")); - - tab_text (table, 0, 3 + column_headers, - TAT_TITLE | TAB_LEFT, _("Asymp. Sig.")); - - /* Box around the table */ - tab_box (table, TAL_2, TAL_2, -1, -1, - 0, 0, tab_nc (table) - 1, tab_nr (table) - 1 ); - - - tab_hline (table, TAL_2, 0, tab_nc (table) -1, column_headers); - tab_vline (table, TAL_2, row_headers, 0, tab_nr (table) - 1); - - tab_double (table, 1, column_headers, - 0, fr->cc, wfmt); - - tab_double (table, 1, column_headers + 1, - 0, fr->chi_sq, 0); - - tab_double (table, 1, column_headers + 2, - 0, ost->n_vars - 1, &F_8_0); - - tab_double (table, 1, column_headers + 3, - 0, gsl_cdf_chisq_Q (fr->chi_sq, ost->n_vars - 1), - 0); - - tab_submit (table); + const struct friedman_test *ft = UP_CAST (ost, const struct friedman_test, parent); + + struct pivot_table *table = pivot_table_create (N_("Test Statistics")); + pivot_table_set_weight_var (table, dict_get_weight (fr->dict)); + + struct pivot_dimension *statistics = pivot_dimension_create ( + table, PIVOT_AXIS_ROW, N_("Statistics"), + N_("N"), PIVOT_RC_COUNT); + if (ft->kendalls_w) + pivot_category_create_leaves (statistics->root, N_("Kendall's W"), + PIVOT_RC_OTHER); + pivot_category_create_leaves (statistics->root, + N_("Chi-Square"), PIVOT_RC_OTHER, + N_("df"), PIVOT_RC_INTEGER, + N_("Asymp. Sig."), PIVOT_RC_SIGNIFICANCE); + + double entries[5]; + int n = 0; + + entries[n++] = fr->cc; + if (ft->kendalls_w) + entries[n++] = fr->w; + entries[n++] = fr->chi_sq; + entries[n++] = ost->n_vars - 1; + entries[n++] = gsl_cdf_chisq_Q (fr->chi_sq, ost->n_vars - 1); + assert (n <= sizeof entries / sizeof *entries); + + for (size_t i = 0; i < n; i++) + pivot_table_put1 (table, i, pivot_value_new_number (entries[i])); + + pivot_table_submit (table); }