X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=src%2Flanguage%2Fstats%2Ffriedman.c;h=55e42489f4e3a420790c7184c432b1968d5f17af;hb=ee254a81d976fae12a67e799a4aedee47c6b0bed;hp=4a0201e6ac112b3ecfbd5bbbfc0b856424939a71;hpb=50a07c54d38b3dc85db5c1318d67890e386710f9;p=pspp diff --git a/src/language/stats/friedman.c b/src/language/stats/friedman.c index 4a0201e6ac..55e42489f4 100644 --- a/src/language/stats/friedman.c +++ b/src/language/stats/friedman.c @@ -1,5 +1,5 @@ /* PSPP - a program for statistical analysis. -*-c-*- - Copyright (C) 2010 Free Software Foundation, Inc. + Copyright (C) 2010, 2011 Free Software Foundation, Inc. This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by @@ -17,22 +17,22 @@ #include -#include "friedman.h" +#include "language/stats/friedman.h" #include #include -#include - -#include -#include -#include -#include -#include -#include - +#include "data/casereader.h" +#include "data/dataset.h" +#include "data/dictionary.h" +#include "data/format.h" +#include "data/variable.h" +#include "libpspp/message.h" +#include "libpspp/misc.h" +#include "output/pivot-table.h" #include "gettext.h" +#define N_(msgid) msgid #define _(msgid) gettext (msgid) @@ -41,16 +41,16 @@ struct friedman double *rank_sum; double cc; double chi_sq; + double w; const struct dictionary *dict; }; -static void show_ranks_box (const struct one_sample_test *ost, +static void show_ranks_box (const struct one_sample_test *ost, const struct friedman *fr); static void show_sig_box (const struct one_sample_test *ost, const struct friedman *fr); - struct datum { long posn; @@ -65,7 +65,7 @@ cmp_x (const void *a_, const void *b_) if (a->x < b->x) return -1; - + return (a->x > b->x); } @@ -77,17 +77,17 @@ cmp_posn (const void *a_, const void *b_) if (a->posn < b->posn) return -1; - + return (a->posn > b->posn); } void friedman_execute (const struct dataset *ds, - struct casereader *input, - enum mv_class exclude, - const struct npar_test *test, - bool exact UNUSED, - double timer UNUSED) + struct casereader *input, + enum mv_class exclude, + const struct npar_test *test, + bool exact UNUSED, + double timer UNUSED) { double numerator = 0.0; double denominator = 0.0; @@ -96,17 +96,18 @@ friedman_execute (const struct dataset *ds, const struct dictionary *dict = dataset_dict (ds); const struct variable *weight = dict_get_weight (dict); - struct one_sample_test *ft = UP_CAST (test, struct one_sample_test, parent); + struct one_sample_test *ost = UP_CAST (test, struct one_sample_test, parent); + struct friedman_test *ft = UP_CAST (ost, struct friedman_test, parent); bool warn = true; - double sigma_t = 0.0; - struct datum *row = xcalloc (ft->n_vars, sizeof *row); - + double sigma_t = 0.0; + struct datum *row = XCALLOC (ost->n_vars, struct datum); + double rsq; struct friedman fr; - fr.rank_sum = xcalloc (ft->n_vars, sizeof *fr.rank_sum); + fr.rank_sum = xcalloc (ost->n_vars, sizeof *fr.rank_sum); fr.cc = 0.0; fr.dict = dict; - for (v = 0; v < ft->n_vars; ++v) + for (v = 0; v < ost->n_vars; ++v) { row[v].posn = v; fr.rank_sum[v] = 0.0; @@ -114,7 +115,7 @@ friedman_execute (const struct dataset *ds, input = casereader_create_filter_weight (input, dict, &warn, NULL); input = casereader_create_filter_missing (input, - ft->vars, ft->n_vars, + ost->vars, ost->n_vars, exclude, 0, 0); for (; (c = casereader_read (input)); case_unref (c)) @@ -122,23 +123,23 @@ friedman_execute (const struct dataset *ds, double prev_x = SYSMIS; int run_length = 0; - const double w = weight ? case_data (c, weight)->f: 1.0; + const double w = weight ? case_num (c, weight) : 1.0; fr.cc += w; - for (v = 0; v < ft->n_vars; ++v) + for (v = 0; v < ost->n_vars; ++v) { - const struct variable *var = ft->vars[v]; + const struct variable *var = ost->vars[v]; const union value *val = case_data (c, var); row[v].x = val->f; } - qsort (row, ft->n_vars, sizeof *row, cmp_x); - for (v = 0; v < ft->n_vars; ++v) + qsort (row, ost->n_vars, sizeof *row, cmp_x); + for (v = 0; v < ost->n_vars; ++v) { double x = row[v].x; /* Replace value by the Rank */ - if ( prev_x == x) + if (prev_x == x) { /* Deal with ties */ int i; @@ -154,7 +155,7 @@ friedman_execute (const struct dataset *ds, else { row[v].x = v + 1; - if ( run_length > 0) + if (run_length > 0) { double t = run_length + 1; sigma_t += w * (pow3 (t) - t); @@ -163,131 +164,112 @@ friedman_execute (const struct dataset *ds, } prev_x = x; } - if ( run_length > 0) + if (run_length > 0) { double t = run_length + 1; - sigma_t += w * (pow3 (t) - t ); + sigma_t += w * (pow3 (t) - t); } - qsort (row, ft->n_vars, sizeof *row, cmp_posn); + qsort (row, ost->n_vars, sizeof *row, cmp_posn); - for (v = 0; v < ft->n_vars; ++v) + for (v = 0; v < ost->n_vars; ++v) fr.rank_sum[v] += row[v].x * w; } casereader_destroy (input); free (row); - for (v = 0; v < ft->n_vars; ++v) + for (v = 0; v < ost->n_vars; ++v) { numerator += pow2 (fr.rank_sum[v]); } - numerator *= 12.0 / (fr.cc * ft->n_vars * ( ft->n_vars + 1)); - numerator -= 3 * fr.cc * ( ft->n_vars + 1); + rsq = numerator; - denominator = 1 - sigma_t / ( fr.cc * ft->n_vars * ( pow2 (ft->n_vars) - 1)); + numerator *= 12.0 / (fr.cc * ost->n_vars * (ost->n_vars + 1)); + numerator -= 3 * fr.cc * (ost->n_vars + 1); + + denominator = 1 - sigma_t / (fr.cc * ost->n_vars * (pow2 (ost->n_vars) - 1)); fr.chi_sq = numerator / denominator; - show_ranks_box (ft, &fr); + if (ft->kendalls_w) + { + fr.w = 12 * rsq ; + fr.w -= 3 * pow2 (fr.cc) * + ost->n_vars * pow2 (ost->n_vars + 1); - show_sig_box (ft, &fr); + fr.w /= pow2 (fr.cc) * (pow3 (ost->n_vars) - ost->n_vars) + - fr.cc * sigma_t; + } + else + fr.w = SYSMIS; + + show_ranks_box (ost, &fr); + show_sig_box (ost, &fr); free (fr.rank_sum); } -#include static void show_ranks_box (const struct one_sample_test *ost, const struct friedman *fr) { - int i; - const int row_headers = 1; - const int column_headers = 1; - struct tab_table *table = - tab_create (row_headers + 1, column_headers + ost->n_vars); - - tab_headers (table, row_headers, 0, column_headers, 0); - - tab_title (table, _("Ranks")); - - /* Vertical lines inside the box */ - tab_box (table, 1, 0, -1, TAL_1, - row_headers, 0, tab_nc (table) - 1, tab_nr (table) - 1 ); - - /* Box around the table */ - tab_box (table, TAL_2, TAL_2, -1, -1, - 0, 0, tab_nc (table) - 1, tab_nr (table) - 1 ); - + struct pivot_table *table = pivot_table_create (N_("Ranks")); - tab_text (table, 1, 0, 0, _("Mean Rank")); + pivot_dimension_create (table, PIVOT_AXIS_COLUMN, N_("Mean Rank"), + N_("Mean Rank"), PIVOT_RC_OTHER); - tab_hline (table, TAL_2, 0, tab_nc (table) - 1, column_headers); - tab_vline (table, TAL_2, row_headers, 0, tab_nr (table) - 1); + struct pivot_dimension *variables = pivot_dimension_create ( + table, PIVOT_AXIS_ROW, N_("Variable")); - for (i = 0 ; i < ost->n_vars ; ++i) + for (size_t i = 0 ; i < ost->n_vars ; ++i) { - tab_text (table, 0, row_headers + i, - TAB_LEFT, var_to_string (ost->vars[i])); + int row = pivot_category_create_leaf ( + variables->root, pivot_value_new_variable (ost->vars[i])); - tab_double (table, 1, row_headers + i, - 0, fr->rank_sum[i] / fr->cc, 0); + pivot_table_put2 (table, 0, row, + pivot_value_new_number (fr->rank_sum[i] / fr->cc)); } - tab_submit (table); + pivot_table_submit (table); } static void show_sig_box (const struct one_sample_test *ost, const struct friedman *fr) { - const struct variable *weight = dict_get_weight (fr->dict); - const struct fmt_spec *wfmt = weight ? var_get_print_format (weight) : &F_8_0; - - const int row_headers = 1; - const int column_headers = 0; - struct tab_table *table = - tab_create (row_headers + 1, column_headers + 4); - - tab_headers (table, row_headers, 0, column_headers, 0); - - tab_title (table, _("Test Statistics")); - - tab_text (table, 0, column_headers, - TAT_TITLE | TAB_LEFT , _("N")); - - tab_text (table, 0, 1 + column_headers, - TAT_TITLE | TAB_LEFT , _("Chi-Square")); - - tab_text (table, 0, 2 + column_headers, - TAT_TITLE | TAB_LEFT, _("df")); - - tab_text (table, 0, 3 + column_headers, - TAT_TITLE | TAB_LEFT, _("Asymp. Sig.")); - - /* Box around the table */ - tab_box (table, TAL_2, TAL_2, -1, -1, - 0, 0, tab_nc (table) - 1, tab_nr (table) - 1 ); - - - tab_hline (table, TAL_2, 0, tab_nc (table) -1, column_headers); - tab_vline (table, TAL_2, row_headers, 0, tab_nr (table) - 1); - - tab_double (table, 1, column_headers, - 0, fr->cc, wfmt); - - tab_double (table, 1, column_headers + 1, - 0, fr->chi_sq, 0); - - tab_double (table, 1, column_headers + 2, - 0, ost->n_vars - 1, &F_8_0); - - tab_double (table, 1, column_headers + 3, - 0, gsl_cdf_chisq_Q (fr->chi_sq, ost->n_vars - 1), - 0); - - tab_submit (table); + const struct friedman_test *ft = UP_CAST (ost, const struct friedman_test, parent); + + struct pivot_table *table = pivot_table_create (N_("Test Statistics")); + pivot_table_set_weight_var (table, dict_get_weight (fr->dict)); + + struct pivot_dimension *statistics = pivot_dimension_create ( + table, PIVOT_AXIS_ROW, N_("Statistics"), + N_("N"), PIVOT_RC_COUNT); + if (ft->kendalls_w) + pivot_category_create_leaves (statistics->root, N_("Kendall's W"), + PIVOT_RC_OTHER); + pivot_category_create_leaves (statistics->root, + N_("Chi-Square"), PIVOT_RC_OTHER, + N_("df"), PIVOT_RC_INTEGER, + N_("Asymp. Sig."), PIVOT_RC_SIGNIFICANCE); + + double entries[5]; + int n = 0; + + entries[n++] = fr->cc; + if (ft->kendalls_w) + entries[n++] = fr->w; + entries[n++] = fr->chi_sq; + entries[n++] = ost->n_vars - 1; + entries[n++] = gsl_cdf_chisq_Q (fr->chi_sq, ost->n_vars - 1); + assert (n <= sizeof entries / sizeof *entries); + + for (size_t i = 0; i < n; i++) + pivot_table_put1 (table, i, pivot_value_new_number (entries[i])); + + pivot_table_submit (table); }