X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=src%2Ffactor_stats.c;h=79c9b80ca8b2a4c2e9c46b5016377f348805f95c;hb=e582516e80e5a04f10a651515a35b616911cf4d6;hp=2ba785a7d8e8c7044b2f42fa3ff2c94f96124d02;hpb=379aeac5640a20a122990640fdd33bdfa592a3c1;p=pspp-builds.git diff --git a/src/factor_stats.c b/src/factor_stats.c index 2ba785a7..79c9b80c 100644 --- a/src/factor_stats.c +++ b/src/factor_stats.c @@ -25,6 +25,7 @@ Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA #include "algorithm.h" #include "alloc.h" #include "moments.h" +#include "percentiles.h" #include #include @@ -43,6 +44,7 @@ metrics_precalc(struct metrics *m) m->min = DBL_MAX; m->max = -DBL_MAX; + m->histogram = 0; m->moments = moments1_create(MOMENT_KURTOSIS); @@ -51,9 +53,6 @@ metrics_precalc(struct metrics *m) (hsh_hash_func *) hash_value, (hsh_free_func *) weighted_value_free, (void *) 0); - - - } @@ -126,7 +125,6 @@ metrics_postcalc(struct metrics *m) int i; int j = 1; - moments1_calculate (m->moments, &m->n, &m->mean, &m->var, &m->skewness, &m->kurtosis); @@ -144,20 +142,25 @@ metrics_postcalc(struct metrics *m) m->wvp = (struct weighted_value **) hsh_sort(m->ordered_data); m->n_data = hsh_count(m->ordered_data); - if ( m->n_data == 0 ) + /* Trimmed mean calculation */ + if ( m->n_data <= 1 ) { m->trimmed_mean = m->mean; return; } + m->histogram = histogram_create(10, m->min, m->max); - /* Trimmed mean calculation */ + for ( i = 0 ; i < m->n_data ; ++i ) + { + struct weighted_value **wv = (m->wvp) ; + gsl_histogram_accumulate(m->histogram, wv[i]->v.f, wv[i]->w); + } tc = m->n * 0.05 ; k1 = -1; k2 = -1; - for ( i = 0 ; i < m->n_data ; ++i ) { cc += m->wvp[i]->w; @@ -169,9 +172,10 @@ metrics_postcalc(struct metrics *m) if ( cc < tc ) k1 = i; - } + + k2 = m->n_data; for ( i = m->n_data -1 ; i >= 0; --i ) { @@ -180,6 +184,18 @@ metrics_postcalc(struct metrics *m) } + /* Calculate the percentiles */ + ptiles(m->ptile_hash, m->wvp, m->n_data, m->n, m->ptile_alg); + + tukey_hinges(m->wvp, m->n_data, m->n, m->hinge); + + /* Special case here */ + if ( k1 + 1 == k2 ) + { + m->trimmed_mean = m->wvp[k2]->v.f; + return; + } + m->trimmed_mean = 0; for ( i = k1 + 2 ; i <= k2 - 1 ; ++i ) { @@ -191,13 +207,6 @@ metrics_postcalc(struct metrics *m) m->trimmed_mean += (m->wvp[k1 + 1]->cc - tc) * m->wvp[k1 + 1]->v.f ; m->trimmed_mean /= 0.9 * m->n ; - m->histogram = histogram_create(10, m->min, m->max); - - for ( i = 0 ; i < m->n_data ; ++i ) - { - struct weighted_value **wv = (m->wvp) ; - gsl_histogram_accumulate(m->histogram, wv[i]->v.f, wv[i]->w); - } } @@ -217,7 +226,12 @@ weighted_value_create(void) void weighted_value_free(struct weighted_value *wv) { - struct case_node *cn = wv->case_nos; + struct case_node *cn ; + + if ( !wv ) + return ; + + cn = wv->case_nos; while(cn) { @@ -247,16 +261,29 @@ create_factor_statistics (int n, union value *id0, union value *id1) f->id[0] = *id0; f->id[1] = *id1; f->m = xmalloc( sizeof ( struct metrics ) * n ) ; + memset (f->m, 0, sizeof(struct metrics) * n); + f->n_var = n; return f; } +void +metrics_destroy(struct metrics *m) +{ + hsh_destroy(m->ordered_data); + hsh_destroy(m->ptile_hash); + if ( m-> histogram ) + gsl_histogram_free(m->histogram); +} + void factor_statistics_free(struct factor_statistics *f) { - hsh_destroy(f->m->ordered_data); - gsl_histogram_free(f->m->histogram); + + int i; + for ( i = 0 ; i < f->n_var; ++i ) + metrics_destroy(&f->m[i]); free(f->m) ; free(f); }