#include "math/interaction.h"
#include "math/box-whisker.h"
#include "math/categoricals.h"
+#include "math/chart-geometry.h"
#include "math/histogram.h"
#include "math/moments.h"
#include "math/np.h"
if (examine->histogram)
{
+ /* Sturges' rule: bin width = range / (1 + log2 (es[v].cc)).  Use fabs, not
+    abs: abs takes an int and would truncate the range before dividing. */
+ double bin_width = fabs (es[v].minimum - es[v].maximum)
+ / (1 + log2 (es[v].cc));
+
+ bin_width = chart_rounded_tick (bin_width);
+
es[v].histogram =
- histogram_create (10, es[v].minimum, es[v].maximum);
+ histogram_create (bin_width, es[v].minimum, es[v].maximum);
}
es[v].sorted_reader = casewriter_make_reader (es[v].sorted_writer);
#include "libpspp/str.h"
#include "math/histogram.h"
#include "math/moments.h"
+#include "math/chart-geometry.h"
+
#include "output/chart-item.h"
#include "output/charts/piechart.h"
#include "output/charts/plot-hist.h"
{
double x_min, x_max, valid_freq;
int i;
-
+ double bin_width;
struct histogram *histogram;
double iqr;
- int bins;
/* Find out the extremes of the x value, within the range to be included in
the histogram, and sum the total frequency of those values. */
/* Freedman-Diaconis' choice of bin width. */
iqr = calculate_iqr (frq);
- if (iqr != SYSMIS)
- {
- double bin_width = 2 * iqr / pow (valid_freq, 1.0 / 3.0);
- bins = (x_max - x_min) / bin_width;
- if (bins < 5)
- bins = 5;
- else if (bins > 400)
- bins = 400;
- }
- else
- bins = 5;
+ bin_width = 2 * iqr / pow (valid_freq, 1.0 / 3.0);
+ bin_width = chart_rounded_tick (bin_width);
- histogram = histogram_create (bins, x_min, x_max);
+ histogram = histogram_create (bin_width, x_min, x_max);
for (i = 0; i < ft->n_valid; i++)
{
const struct freq *f = &ft->valid[i];
struct histogram *
-histogram_create (int bins, double min, double max)
+histogram_create (double bin_width, double min, double max)
{
+ int bins;
struct histogram *h = xmalloc (sizeof *h);
struct statistic *stat = &h->parent;
- double upper_limit, lower_limit;
-
- double bin_width = chart_rounded_tick ((max - min) / (double) bins);
- double bin_width_2 = bin_width / 2.0;
+ const short max_sign = max >= 0;
+ const short min_sign = min >= 0;
- int n = ceil (max / (bin_width_2) ) ;
+ double upper_limit, lower_limit;
assert (max >= min);
- if ( ! (n % 2 ) ) n++;
- upper_limit = n * bin_width_2;
+ lower_limit = trunc (2 * abs (min) / bin_width) - 1;
+ lower_limit *= bin_width / 2;
+ lower_limit *= min_sign;
- n = floor (min / (bin_width_2) ) ;
- if ( ! (n % 2 ) ) n--;
- lower_limit = n * bin_width_2;
+ upper_limit = trunc (2 * abs(max) / bin_width) + 1;
+ upper_limit *= bin_width / 2;
+ upper_limit *= max_sign;
+
+ bins = (upper_limit - lower_limit) / bin_width;
h->gsl_hist = gsl_histogram_alloc (bins);
+
gsl_histogram_set_ranges_uniform (h->gsl_hist, lower_limit, upper_limit);
stat->accumulate = acc;
gsl_histogram *gsl_hist;
};
-struct histogram * histogram_create (int bins, double max, double min);
+/* Parameter names match the definition and its callers: BIN_WIDTH, then MIN, then MAX. */
+struct histogram * histogram_create (double bin_width, double min, double max);
void histogram_add (struct histogram *h, double y, double c);