projects
/
pspp
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
Add code to read character encoding to dissect-sysfile.
[pspp]
/
src
/
language
/
stats
/
crosstabs.q
diff --git
a/src/language/stats/crosstabs.q
b/src/language/stats/crosstabs.q
index e57d9343c724ec96b2cb5badf2ec5eaa1fed48c1..68d11e307e0ff41584d1ffae0ef4abd6d8c9ff74 100644
(file)
--- a/
src/language/stats/crosstabs.q
+++ b/
src/language/stats/crosstabs.q
@@
-1,5
+1,5
@@
/* PSPP - a program for statistical analysis.
/* PSPP - a program for statistical analysis.
- Copyright (C) 1997-9, 2000, 2006 Free Software Foundation, Inc.
+ Copyright (C) 1997-9, 2000, 2006
, 2009
Free Software Foundation, Inc.
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
@@
-46,13
+46,10
@@
#include <language/dictionary/split-file.h>
#include <language/lexer/lexer.h>
#include <language/lexer/variable-parser.h>
#include <language/dictionary/split-file.h>
#include <language/lexer/lexer.h>
#include <language/lexer/variable-parser.h>
-#include <libpspp/alloc.h>
#include <libpspp/array.h>
#include <libpspp/assertion.h>
#include <libpspp/compiler.h>
#include <libpspp/hash.h>
#include <libpspp/array.h>
#include <libpspp/assertion.h>
#include <libpspp/compiler.h>
#include <libpspp/hash.h>
-#include <libpspp/magic.h>
-#include <libpspp/message.h>
#include <libpspp/message.h>
#include <libpspp/misc.h>
#include <libpspp/pool.h>
#include <libpspp/message.h>
#include <libpspp/misc.h>
#include <libpspp/pool.h>
@@
-61,6
+58,8
@@
#include <output/table.h>
#include "minmax.h"
#include <output/table.h>
#include "minmax.h"
+#include "xalloc.h"
+#include "xmalloca.h"
#include "gettext.h"
#define _(msgid) gettext (msgid)
#include "gettext.h"
#define _(msgid) gettext (msgid)
@@
-178,8
+177,8
@@
static struct pool *pl_col; /* For column data. */
static int internal_cmd_crosstabs (struct lexer *lexer, struct dataset *ds);
static void precalc (struct casereader *, const struct dataset *);
static int internal_cmd_crosstabs (struct lexer *lexer, struct dataset *ds);
static void precalc (struct casereader *, const struct dataset *);
-static void calc_general (struct ccase *, const struct dataset *);
-static void calc_integer (struct ccase *, const struct dataset *);
+static void calc_general (
const
struct ccase *, const struct dataset *);
+static void calc_integer (
const
struct ccase *, const struct dataset *);
static void postcalc (void);
static void submit (struct tab_table *);
static void postcalc (void);
static void submit (struct tab_table *);
@@
-191,11
+190,16
@@
int
cmd_crosstabs (struct lexer *lexer, struct dataset *ds)
{
int result = internal_cmd_crosstabs (lexer, ds);
cmd_crosstabs (struct lexer *lexer, struct dataset *ds)
{
int result = internal_cmd_crosstabs (lexer, ds);
+ int i;
free (variables);
pool_destroy (pl_tc);
pool_destroy (pl_col);
free (variables);
pool_destroy (pl_tc);
pool_destroy (pl_col);
+ for (i = 0; i < nxtab; i++)
+ free (xtab[i]);
+ free (xtab);
+
return result;
}
return result;
}
@@
-301,16
+305,16
@@
internal_cmd_crosstabs (struct lexer *lexer, struct dataset *ds)
grouper = casegrouper_create_splits (input, dataset_dict (ds));
while (casegrouper_get_next_group (grouper, &group))
{
grouper = casegrouper_create_splits (input, dataset_dict (ds));
while (casegrouper_get_next_group (grouper, &group))
{
- struct ccase c;
+ struct ccase
*
c;
precalc (group, ds);
precalc (group, ds);
- for (;
casereader_read (group, &c); case_destroy (&
c))
+ for (;
(c = casereader_read (group)) != NULL; case_unref (
c))
{
if (mode == GENERAL)
{
if (mode == GENERAL)
- calc_general (
&
c, ds);
+ calc_general (c, ds);
else
else
- calc_integer (
&
c, ds);
+ calc_integer (c, ds);
}
casereader_destroy (group);
}
casereader_destroy (group);
@@
-356,7
+360,7
@@
crs_custom_tables (struct lexer *lexer, struct dataset *ds, struct cmd_crosstabs
goto done;
if (xalloc_oversized (nx, by_nvar[n_by]))
{
goto done;
if (xalloc_oversized (nx, by_nvar[n_by]))
{
- msg (SE, _("Too many crosstabulation variables or dimensions."));
+ msg (SE, _("Too many cross
-
tabulation variables or dimensions."));
goto done;
}
nx *= by_nvar[n_by];
goto done;
}
nx *= by_nvar[n_by];
@@
-514,12
+518,14
@@
static unsigned hash_table_entry (const void *, const void *);
static void
precalc (struct casereader *input, const struct dataset *ds)
{
static void
precalc (struct casereader *input, const struct dataset *ds)
{
- struct ccase c;
+ struct ccase
*
c;
- if (!casereader_peek (input, 0, &c))
- return;
- output_split_file_values (ds, &c);
- case_destroy (&c);
+ c = casereader_peek (input, 0);
+ if (c != NULL)
+ {
+ output_split_file_values (ds, c);
+ case_unref (c);
+ }
if (mode == GENERAL)
{
if (mode == GENERAL)
{
@@
-547,7
+553,7
@@
precalc (struct casereader *input, const struct dataset *ds)
sorted_tab = xnrealloc (sorted_tab,
n_sorted_tab + count, sizeof *sorted_tab);
sorted_tab = xnrealloc (sorted_tab,
n_sorted_tab + count, sizeof *sorted_tab);
- v =
local_alloc
(sizeof *v * x->nvar);
+ v =
xmalloca
(sizeof *v * x->nvar);
for (j = 2; j < x->nvar; j++)
v[j] = get_var_range (x->vars[j])->min;
for (j = 0; j < count; j++)
for (j = 2; j < x->nvar; j++)
v[j] = get_var_range (x->vars[j])->min;
for (j = 0; j < count; j++)
@@
-581,7
+587,7
@@
precalc (struct casereader *input, const struct dataset *ds)
break;
}
}
break;
}
}
-
local_free
(v);
+
freea
(v);
}
sorted_tab = xnrealloc (sorted_tab,
}
sorted_tab = xnrealloc (sorted_tab,
@@
-593,7
+599,7
@@
precalc (struct casereader *input, const struct dataset *ds)
/* Form crosstabulations for general mode. */
static void
/* Form crosstabulations for general mode. */
static void
-calc_general (struct ccase *c, const struct dataset *ds)
+calc_general (
const
struct ccase *c, const struct dataset *ds)
{
/* Missing values to exclude. */
enum mv_class exclude = (cmd.miss == CRS_TABLE ? MV_ANY
{
/* Missing values to exclude. */
enum mv_class exclude = (cmd.miss == CRS_TABLE ? MV_ANY
@@
-611,7
+617,7
@@
calc_general (struct ccase *c, const struct dataset *ds)
struct crosstab *x = xtab[t];
const size_t entry_size = (sizeof (struct table_entry)
+ sizeof (union value) * (x->nvar - 1));
struct crosstab *x = xtab[t];
const size_t entry_size = (sizeof (struct table_entry)
+ sizeof (union value) * (x->nvar - 1));
- struct table_entry *te =
local_alloc
(entry_size);
+ struct table_entry *te =
xmalloca
(entry_size);
/* Construct table entry for the current record and table. */
te->table = t;
/* Construct table entry for the current record and table. */
te->table = t;
@@
-632,12
+638,14
@@
calc_general (struct ccase *c, const struct dataset *ds)
te->values[j].f = case_num (c, x->vars[j]);
else
{
te->values[j].f = case_num (c, x->vars[j]);
else
{
- memcpy (te->values[j].s, case_str (c, x->vars[j]),
- var_get_width (x->vars[j]));
+ size_t n = var_get_width (x->vars[j]);
+ if (n > MAX_SHORT_STRING)
+ n = MAX_SHORT_STRING;
+ memcpy (te->values[j].s, case_str (c, x->vars[j]), n);
/* Necessary in order to simplify comparisons. */
memset (&te->values[j].s[var_get_width (x->vars[j])], 0,
/* Necessary in order to simplify comparisons. */
memset (&te->values[j].s[var_get_width (x->vars[j])], 0,
- sizeof (union value) -
var_get_width (x->vars[j])
);
+ sizeof (union value) -
n
);
}
}
}
}
}
}
@@
-660,12
+668,12
@@
calc_general (struct ccase *c, const struct dataset *ds)
}
next_crosstab:
}
next_crosstab:
-
local_free
(te);
+
freea
(te);
}
}
static void
}
}
static void
-calc_integer (struct ccase *c, const struct dataset *ds)
+calc_integer (
const
struct ccase *c, const struct dataset *ds)
{
bool bad_warn = true;
{
bool bad_warn = true;
@@
-822,6
+830,16
@@
postcalc (void)
}
hsh_destroy (gen_tab);
}
hsh_destroy (gen_tab);
+ if (mode == INTEGER)
+ {
+ int i;
+ for (i = 0; i < n_sorted_tab; i++)
+ {
+ free (sorted_tab[i]->u.data);
+ free (sorted_tab[i]);
+ }
+ free (sorted_tab);
+ }
}
static void insert_summary (struct tab_table *, int tab_index, double valid);
}
static void insert_summary (struct tab_table *, int tab_index, double valid);
@@
-910,7
+928,7
@@
insert_summary (struct tab_table *t, int tab_index, double valid)
/* Crosstabulation name. */
{
/* Crosstabulation name. */
{
- char *buf =
local_alloc
(128 * x->nvar);
+ char *buf =
xmalloca
(128 * x->nvar);
char *cp = buf;
int i;
char *cp = buf;
int i;
@@
-923,7
+941,7
@@
insert_summary (struct tab_table *t, int tab_index, double valid)
}
tab_text (t, 0, 0, TAB_LEFT, buf);
}
tab_text (t, 0, 0, TAB_LEFT, buf);
-
local_free
(buf);
+
freea
(buf);
}
/* Counts and percentages. */
}
/* Counts and percentages. */
@@
-1050,7
+1068,7
@@
output_pivot_table (struct table_entry **pb, struct table_entry **pe,
/* Title. */
{
/* Title. */
{
- char *title =
local_alloc
(x->nvar * 64 + 128);
+ char *title =
xmalloca
(x->nvar * 64 + 128);
char *cp = title;
int i;
char *cp = title;
int i;
@@
-1116,7
+1134,7
@@
output_pivot_table (struct table_entry **pb, struct table_entry **pe,
strcpy (cp, "].");
tab_title (table, "%s", title);
strcpy (cp, "].");
tab_title (table, "%s", title);
-
local_free
(title);
+
freea
(title);
}
tab_offset (table, 0, 2);
}
tab_offset (table, 0, 2);
@@
-1657,7
+1675,7
@@
enum_var_values (struct table_entry **entries, int entry_cnt, int var_idx,
if (mode == GENERAL)
{
if (mode == GENERAL)
{
- int width =
var_get_width (v
);
+ int width =
MIN (var_get_width (v), MAX_SHORT_STRING
);
int i;
*values = xnmalloc (entry_cnt, sizeof **values);
int i;
*values = xnmalloc (entry_cnt, sizeof **values);
@@
-1844,7
+1862,6
@@
display_crosstabulation (void)
tab_offset (table, -1, tab_row (table) - num_cells * n_rows);
for (r = 0; r < n_rows; r++)
{
tab_offset (table, -1, tab_row (table) - num_cells * n_rows);
for (r = 0; r < n_rows; r++)
{
- char suffix = 0;
bool mark_missing = false;
if (cmd.miss == CRS_REPORT
bool mark_missing = false;
if (cmd.miss == CRS_REPORT
@@
-1853,6
+1870,7
@@
display_crosstabulation (void)
for (i = 0; i < num_cells; i++)
{
for (i = 0; i < num_cells; i++)
{
+ char suffix = 0;
double v;
switch (cells[i])
double v;
switch (cells[i])
@@
-1861,7
+1879,7
@@
display_crosstabulation (void)
v = row_tot[r];
break;
case CRS_CL_ROW:
v = row_tot[r];
break;
case CRS_CL_ROW:
- v = 100.;
+ v = 100.
0
;
suffix = '%';
break;
case CRS_CL_COLUMN:
suffix = '%';
break;
case CRS_CL_COLUMN:
@@
-1899,7
+1917,6
@@
display_crosstabulation (void)
{
double ct = c < n_cols ? col_tot[c] : W;
bool mark_missing = false;
{
double ct = c < n_cols ? col_tot[c] : W;
bool mark_missing = false;
- char suffix = 0;
int i;
if (cmd.miss == CRS_REPORT && c < n_cols
int i;
if (cmd.miss == CRS_REPORT && c < n_cols
@@
-1908,13
+1925,13
@@
display_crosstabulation (void)
for (i = 0; i < num_cells; i++)
{
for (i = 0; i < num_cells; i++)
{
+ char suffix = 0;
double v;
switch (cells[i])
{
case CRS_CL_COUNT:
v = ct;
double v;
switch (cells[i])
{
case CRS_CL_COUNT:
v = ct;
- suffix = '%';
break;
case CRS_CL_ROW:
v = ct / W * 100.;
break;
case CRS_CL_ROW:
v = ct / W * 100.;
@@
-1937,7
+1954,7
@@
display_crosstabulation (void)
NOT_REACHED ();
}
NOT_REACHED ();
}
-
format_cell_entry (table, c, i, v, suffix, mark_missing);
+ format_cell_entry (table, c, i, v, suffix, mark_missing);
}
last_row = i;
}
}
last_row = i;
}
@@
-2439,7
+2456,7
@@
calc_r (double *X, double *Y, double *r, double *ase_0, double *ase_1)
for (sum_Xr = sum_X2r = 0., i = 0; i < n_rows; i++)
{
sum_Xr += X[i] * row_tot[i];
for (sum_Xr = sum_X2r = 0., i = 0; i < n_rows; i++)
{
sum_Xr += X[i] * row_tot[i];
- sum_X2r +=
X[i] * X[i]
* row_tot[i];
+ sum_X2r +=
pow2 (X[i])
* row_tot[i];
}
Xbar = sum_Xr / W;
}
Xbar = sum_Xr / W;
@@
-2451,11
+2468,11
@@
calc_r (double *X, double *Y, double *r, double *ase_0, double *ase_1)
Ybar = sum_Yc / W;
S = sum_XYf - sum_Xr * sum_Yc / W;
Ybar = sum_Yc / W;
S = sum_XYf - sum_Xr * sum_Yc / W;
- SX = sum_X2r -
sum_Xr * sum_Xr
/ W;
- SY = sum_Y2c -
sum_Yc * sum_Yc
/ W;
+ SX = sum_X2r -
pow2 (sum_Xr)
/ W;
+ SY = sum_Y2c -
pow2 (sum_Yc)
/ W;
T = sqrt (SX * SY);
*r = S / T;
T = sqrt (SX * SY);
*r = S / T;
- *ase_0 = sqrt ((sum_X2Y2f -
(sum_XYf *
sum_XYf) / W) / (sum_X2r * sum_Y2c));
+ *ase_0 = sqrt ((sum_X2Y2f -
pow2 (
sum_XYf) / W) / (sum_X2r * sum_Y2c));
{
double s, c, y, t;
{
double s, c, y, t;
@@
-2545,9
+2562,9
@@
calc_symmetric (double v[N_SYMMETRIC], double ase[N_SYMMETRIC],
Dr = Dc = W * W;
for (r = 0; r < n_rows; r++)
Dr = Dc = W * W;
for (r = 0; r < n_rows; r++)
- Dr -=
row_tot[r] * row_tot[r]
;
+ Dr -=
pow2 (row_tot[r])
;
for (c = 0; c < n_cols; c++)
for (c = 0; c < n_cols; c++)
- Dc -=
col_tot[c] * col_tot[c]
;
+ Dc -=
pow2 (col_tot[c])
;
}
{
}
{
@@
-2720,8
+2737,8
@@
calc_symmetric (double v[N_SYMMETRIC], double ase[N_SYMMETRIC],
/* Spearman correlation, Pearson's r. */
if (cmd.a_statistics[CRS_ST_CORR])
{
/* Spearman correlation, Pearson's r. */
if (cmd.a_statistics[CRS_ST_CORR])
{
- double *R =
local_alloc
(sizeof *R * n_rows);
- double *C =
local_alloc
(sizeof *C * n_cols);
+ double *R =
xmalloca
(sizeof *R * n_rows);
+ double *C =
xmalloca
(sizeof *C * n_cols);
{
double y, t, c = 0., s = 0.;
{
double y, t, c = 0., s = 0.;
@@
-2760,8
+2777,8
@@
calc_symmetric (double v[N_SYMMETRIC], double ase[N_SYMMETRIC],
calc_r (R, C, &v[6], &t[6], &ase[6]);
t[6] = v[6] / t[6];
calc_r (R, C, &v[6], &t[6], &ase[6]);
t[6] = v[6] / t[6];
-
local_free
(R);
-
local_free
(C);
+
freea
(R);
+
freea
(C);
calc_r ((double *) rows, (double *) cols, &v[7], &t[7], &ase[7]);
t[7] = v[7] / t[7];
calc_r ((double *) rows, (double *) cols, &v[7], &t[7], &ase[7]);
t[7] = v[7] / t[7];
@@
-3056,10
+3073,10
@@
calc_directional (double v[N_DIRECTIONAL], double ase[N_DIRECTIONAL],
}
for (sum_ri2 = 0., i = 0; i < n_rows; i++)
}
for (sum_ri2 = 0., i = 0; i < n_rows; i++)
- sum_ri2 +=
row_tot[i] * row_tot[i]
;
+ sum_ri2 +=
pow2 (row_tot[i])
;
for (sum_cj2 = 0., j = 0; j < n_cols; j++)
for (sum_cj2 = 0., j = 0; j < n_cols; j++)
- sum_cj2 +=
col_tot[j] * col_tot[j]
;
+ sum_cj2 +=
pow2 (col_tot[j])
;
v[3] = (W * sum_fij2_ci - sum_ri2) / (W * W - sum_ri2);
v[4] = (W * sum_fij2_ri - sum_cj2) / (W * W - sum_cj2);
v[3] = (W * sum_fij2_ci - sum_ri2) / (W * W - sum_ri2);
v[4] = (W * sum_fij2_ri - sum_cj2) / (W * W - sum_cj2);
@@
-3149,9
+3166,9
@@
calc_directional (double v[N_DIRECTIONAL], double ase[N_DIRECTIONAL],
for (sum_Xr = sum_X2r = 0., i = 0; i < n_rows; i++)
{
sum_Xr += rows[i].f * row_tot[i];
for (sum_Xr = sum_X2r = 0., i = 0; i < n_rows; i++)
{
sum_Xr += rows[i].f * row_tot[i];
- sum_X2r +=
rows[i].f * rows[i].f
* row_tot[i];
+ sum_X2r +=
pow2 (rows[i].f)
* row_tot[i];
}
}
- SX = sum_X2r -
sum_Xr * sum_Xr
/ W;
+ SX = sum_X2r -
pow2 (sum_Xr)
/ W;
for (SXW = 0., j = 0; j < n_cols; j++)
{
for (SXW = 0., j = 0; j < n_cols; j++)
{
@@
-3159,7
+3176,7
@@
calc_directional (double v[N_DIRECTIONAL], double ase[N_DIRECTIONAL],
for (cum = 0., i = 0; i < n_rows; i++)
{
for (cum = 0., i = 0; i < n_rows; i++)
{
- SXW +=
rows[i].f * rows[i].f
* mat[j + i * n_cols];
+ SXW +=
pow2 (rows[i].f)
* mat[j + i * n_cols];
cum += rows[i].f * mat[j + i * n_cols];
}
cum += rows[i].f * mat[j + i * n_cols];
}
@@
-3176,7
+3193,7
@@
calc_directional (double v[N_DIRECTIONAL], double ase[N_DIRECTIONAL],
for (sum_Yc = sum_Y2c = 0., i = 0; i < n_cols; i++)
{
sum_Yc += cols[i].f * col_tot[i];
for (sum_Yc = sum_Y2c = 0., i = 0; i < n_cols; i++)
{
sum_Yc += cols[i].f * col_tot[i];
- sum_Y2c +=
cols[i].f * cols[i].f
* col_tot[i];
+ sum_Y2c +=
pow2 (cols[i].f)
* col_tot[i];
}
SY = sum_Y2c - sum_Yc * sum_Yc / W;
}
SY = sum_Y2c - sum_Yc * sum_Yc / W;
@@
-3186,7
+3203,7
@@
calc_directional (double v[N_DIRECTIONAL], double ase[N_DIRECTIONAL],
for (cum = 0., j = 0; j < n_cols; j++)
{
for (cum = 0., j = 0; j < n_cols; j++)
{
- SYW +=
cols[j].f * cols[j].f
* mat[j + i * n_cols];
+ SYW +=
pow2 (cols[j].f)
* mat[j + i * n_cols];
cum += cols[j].f * mat[j + i * n_cols];
}
cum += cols[j].f * mat[j + i * n_cols];
}