1 /* PSPP - a program for statistical analysis.
2 Copyright (C) 2021 Free Software Foundation, Inc.
4 This program is free software: you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation, either version 3 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program. If not, see <http://www.gnu.org/licenses/>. */
21 #include "data/any-reader.h"
22 #include "data/any-writer.h"
23 #include "data/casereader.h"
24 #include "data/casewriter.h"
25 #include "data/dataset.h"
26 #include "data/dictionary.h"
27 #include "language/data-io/file-handle.h"
28 #include "language/data-io/matrix-reader.h"
29 #include "language/lexer/lexer.h"
30 #include "language/command.h"
33 #define _(msgid) gettext (msgid)
36 cmd_mconvert (struct lexer *lexer, struct dataset *ds)
39 struct file_handle *in = NULL;
40 struct file_handle *out = NULL;
41 while (lex_token (lexer) != T_ENDCMD)
43 if (lex_match_id (lexer, "APPEND"))
45 else if (lex_match_id (lexer, "REPLACE"))
49 if (lex_match_id (lexer, "MATRIX"))
50 lex_match (lexer, T_EQUALS);
52 struct file_handle **fhp = (lex_match_id (lexer, "IN") ? &in
53 : lex_match_id (lexer, "OUT") ? &out
57 lex_error_expecting (lexer, "IN", "OUT", "APPEND", "REPLACE");
60 if (!lex_force_match (lexer, T_LPAREN))
64 if (lex_match (lexer, T_ASTERISK))
68 *fhp = fh_parse (lexer, FH_REF_FILE, dataset_session (ds));
73 if (!lex_force_match (lexer, T_RPAREN))
77 lex_match (lexer, T_SLASH);
80 if (!in && !dataset_has_source (ds))
82 msg (SE, _("No active file is defined and no external file is "
83 "specified on MATRIX=IN."));
91 struct casereader *cr = any_reader_open_and_decode (in, NULL, &d, NULL);
95 struct matrix_reader *mr = matrix_reader_create (d, cr);
98 casereader_destroy (cr);
103 struct casewriter *cw = any_writer_open (out, d);
106 matrix_reader_destroy (mr);
107 casereader_destroy (cr);
114 struct matrix_material mm;
115 struct casereader *group;
116 if (!matrix_reader_next (&mm, mr, &group))
119 bool add_corr = mm.cov && !mm.corr;
120 bool add_cov = mm.corr && !mm.cov;
121 bool remove_corr = add_cov && !append;
122 bool remove_cov = add_corr && !append;
124 struct ccase *model = casereader_peek (group, 0);
125 for (size_t i = 0; i < mr->n_fvars; i++)
126 *case_num_rw (model, mr->fvars[i]) = SYSMIS;
130 struct ccase *c = casereader_read (group);
134 struct substring rowtype = matrix_reader_get_string (c, mr->rowtype);
135 if ((remove_cov && ss_equals_case (rowtype, ss_cstr ("COV")))
136 || (remove_corr && ss_equals_case (rowtype, ss_cstr ("CORR"))))
139 casewriter_write (cw, c);
141 casereader_destroy (group);
145 assert (mm.cov->size1 == mr->n_cvars);
146 assert (mm.cov->size2 == mr->n_cvars);
148 for (size_t y = 0; y < mr->n_cvars; y++)
150 struct ccase *c = case_clone (model);
151 for (size_t x = 0; x < mr->n_cvars; x++)
153 double d1 = gsl_matrix_get (mm.cov, x, x);
154 double d2 = gsl_matrix_get (mm.cov, y, y);
155 double cov = gsl_matrix_get (mm.cov, y, x);
156 *case_num_rw (c, mr->cvars[x]) = cov / sqrt (d1 * d2);
158 matrix_reader_set_string (c, mr->rowtype, ss_cstr ("CORR"));
159 matrix_reader_set_string (c, mr->varname,
160 ss_cstr (var_get_name (mr->cvars[y])));
161 casewriter_write (cw, c);
164 struct ccase *c = case_clone (model);
165 for (size_t x = 0; x < mr->n_cvars; x++)
167 double variance = gsl_matrix_get (mm.cov, x, x);
168 *case_num_rw (c, mr->cvars[x]) = sqrt (variance);
170 matrix_reader_set_string (c, mr->rowtype, ss_cstr ("STDDEV"));
171 matrix_reader_set_string (c, mr->varname, ss_empty ());
172 casewriter_write (cw, c);
177 assert (mm.corr->size1 == mr->n_cvars);
178 assert (mm.corr->size2 == mr->n_cvars);
180 for (size_t y = 0; y < mr->n_cvars; y++)
182 struct ccase *c = case_clone (model);
183 for (size_t x = 0; x < mr->n_cvars; x++)
185 double d1 = gsl_matrix_get (mm.var_matrix, x, x);
186 double d2 = gsl_matrix_get (mm.var_matrix, y, y);
187 double corr = gsl_matrix_get (mm.corr, y, x);
188 *case_num_rw (c, mr->cvars[x]) = corr * sqrt (d1 * d2);
190 matrix_reader_set_string (c, mr->rowtype, ss_cstr ("COV"));
191 matrix_reader_set_string (c, mr->varname,
192 ss_cstr (var_get_name (mr->cvars[y])));
193 casewriter_write (cw, c);
200 matrix_reader_destroy (mr);
201 casewriter_destroy (cw);