1 /* PSPP - computes sample statistics.
2 Copyright (C) 1997-9, 2000, 2006 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or
5 modify it under the terms of the GNU General Public License as
6 published by the Free Software Foundation; either version 2 of the
7 License, or (at your option) any later version.
9 This program is distributed in the hope that it will be useful, but
10 WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software
16 Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
21 #include "sys-file-writer.h"
22 #include "sys-file-private.h"
32 #include <libpspp/alloc.h>
33 #include <libpspp/hash.h>
34 #include <libpspp/magic.h>
35 #include <libpspp/message.h>
36 #include <libpspp/misc.h>
37 #include <libpspp/str.h>
38 #include <libpspp/version.h>
40 #include <data/case.h>
41 #include <data/casewriter-provider.h>
42 #include <data/casewriter.h>
43 #include <data/dictionary.h>
44 #include <data/file-handle-def.h>
45 #include <data/format.h>
46 #include <data/missing-values.h>
47 #include <data/settings.h>
48 #include <data/value-labels.h>
49 #include <data/variable.h>
54 #define _(msgid) gettext (msgid)
56 /* Find 64-bit floating-point type. */
/* flt64 names whichever basic floating-point type is 8 bytes wide,
   and FLT64_MAX is the <float.h> maximum of that same type.  The
   build stops with #error when no candidate matches. */
59 #define FLT64_MAX FLT_MAX
60 #elif SIZEOF_DOUBLE == 8
62 #define FLT64_MAX DBL_MAX
63 #elif SIZEOF_LONG_DOUBLE == 8
64 #define flt64 long double
65 #define FLT64_MAX LDBL_MAX
67 #error Which one of your basic types is 64-bit floating point?
70 /* Figure out SYSMIS value for flt64. */
/* second_lowest_flt64 is the value write_variable() stores in place
   of LOWEST in a missing-value range; it is only available here when
   double is the 8-byte type. */
71 #include <libpspp/magic.h>
72 #if SIZEOF_DOUBLE == 8
73 #define second_lowest_flt64 second_lowest_value
75 #error Must define second_lowest_flt64 for your architecture.
78 /* Record Type 1: General Information.

   write_header() fills in one of these and writes it to the file
   with a single buf_write() call, so the structure is packed and the
   number at the start of each field comment is the field's byte
   offset in hexadecimal.  close_writer() seeks to the offset of
   case_cnt to store the final case count. */
81 char rec_type[4] ; /* 00: Record-type code, "$FL2". */
82 char prod_name[60] ; /* 04: Product identification. */
83 int32_t layout_code ; /* 40: 2. */
84 int32_t nominal_case_size ; /* 44: Number of `value's per case.
85 Note: some systems set this to -1 */
86 int32_t compress ; /* 48: 1=compressed, 0=not compressed. */
87 int32_t weight_idx ; /* 4c: 1-based index of weighting var, or 0. */
88 int32_t case_cnt ; /* 50: Number of cases, -1 if unknown. */
89 flt64 bias ; /* 54: Compression bias (100.0). */
90 char creation_date[9] ; /* 5c: `dd mmm yy' creation date of file. */
91 char creation_time[8] ; /* 65: `hh:mm:ss' 24-hour creation time. */
92 char file_label[64] ; /* 6d: File label. */
93 char padding[3] ; /* ad: Ignored padding. */
94 } ATTRIBUTE((packed)) ;
96 /* Record Type 2: Variable.

   This is only the fixed-size leading part of the record.
   write_variable() writes it first and then appends the variable
   label and the missing values when the variable has them.  The same
   structure, with most fields zeroed, is reused for the extra
   records that follow a string wider than one flt64. */
97 struct sysfile_variable
99 int32_t rec_type ; /* 2. */
100 int32_t type ; /* 0=numeric, 1-255=string width,
101 -1=continued string. */
102 int32_t has_var_label ; /* 1=has a variable label, 0=doesn't. */
103 int32_t n_missing_values ; /* Missing value code of -3,-2,0,1,2, or 3. */
104 int32_t print ; /* Print format. */
105 int32_t write ; /* Write format. */
106 char name[SHORT_NAME_LEN] ; /* Variable name. */
107 /* The rest of the structure varies. */
108 } ATTRIBUTE((packed)) ;
110 /* Compression bias used by PSPP. Whole-number values between (1 -
111 COMPRESSION_BIAS) and (251 - COMPRESSION_BIAS) inclusive can be compressed into a single instruction byte. */
113 #define COMPRESSION_BIAS 100
115 /* System file writer.

   sfm_open_writer() creates one of these and passes it to
   casewriter_create() as the writer's private data; close_writer()
   flushes it and closes the file. */
118 struct file_handle *fh; /* File handle. */
119 FILE *file; /* File stream. */
121 int needs_translation; /* 0=use fast path, 1=translation needed. */
122 int compress; /* 1=compressed, 0=not compressed. */
123 int case_cnt; /* Number of cases written so far. */
124 size_t flt64_cnt; /* Number of flt64 elements in case. */
125 bool has_vls; /* Does the dict have very long strings? */
127 /* Compression buffering. */
/* sfm_open_writer() allocates BUF with room for 128 elements.  One
   element at a time is set aside to hold instruction bytes; X and Y
   delimit the bytes of that element which are still unused. */
128 flt64 *buf; /* Buffered data. */
129 flt64 *end; /* Buffer end. */
130 flt64 *ptr; /* Current location in buffer. */
131 unsigned char *x; /* Location in current instruction octet. */
132 unsigned char *y; /* End of instruction octet. */
135 struct sfm_var *vars; /* Variables. */
136 size_t var_cnt; /* Number of variables. */
137 size_t var_cnt_vls; /* Number of variables including
138 very long string components. */
141 /* A variable in a system file.

   sfm_open_writer() fills in one of these per dictionary variable,
   and the case-writing code works from this array rather than from
   the dictionary. */
144 int width; /* 0=numeric, otherwise string width. */
145 int fv; /* Index into case. */
146 size_t flt64_cnt; /* Number of flt64 elements. */
/* Forward declarations for the casewriter class and the helper
   functions defined further down in this file. */
149 static struct casewriter_class sys_file_casewriter_class;
151 static char *append_string_max (char *, const char *, const char *);
152 static void write_header (struct sfm_writer *, const struct dictionary *);
153 static void buf_write (struct sfm_writer *, const void *, size_t);
154 static void write_variable (struct sfm_writer *, const struct variable *);
155 static void write_value_labels (struct sfm_writer *,
156 struct variable *, int idx);
157 static void write_rec_7_34 (struct sfm_writer *);
159 static void write_longvar_table (struct sfm_writer *w,
160 const struct dictionary *dict);
162 static void write_vls_length_table (struct sfm_writer *w,
163 const struct dictionary *dict);
166 static void write_variable_display_parameters (struct sfm_writer *w,
167 const struct dictionary *dict);
169 static void write_documents (struct sfm_writer *, const struct dictionary *);
/* NOTE(review): unlike the helpers above, these two are declared
   without `static'; confirm whether they are meant to be visible
   outside this file. */
171 bool write_error (const struct sfm_writer *);
172 bool close_writer (struct sfm_writer *);
/* Returns the number of flt64 elements that V contributes to each
   case in the file: the byte count that sfm_width_to_bytes() reports
   for V's width, divided by MAX_SHORT_STRING. */
175 var_flt64_cnt (const struct variable *v)
/* The division below only yields an element count if one short
   string is exactly as large as one flt64. */
177 assert(sizeof(flt64) == MAX_SHORT_STRING);
178 return sfm_width_to_bytes(var_get_width (v)) / MAX_SHORT_STRING ;
/* Returns the element count of V computed from its width alone: 1
   for a numeric variable, otherwise the width divided by
   sizeof (flt64), rounded up.  Unlike var_flt64_cnt(), it does not go
   through sfm_width_to_bytes(). */
182 var_flt64_cnt_nom (const struct variable *v)
184 return (var_is_numeric (v)
185 ? 1 : DIV_RND_UP (var_get_width (v), sizeof (flt64)));
189 /* Returns default options for writing a system file.

   By default the file is created writable and compression follows
   get_scompression ().  NOTE(review): only these two members are set
   in the lines visible here; confirm that the remaining members
   (sfm_open_writer() also reads `version') are initialized too. */
190 struct sfm_write_options
191 sfm_writer_default_options (void)
193 struct sfm_write_options opts;
194 opts.create_writeable = true;
195 opts.compress = get_scompression ();
201 /* Returns a short variable name to be used for continuation number
202 IDX of the variable with the short name SN.
204 FIXME: Need to resolve clashes somehow. */
208 cont_var_name(const char *sn, int idx)
/* Static storage: every call formats its result into this same
   buffer, overwriting the previous one. */
210 static char s[SHORT_NAME_LEN + 1];
/* ABB keeps the leading characters of SN, leaving room for the three
   digits of IDX.  It is zero-filled and one byte larger than what
   strncpy() may copy, so it is always null-terminated. */
212 char abb[SHORT_NAME_LEN + 1 - 3]= {0};
214 strncpy(abb, sn, SHORT_NAME_LEN - 3);
/* snprintf() cuts the result off at SHORT_NAME_LEN characters, which
   matters only if IDX needs more than three digits. */
216 snprintf(s, SHORT_NAME_LEN + 1, "%s%03d", abb, idx);
222 /* Opens the system file designated by file handle FH for writing
223 cases from dictionary D according to the given OPTS. If
224 OPTS.compress is nonzero, the system file will be compressed.
226 No reference to D is retained, so it may be modified or
227 destroyed at will after this function returns. D is not
228 modified by this function, except to assign short names. */
230 sfm_open_writer (struct file_handle *fh, struct dictionary *d,
231 struct sfm_write_options opts)
233 struct sfm_writer *w = NULL;
/* Only format versions 2 and 3 are recognized; any other value is
   reported to the user. */
240 if (opts.version != 2 && opts.version != 3)
242 msg (ME, _("Unknown system file version %d. Treating as version %d."),
/* Create the file readable by user, group and others, and writable
   by them as well when the caller asked for that. */
248 mode = S_IRUSR | S_IRGRP | S_IROTH;
249 if (opts.create_writeable)
250 mode |= S_IWUSR | S_IWGRP | S_IWOTH;
251 fd = open (fh_get_file_name (fh), O_WRONLY | O_CREAT | O_TRUNC, mode);
255 /* Open file handle. */
/* NOTE(review): FD is already open when fh_open() is called; confirm
   that the failure path closes it. */
256 if (!fh_open (fh, FH_REF_FILE, "system file", "we"))
259 /* Create and initialize writer. */
260 w = xmalloc (sizeof *w);
/* The stdio stream is layered on the descriptor opened above. */
262 w->file = fdopen (fd, "w");
264 w->needs_translation = dict_compacting_would_change (d);
265 w->compress = opts.compress;
270 w->buf = w->end = w->ptr = NULL;
273 w->var_cnt = dict_get_var_cnt (d);
274 w->var_cnt_vls = w->var_cnt;
275 w->vars = xnmalloc (w->var_cnt, sizeof *w->vars);
/* Record the width, case index and element count of every variable
   so that cases can later be written from W->vars alone. */
276 for (i = 0; i < w->var_cnt; i++)
278 const struct variable *dv = dict_get_var (d, i);
279 struct sfm_var *sv = &w->vars[i];
280 sv->width = var_get_width (dv);
281 /* spss compatibility nonsense */
282 if ( var_get_width (dv) >= MIN_VERY_LONG_STRING )
285 sv->fv = var_get_case_index (dv);
286 sv->flt64_cnt = var_flt64_cnt (dv);
289 /* Check that file create succeeded. */
296 /* Write the file header. */
299 /* Write basic variable info. */
300 dict_assign_short_names (d);
/* Variable records are written from a clone of V whose width is set
   piece by piece, so V itself is not changed.  A piece of a very
   long string gets width MIN_VERY_LONG_STRING - 1.  The clone also
   has its missing values and label cleared and is given a name from
   cont_var_name() -- presumably only for the pieces after the first;
   the controlling conditions are not visible here. */
301 for (i = 0; i < dict_get_var_cnt (d); i++)
304 const struct variable *v = dict_get_var(d, i);
305 int wcount = var_get_width (v);
308 struct variable *var_cont = var_clone (v);
309 var_set_short_name (var_cont, var_get_short_name (v));
310 if ( var_is_alpha (v))
314 var_clear_missing_values (var_cont);
315 var_set_short_name (var_cont,
316 cont_var_name (var_get_short_name (v),
318 var_clear_label (var_cont);
322 if ( wcount >= MIN_VERY_LONG_STRING )
324 var_set_width (var_cont, MIN_VERY_LONG_STRING - 1);
325 wcount -= EFFECTIVE_LONG_STRING_LENGTH;
329 var_set_width (var_cont, wcount);
330 wcount -= var_get_width (var_cont);
334 write_variable (w, var_cont);
335 var_destroy (var_cont);
339 /* Write out value labels. */
/* IDX is the running element index of the current variable: it
   advances by the variable's flt64 count, not by one. */
340 for (idx = i = 0; i < dict_get_var_cnt (d); i++)
342 struct variable *v = dict_get_var (d, i);
344 write_value_labels (w, v, idx);
345 idx += var_flt64_cnt (v);
348 if (dict_get_documents (d) != NULL)
349 write_documents (w, d);
353 write_variable_display_parameters (w, d);
/* The long variable name table is written for version 3 and up. */
355 if (opts.version >= 3)
356 write_longvar_table (w, d);
358 write_vls_length_table(w, d);
360 /* Write end-of-headers record. */
366 } ATTRIBUTE((packed))
369 rec_999.rec_type = 999;
372 buf_write (w, &rec_999, sizeof rec_999);
/* Set up the 128-element compression buffer.  Its first element is
   claimed right away as the first instruction octet, with X at its
   first byte and Y just past its last. */
377 w->buf = xnmalloc (128, sizeof *w->buf);
379 w->end = &w->buf[128];
380 w->x = (unsigned char *) w->ptr++;
381 w->y = (unsigned char *) w->ptr;
387 return casewriter_create (&sys_file_casewriter_class, w);
/* Error report: names the file and includes the errno text. */
394 msg (ME, _("Error opening \"%s\" for writing as a system file: %s."),
395 fh_get_file_name (fh), strerror (errno));
399 /* Returns value of X truncated to two least-significant digits. */
410 /* Write the sysfile_header header to system file W.

   As a side effect this adds the flt64 count of every variable in D
   to W->flt64_cnt; the total is stored as the nominal case size. */
412 write_header (struct sfm_writer *w, const struct dictionary *d)
414 struct sysfile_header hdr;
420 memcpy (hdr.rec_type, "$FL2", 4);
/* Product name: a fixed prefix, then the version, " - " and the host
   system as far as they fit, then spaces up to the end of the
   60-byte field. */
422 p = stpcpy (hdr.prod_name, "@(#) SPSS DATA FILE ");
423 p = append_string_max (p, version, &hdr.prod_name[60]);
424 p = append_string_max (p, " - ", &hdr.prod_name[60]);
425 p = append_string_max (p, host_system, &hdr.prod_name[60]);
426 memset (p, ' ', &hdr.prod_name[60] - p);
431 for (i = 0; i < dict_get_var_cnt (d); i++)
433 w->flt64_cnt += var_flt64_cnt (dict_get_var (d, i));
435 hdr.nominal_case_size = w->flt64_cnt;
437 hdr.compress = w->compress;
/* The weight index is counted in flt64 elements, starting from 1,
   rather than in dictionary variables. */
439 if (dict_get_weight (d) != NULL)
441 const struct variable *weight_var;
442 int recalc_weight_idx = 1;
445 weight_var = dict_get_weight (d);
448 struct variable *v = dict_get_var (d, i);
451 recalc_weight_idx += var_flt64_cnt (v);
453 hdr.weight_idx = recalc_weight_idx;
459 hdr.bias = COMPRESSION_BIAS;
/* If the current time cannot be obtained, a fixed date and time are
   written instead. */
461 if (time (&t) == (time_t) -1)
463 memcpy (hdr.creation_date, "01 Jan 70", 9);
464 memcpy (hdr.creation_time, "00:00:00", 8);
468 static const char *month_name[12] =
470 "Jan", "Feb", "Mar", "Apr", "May", "Jun",
471 "Jul", "Aug", "Sep", "Oct", "Nov", "Dec",
473 struct tm *tmp = localtime (&t);
/* Hour, minute and second are passed to rerange() plus one and
   printed minus one further down. */
474 int day = rerange (tmp->tm_mday);
475 int mon = rerange (tmp->tm_mon + 1);
476 int year = rerange (tmp->tm_year);
477 int hour = rerange (tmp->tm_hour + 1);
478 int min = rerange (tmp->tm_min + 1);
479 int sec = rerange (tmp->tm_sec + 1);
/* Only sizeof hdr.creation_date and sizeof hdr.creation_time bytes
   are copied out of BUF, so no terminator reaches the header. */
482 sprintf (buf, "%02d %s %02d", day, month_name[mon - 1], year);
483 memcpy (hdr.creation_date, buf, sizeof hdr.creation_date);
484 sprintf (buf, "%02d:%02d:%02d", hour - 1, min - 1, sec - 1);
485 memcpy (hdr.creation_time, buf, sizeof hdr.creation_time);
489 const char *label = dict_get_label (d);
493 buf_copy_str_rpad (hdr.file_label, sizeof hdr.file_label, label);
496 memset (hdr.padding, 0, sizeof hdr.padding);
498 buf_write (w, &hdr, sizeof hdr);
501 /* Translates format spec from internal form in SRC to system file format in DEST. */
504 write_format_spec (const struct fmt_spec *src, int32_t *dest)
506 assert (fmt_check_output (src));
/* Pack the spec into one 32-bit word: the result of fmt_to_io() for
   the type from bit 16 up, W shifted into bits 8 and up, and D in
   the low bits. */
507 *dest = (fmt_to_io (src->type) << 16) | (src->w << 8) | src->d;
510 /* Writes the variable record(s) for variable V to system
511 file W. */
513 write_variable (struct sfm_writer *w, const struct variable *v)
515 struct sysfile_variable sv;
517 /* Missing values. */
518 struct missing_values mv;
519 flt64 m[3]; /* Missing value values. */
520 int nm; /* Number of missing values, possibly negative. */
521 const char *label = var_get_label (v);
/* The type field never exceeds MIN_VERY_LONG_STRING - 1, whatever
   the width of V. */
524 sv.type = MIN (var_get_width (v), MIN_VERY_LONG_STRING - 1);
525 sv.has_var_label = label != NULL;
/* Work on a copy of the missing values, because popping them
   empties the set. */
527 mv_copy (&mv, var_get_missing_values (v));
/* A range goes first and takes two slots of M; the open ends LOWEST
   and HIGHEST are replaced by second_lowest_flt64 and FLT64_MAX. */
529 if (mv_has_range (&mv))
532 mv_pop_range (&mv, &x, &y);
533 m[nm++] = x == LOWEST ? second_lowest_flt64 : x;
534 m[nm++] = y == HIGHEST ? FLT64_MAX : y;
536 while (mv_has_value (&mv))
539 mv_pop_value (&mv, &value);
540 if (var_is_numeric (v))
543 buf_copy_rpad ((char *) &m[nm], sizeof m[nm], value.s,
/* NOTE(review): the statement guarded by this test is not visible
   here; presumably it makes NM negative to mark a range, matching
   the negative codes of n_missing_values -- confirm. */
547 if (mv_has_range (var_get_missing_values (v)))
550 sv.n_missing_values = nm;
551 write_format_spec (var_get_print_format (v), &sv.print);
552 write_format_spec (var_get_write_format (v), &sv.write);
553 buf_copy_str_rpad (sv.name, sizeof sv.name, var_get_short_name (v));
554 buf_write (w, &sv, sizeof sv);
562 } ATTRIBUTE((packed))
/* The label is cut off at 255 bytes and padded with spaces up to a
   multiple of the size of the length field; only the length field
   plus the padded text is written. */
567 l.label_len = MIN (strlen (label), 255);
568 ext_len = ROUND_UP (l.label_len, sizeof l.label_len);
569 memcpy (l.label, label, l.label_len);
570 memset (&l.label[l.label_len], ' ', ext_len - l.label_len);
572 buf_write (w, &l, offsetof (struct label, label) + ext_len);
/* NM may be negative, so its absolute value gives the number of
   slots of M to write. */
576 buf_write (w, m, sizeof *m * abs (nm));
/* A string wider than one flt64 is followed by one extra record per
   additional element, written from SV with label flag, missing-value
   count, formats and name all zeroed. */
578 if (var_is_alpha (v) && var_get_width (v) > (int) sizeof (flt64))
584 sv.has_var_label = 0;
585 sv.n_missing_values = 0;
586 memset (&sv.print, 0, sizeof sv.print);
587 memset (&sv.write, 0, sizeof sv.write);
588 memset (&sv.name, 0, sizeof sv.name);
590 pad_count = DIV_RND_UP (MIN(var_get_width (v), MIN_VERY_LONG_STRING - 1),
591 (int) sizeof (flt64)) - 1;
592 for (i = 0; i < pad_count; i++)
593 buf_write (w, &sv, sizeof sv);
597 /* Writes the value labels for variable V having system file
598 variable index IDX to system file W.

   IDX is zero-based; the index written to the file is IDX + 1.  The
   label record is assembled in a heap block whose size is computed
   in a first pass and which is filled in a second pass. */
600 write_value_labels (struct sfm_writer *w, struct variable *v, int idx)
602 struct value_label_rec
607 } ATTRIBUTE((packed));
614 } ATTRIBUTE((packed));
616 const struct val_labs *val_labs;
617 struct val_labs_iterator *i;
618 struct value_label_rec *vlr;
619 struct var_idx_rec vir;
624 val_labs = var_get_value_labels (v);
625 if (val_labs == NULL)
628 /* Pass 1: Count bytes. */
/* Each label needs one flt64 for the value plus the label text with
   its length byte, rounded up to a whole number of flt64s.  The
   count is independent of iteration order, so the unsorted iterator
   is enough here. */
629 vlr_size = (sizeof (struct value_label_rec)
630 + sizeof (flt64) * (val_labs_count (val_labs) - 1));
631 for (vl = val_labs_first (val_labs, &i); vl != NULL;
632 vl = val_labs_next (val_labs, &i))
633 vlr_size += ROUND_UP (strlen (vl->label) + 1, sizeof (flt64));
635 /* Pass 2: Copy bytes. */
636 vlr = xmalloc (vlr_size);
638 vlr->n_labels = val_labs_count (val_labs);
/* Labels are emitted in sorted order.  Each entry is the value, then
   a single length byte, the label text, and spaces up to the next
   flt64 boundary.  NOTE(review): the length is stored in one byte;
   confirm that labels can never be longer than 255 bytes. */
640 for (vl = val_labs_first_sorted (val_labs, &i); vl != NULL;
641 vl = val_labs_next (val_labs, &i))
643 size_t len = strlen (vl->label);
645 *loc++ = vl->value.f;
646 *(unsigned char *) loc = len;
647 memcpy (&((char *) loc)[1], vl->label, len);
648 memset (&((char *) loc)[1 + len], ' ',
649 REM_RND_UP (len + 1, sizeof (flt64)));
650 loc += DIV_RND_UP (len + 1, sizeof (flt64));
653 buf_write (w, vlr, vlr_size);
/* The variable index record names the single variable the labels
   apply to, using a 1-based index. */
658 vir.vars[0] = idx + 1;
659 buf_write (w, &vir, sizeof vir);
662 /* Writes record type 6, document record.

   The documents of D are treated as a sequence of 80-byte lines: the
   record header carries the line count and is followed by the text
   itself.  The caller is expected to have checked that D has
   documents, since the result of dict_get_documents() is passed
   straight to strlen(). */
664 write_documents (struct sfm_writer *w, const struct dictionary *d)
668 int32_t rec_type ; /* Always 6. */
669 int32_t n_lines ; /* Number of lines of documents. */
670 } ATTRIBUTE((packed)) rec_6;
672 const char * documents = dict_get_documents (d);
673 size_t doc_bytes = strlen (documents);
/* The text must consist of whole 80-byte lines. */
675 assert (doc_bytes % 80 == 0);
678 rec_6.n_lines = doc_bytes / 80;
679 buf_write (w, &rec_6, sizeof rec_6);
680 buf_write (w, documents, 80 * rec_6.n_lines);
683 /* Write the alignment, width and scale values

   Writes a record of type 7, subtype 11, to W: a header followed by
   three 4-byte values (measure, display width, alignment) for every
   variable of DICT.  The header announces W->var_cnt_vls * 3
   elements, so a long string variable contributes further triples
   for its additional pieces; those reuse the measure and alignment
   of the variable and only differ in width. */
685 write_variable_display_parameters (struct sfm_writer *w,
686 const struct dictionary *dict)
696 } ATTRIBUTE((packed)) vdp_hdr;
698 vdp_hdr.rec_type = 7;
699 vdp_hdr.subtype = 11;
700 vdp_hdr.elem_size = 4;
701 vdp_hdr.n_elem = w->var_cnt_vls * 3;
703 buf_write (w, &vdp_hdr, sizeof vdp_hdr);
705 for ( i = 0 ; i < w->var_cnt ; ++i )
713 } ATTRIBUTE((packed)) params;
715 v = dict_get_var(dict, i);
/* Measure codes: 1 for nominal, 2 for ordinal. */
717 params.measure = (var_get_measure (v) == MEASURE_NOMINAL ? 1
718 : var_get_measure (v) == MEASURE_ORDINAL ? 2
720 params.width = var_get_display_width (v);
/* Alignment codes: 0 for left, 1 for right. */
721 params.align = (var_get_alignment (v) == ALIGN_LEFT ? 0
722 : var_get_alignment (v) == ALIGN_RIGHT ? 1
/* buf_write() takes the address of the triple. */
725 buf_write (w, &params, sizeof(params));
727 if (var_is_long_string (v))
729 int wcount = var_get_width (v) - EFFECTIVE_LONG_STRING_LENGTH ;
/* A remaining piece that is itself very long is given width 32;
   otherwise the remaining width is used. */
733 params.width = wcount >= MIN_VERY_LONG_STRING ? 32 : wcount;
735 buf_write (w, &params, sizeof(params));
737 wcount -= EFFECTIVE_LONG_STRING_LENGTH ;
743 /* Writes the table of lengths for Very Long String Variables

   The table is a record of type 7, subtype 14, with one-byte
   elements.  Its payload is text built up in a string: for each
   variable concerned, the short name, `=', the width as five digits,
   then a null byte and a tab.  Nothing at all is written when the
   payload is empty. */
745 write_vls_length_table (struct sfm_writer *w,
746 const struct dictionary *dict)
755 } ATTRIBUTE((packed)) vls_hdr;
757 struct string vls_length_map;
759 ds_init_empty (&vls_length_map);
761 vls_hdr.rec_type = 7;
762 vls_hdr.subtype = 14;
763 vls_hdr.elem_size = 1;
766 for (i = 0; i < dict_get_var_cnt (dict); ++i)
768 const struct variable *v = dict_get_var (dict, i);
/* Variables narrower than MIN_VERY_LONG_STRING are presumably
   skipped; the statement guarded by this test is not visible. */
770 if ( var_get_width (v) < MIN_VERY_LONG_STRING )
773 ds_put_format (&vls_length_map, "%s=%05d",
774 var_get_short_name (v), var_get_width (v));
775 ds_put_char (&vls_length_map, '\0');
776 ds_put_char (&vls_length_map, '\t');
/* With one-byte elements the element count is the payload length. */
779 vls_hdr.n_elem = ds_length (&vls_length_map);
781 if ( vls_hdr.n_elem > 0 )
783 buf_write (w, &vls_hdr, sizeof vls_hdr);
784 buf_write (w, ds_data (&vls_length_map), ds_length (&vls_length_map));
787 ds_destroy (&vls_length_map);
790 /* Writes the long variable name table

   The payload is text of the form SHORTNAME=LONGNAME for the
   variables of DICT, with tab characters between entries, written
   after a header with one-byte elements whose count is the payload
   length. */
792 write_longvar_table (struct sfm_writer *w, const struct dictionary *dict)
800 } ATTRIBUTE((packed)) lv_hdr;
802 struct string long_name_map;
805 ds_init_empty (&long_name_map);
806 for (i = 0; i < dict_get_var_cnt (dict); i++)
808 struct variable *v = dict_get_var (dict, i);
/* The tab is presumably added only between entries; the condition
   that guards it is not visible here. */
811 ds_put_char (&long_name_map, '\t');
812 ds_put_format (&long_name_map, "%s=%s",
813 var_get_short_name (v), var_get_name (v));
818 lv_hdr.elem_size = 1;
819 lv_hdr.n_elem = ds_length (&long_name_map);
821 buf_write (w, &lv_hdr, sizeof lv_hdr);
822 buf_write (w, ds_data (&long_name_map), ds_length (&long_name_map));
824 ds_destroy (&long_name_map);
827 /* Writes record type 7, subtypes 3 and 4.

   Both subtypes are laid out in one packed structure and written
   with a single buf_write() call.  Subtype 3 holds int32_t elements,
   beginning with the three components of the program version
   followed by -1.  Subtype 4 holds three flt64 elements:
   -FLT64_MAX, FLT64_MAX and second_lowest_flt64. */
829 write_rec_7_34 (struct sfm_writer *w)
835 int32_t data_type_3 ;
840 int32_t data_type_4 ;
843 } ATTRIBUTE((packed)) rec_7;
845 /* Components of the version number, from major to minor. */
846 int version_component[3];
848 /* Used to step through the version string. */
/* NOTE(review): both strtol() calls below start at bare_version, so
   as written the second one parses the same digits as the first;
   presumably it should continue from P -- confirm.  The comment that
   follows has also lost its closing line in this copy. */
851 /* Parses the version string, which is assumed to be of the form
852 #.#x, where each # is a string of digits, and x is a single
854 version_component[0] = strtol (bare_version, &p, 10);
857 version_component[1] = strtol (bare_version, &p, 10);
858 version_component[2] = (isalpha ((unsigned char) *p)
859 ? tolower ((unsigned char) *p) - 'a' : 0);
861 rec_7.rec_type_3 = 7;
863 rec_7.data_type_3 = sizeof (int32_t);
865 rec_7.elem_3[0] = version_component[0];
866 rec_7.elem_3[1] = version_component[1];
867 rec_7.elem_3[2] = version_component[2];
868 rec_7.elem_3[3] = -1;
870 /* PORTME: 1=IEEE754, 2=IBM 370, 3=DEC VAX E. */
877 /* PORTME: 1=big-endian, 2=little-endian. */
884 /* PORTME: 1=EBCDIC, 2=7-bit ASCII, 3=8-bit ASCII, 4=DEC Kanji. */
887 rec_7.rec_type_4 = 7;
/* For subtype 4 the element size is that of a flt64. */
889 rec_7.data_type_4 = sizeof (flt64);
891 rec_7.elem_4[0] = -FLT64_MAX;
892 rec_7.elem_4[1] = FLT64_MAX;
893 rec_7.elem_4[2] = second_lowest_flt64;
895 buf_write (w, &rec_7, sizeof rec_7);
898 /* Write NBYTES starting at BUF to the system file represented by W. */
901 buf_write (struct sfm_writer *w, const void *buf, size_t nbytes)
903 assert (buf != NULL);
/* The result of fwrite() is not examined here; a failed write is
   picked up later through ferror() on the same stream, see
   write_error(). */
904 fwrite (buf, nbytes, 1, w->file);
/* Copies string SRC to DEST with the proviso that DEST does not reach
   byte END; no null terminator is copied.  If SRC does not fit, only
   its leading bytes that do fit are copied.  Returns a pointer to the
   byte after the last byte copied, which is DEST itself when SRC is
   empty or when DEST is already at or past END. */
static char *
append_string_max (char *dest, const char *src, const char *end)
{
  size_t room;
  size_t nbytes;

  /* No room at all.  Checking first also keeps a negative distance
     from being turned into a huge copy length. */
  if (dest >= end)
    return dest;

  /* Lengths are kept in size_t so that a very long SRC cannot be
     truncated by a conversion to int. */
  room = (size_t) (end - dest);
  nbytes = strlen (src);
  if (nbytes > room)
    nbytes = room;

  memcpy (dest, src, nbytes);
  return dest + nbytes;
}
918 /* Makes certain that the compression buffer of W has room for another
919 element. If there's not room, pads out the current instruction
920 octet with zero and dumps out the buffer. */
922 ensure_buf_space (struct sfm_writer *w)
924 if (w->ptr >= w->end)
/* Zero the bytes of the instruction octet that are still unused, so
   that the element holding it is fully defined when written. */
926 memset (w->x, 0, w->y - w->x);
/* The whole buffer is written: 128 elements, the size it was
   allocated with in sfm_open_writer(). */
929 buf_write (w, w->buf, sizeof *w->buf * 128);
933 static void write_compressed_data (struct sfm_writer *w, const flt64 *elem);
935 /* Writes case C to system file W.

   This is the write callback of the casewriter class; W_ is the
   struct sfm_writer that was passed to casewriter_create(). */
937 sys_file_casewriter_write (struct casewriter *writer, void *w_,
940 struct sfm_writer *w = w_;
/* Once the stream is in an error state, flag the casewriter rather
   than writing more data. */
941 if (ferror (w->file))
943 casewriter_force_error (writer);
/* The case can be written straight from memory only if no
   translation or compression is needed, a flt64 has the size of a
   union value, and there are no very long strings.
   NOTE(review): the fast-path comment below has lost its closing
   line in this copy. */
950 if (!w->needs_translation && !w->compress
951 && sizeof (flt64) == sizeof (union value) && ! w->has_vls )
953 /* Fast path: external and internal representations are the
954 same and the dictionary is properly ordered. Write
956 buf_write (w, case_data_all (c), sizeof (union value) * w->flt64_cnt);
960 /* Slow path: internal and external representations differ.
961 Write into a bounce buffer, then write to W. */
/* NOTE(review): BOUNCE_SIZE is a byte count, yet it is added to
   BOUNCE as an element count, so BOUNCE_END does not point at the
   end of the buffer -- confirm whether BOUNCE_END is used at all. */
968 bounce_size = sizeof *bounce * w->flt64_cnt;
969 bounce = bounce_cur = local_alloc (bounce_size);
970 bounce_end = bounce + bounce_size;
972 for (i = 0; i < w->var_cnt; i++)
974 struct sfm_var *v = &w->vars[i];
/* Pre-fill the variable's whole slot with spaces, so that whatever
   the copy below does not cover ends up as padding. */
976 memset(bounce_cur, ' ', v->flt64_cnt * sizeof (flt64));
980 *bounce_cur = case_num_idx (c, v->fv);
981 bounce_cur += v->flt64_cnt;
/* String data is copied in chunks of at most
   MIN_VERY_LONG_STRING - 1 bytes, each padded out to a whole number
   of flt64 elements. */
985 while (ofs < v->width)
987 int chunk = MIN (MIN_VERY_LONG_STRING - 1, v->width - ofs);
988 int nv = DIV_RND_UP (chunk, sizeof (flt64));
989 buf_copy_rpad ((char *) bounce_cur, nv * sizeof (flt64),
990 case_data_idx (c, v->fv)->s + ofs, chunk);
/* The bounce buffer goes out either verbatim or through the
   compressor. */
999 buf_write (w, bounce, bounce_size);
1001 write_compressed_data (w, bounce);
1003 local_free (bounce);
/* Destroy callback of the casewriter class: closes the system file
   behind W_ and flags WRITER with an error if closing reports a
   failure. */
1010 sys_file_casewriter_destroy (struct casewriter *writer, void *w_)
1012 struct sfm_writer *w = w_;
1013 if (!close_writer (w))
1014 casewriter_force_error (writer);
/* Appends the byte INSTRUCTION to the current instruction octet of
   W's compression buffer. */
1018 put_instruction (struct sfm_writer *w, unsigned char instruction)
/* Start a new instruction octet: it takes the next whole element of
   the buffer, with X at its first byte and Y just past its last.
   Presumably this happens only when the current octet is full; the
   guarding condition is not visible here. */
1022 ensure_buf_space (w);
1023 w->x = (unsigned char *) w->ptr++;
1024 w->y = (unsigned char *) w->ptr;
1026 *w->x++ = instruction;
/* Appends a copy of the element at ELEM to W's compression buffer,
   making room first if the buffer is full. */
1030 put_element (struct sfm_writer *w, const flt64 *elem)
1032 ensure_buf_space (w);
/* memcpy() moves the raw bytes, so the element may hold string data
   as well as a number. */
1033 memcpy (w->ptr++, elem, sizeof *elem);
/* Writes the case stored at ELEM to W in compressed form.  ELEM holds
   the elements of all of W's variables in order.  Each element
   becomes one instruction byte, followed by the element itself when
   the instruction is 253. */
1037 write_compressed_data (struct sfm_writer *w, const flt64 *elem)
1041 for (i = 0; i < w->var_cnt; i++)
1043 struct sfm_var *v = &w->vars[i];
/* Numeric element: 255 stands for -FLT64_MAX, and a whole number
   between 1 - COMPRESSION_BIAS and 251 - COMPRESSION_BIAS is encoded
   as the number plus the bias.  Anything else is written out in full
   after instruction 253. */
1047 if (*elem == -FLT64_MAX)
1048 put_instruction (w, 255);
1049 else if (*elem >= 1 - COMPRESSION_BIAS
1050 && *elem <= 251 - COMPRESSION_BIAS
1051 && *elem == (int) *elem)
1052 put_instruction (w, (int) *elem + COMPRESSION_BIAS);
1055 put_instruction (w, 253);
1056 put_element (w, elem);
/* String elements: 254 stands for an element made up entirely of
   spaces.  The literal must supply sizeof (flt64) bytes for memcmp()
   to read, hence the eight spaces. */
1064 for (j = 0; j < v->flt64_cnt; j++, elem++)
1066 if (!memcmp (elem, "        ", sizeof (flt64)))
1067 put_instruction (w, 254);
1070 put_instruction (w, 253);
1071 put_element (w, elem);
1078 /* Returns true if an I/O error has occurred on WRITER, false otherwise.

   The test is ferror() on WRITER's stream, so it reflects every write
   made through that stream so far. */
1080 write_error (const struct sfm_writer *writer)
1082 return ferror (writer->file);
1085 /* Closes a system file after we're done with it.
1086 Returns true if successful, false if an I/O error occurred. */
1088 close_writer (struct sfm_writer *w)
1096 if (w->file != NULL)
/* Write out whatever is left in the compression buffer, after
   zeroing the unused part of the current instruction octet.  Only
   the elements actually filled are written. */
1099 if (w->buf != NULL && w->ptr > w->buf)
1101 memset (w->x, 0, w->y - w->x);
1102 buf_write (w, w->buf, (w->ptr - w->buf) * sizeof *w->buf);
1106 ok = !write_error (w);
1108 /* Seek back to the beginning and update the number of cases.
1109 This is just a courtesy to later readers, so there's no need
1110 to check return values or report errors. */
1111 if (ok && !fseek (w->file, offsetof (struct sysfile_header, case_cnt),
/* The counter is copied into an int32_t so that exactly the size of
   the header field is written. */
1114 int32_t case_cnt = w->case_cnt;
1115 fwrite (&case_cnt, sizeof case_cnt, 1, w->file);
/* fclose() flushes the stream, so its result is checked as well. */
1119 if (fclose (w->file) == EOF)
1123 msg (ME, _("An I/O error occurred writing system file \"%s\"."),
1124 fh_get_file_name (w->fh));
1127 fh_close (w->fh, "system file", "we");
/* Casewriter class for system files, passed to casewriter_create()
   by sfm_open_writer().  The members visible here are the write and
   destroy callbacks, in that order. */
1136 static struct casewriter_class sys_file_casewriter_class =
1138 sys_file_casewriter_write,
1139 sys_file_casewriter_destroy,