1 /* PSPP - computes sample statistics.
2 Copyright (C) 1997-9, 2000, 2006 Free Software Foundation, Inc.
3 Written by Ben Pfaff <blp@gnu.org>.
5 This program is free software; you can redistribute it and/or
6 modify it under the terms of the GNU General Public License as
7 published by the Free Software Foundation; either version 2 of the
8 License, or (at your option) any later version.
10 This program is distributed in the hope that it will be useful, but
11 WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 General Public License for more details.
15 You should have received a copy of the GNU General Public License
16 along with this program; if not, write to the Free Software
17 Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
29 /* Reverses the order of NBYTES bytes at address P, thus converting
30 between little- and big-endian byte orders. */
32 buf_reverse (char *p, size_t nbytes)
34 char *h = p, *t = &h[nbytes - 1];
46 /* Finds the last NEEDLE of length NEEDLE_LEN in a HAYSTACK of length
47 HAYSTACK_LEN. Returns a pointer to the needle found. */
49 buf_find_reverse (const char *haystack, size_t haystack_len,
50 const char *needle, size_t needle_len)
53 for (i = haystack_len - needle_len; i >= 0; i--)
54 if (!memcmp (needle, &haystack[i], needle_len))
55 return (char *) &haystack[i];
59 /* Compares the SIZE bytes in A to those in B, disregarding case,
60 and returns a strcmp()-type result. */
62 buf_compare_case (const char *a_, const char *b_, size_t size)
64 const unsigned char *a = (unsigned char *) a_;
65 const unsigned char *b = (unsigned char *) b_;
69 unsigned char ac = toupper (*a++);
70 unsigned char bc = toupper (*b++);
73 return ac > bc ? 1 : -1;
79 /* Compares A of length A_LEN to B of length B_LEN. The shorter
80 string is considered to be padded with spaces to the length of
83 buf_compare_rpad (const char *a, size_t a_len, const char *b, size_t b_len)
88 min_len = a_len < b_len ? a_len : b_len;
89 result = memcmp (a, b, min_len);
98 for (idx = min_len; idx < b_len; idx++)
100 return ' ' > b[idx] ? 1 : -1;
104 for (idx = min_len; idx < a_len; idx++)
106 return a[idx] > ' ' ? 1 : -1;
112 /* Compares strin A to string B. The shorter string is
113 considered to be padded with spaces to the length of the
116 str_compare_rpad (const char *a, const char *b)
118 return buf_compare_rpad (a, strlen (a), b, strlen (b));
121 /* Copies string SRC to buffer DST, of size DST_SIZE bytes.
122 DST is truncated to DST_SIZE bytes or padded on the right with
125 buf_copy_str_rpad (char *dst, size_t dst_size, const char *src)
127 size_t src_len = strlen (src);
128 if (src_len >= dst_size)
129 memcpy (dst, src, dst_size);
132 memcpy (dst, src, src_len);
133 memset (&dst[src_len], ' ', dst_size - src_len);
137 /* Copies string SRC to buffer DST, of size DST_SIZE bytes.
138 DST is truncated to DST_SIZE bytes or padded on the left with
141 buf_copy_str_lpad (char *dst, size_t dst_size, const char *src)
143 size_t src_len = strlen (src);
144 if (src_len >= dst_size)
145 memcpy (dst, src, dst_size);
148 size_t pad_cnt = dst_size - src_len;
149 memset (&dst[0], ' ', pad_cnt);
150 memcpy (dst + pad_cnt, src, src_len);
154 /* Copies buffer SRC, of SRC_SIZE bytes, to DST, of DST_SIZE bytes.
155 DST is truncated to DST_SIZE bytes or padded on the right with
158 buf_copy_rpad (char *dst, size_t dst_size,
159 const char *src, size_t src_size)
161 if (src_size >= dst_size)
162 memmove (dst, src, dst_size);
165 memmove (dst, src, src_size);
166 memset (&dst[src_size], ' ', dst_size - src_size);
170 /* Copies string SRC to string DST, which is in a buffer DST_SIZE
172 Truncates DST to DST_SIZE - 1 characters or right-pads with
173 spaces to DST_SIZE - 1 characters if necessary. */
175 str_copy_rpad (char *dst, size_t dst_size, const char *src)
177 size_t src_len = strlen (src);
178 if (src_len < dst_size - 1)
180 memcpy (dst, src, src_len);
181 memset (&dst[src_len], ' ', dst_size - 1 - src_len);
184 memcpy (dst, src, dst_size - 1);
185 dst[dst_size - 1] = 0;
188 /* Copies SRC to DST, which is in a buffer DST_SIZE bytes long.
189 Truncates DST to DST_SIZE - 1 characters, if necessary. */
191 str_copy_trunc (char *dst, size_t dst_size, const char *src)
193 size_t src_len = strlen (src);
194 assert (dst_size > 0);
195 if (src_len + 1 < dst_size)
196 memcpy (dst, src, src_len + 1);
199 memcpy (dst, src, dst_size - 1);
200 dst[dst_size - 1] = '\0';
204 /* Copies buffer SRC, of SRC_LEN bytes,
205 to DST, which is in a buffer DST_SIZE bytes long.
206 Truncates DST to DST_SIZE - 1 characters, if necessary. */
208 str_copy_buf_trunc (char *dst, size_t dst_size,
209 const char *src, size_t src_size)
212 assert (dst_size > 0);
214 dst_len = src_size < dst_size ? src_size : dst_size - 1;
215 memcpy (dst, src, dst_len);
219 /* Converts each character in S to uppercase. */
221 str_uppercase (char *s)
223 for (; *s != '\0'; s++)
224 *s = toupper ((unsigned char) *s);
227 /* Converts each character in S to lowercase. */
229 str_lowercase (char *s)
231 for (; *s != '\0'; s++)
232 *s = tolower ((unsigned char) *s);
235 /* Initializes ST with initial contents S. */
237 ds_create (struct string *st, const char *s)
239 st->length = strlen (s);
240 st->capacity = 8 + st->length * 2;
241 st->string = xmalloc (st->capacity + 1);
242 strcpy (st->string, s);
245 /* Initializes DST with the contents of SRC between characters FIRST and LAST
248 ds_create_substr(struct string *dst, const struct string *src,
251 assert(last >= first);
252 dst->length = last - first + 1;
253 dst->capacity = 8 + dst->length * 2;
254 dst->string = xmalloc (dst->capacity + 1);
256 memcpy (dst->string, &src->string[first], dst->length);
260 /* Initializes ST, making room for at least CAPACITY characters. */
262 ds_init (struct string *st, size_t capacity)
266 st->capacity = capacity;
269 st->string = xmalloc (st->capacity + 1);
272 /* Replaces the contents of ST with STRING. STRING may overlap with
275 ds_replace (struct string *st, const char *string)
277 size_t new_length = strlen (string);
278 if (new_length > st->capacity)
280 /* The new length is longer than the allocated length, so
281 there can be no overlap. */
283 ds_concat (st, string, new_length);
287 /* Overlap is possible, but the new string will fit in the
288 allocated space, so we can just copy data. */
289 st->length = new_length;
290 memmove (st->string, string, st->length);
296 ds_destroy (struct string *st)
302 /* Swaps the contents of strings A and B. */
304 ds_swap (struct string *a, struct string *b)
306 struct string tmp = *a;
311 /* Truncates ST to zero length. */
313 ds_clear (struct string *st)
318 /* Pad ST on the right with copies of PAD until ST is at least
319 LENGTH characters in size. If ST is initially LENGTH
320 characters or longer, this is a no-op. */
322 ds_rpad (struct string *st, size_t length, char pad)
325 if (st->length < length)
327 if (st->capacity < length)
328 ds_extend (st, length);
329 memset (&st->string[st->length], pad, length - st->length);
334 /* Removes trailing spaces from ST.
335 Returns number of spaces removed. */
337 ds_rtrim_spaces (struct string *st)
340 while (isspace (ds_last (st)))
348 /* Removes leading spaces from ST.
349 Returns number of spaces removed. */
351 ds_ltrim_spaces (struct string *st)
353 int idx = ds_n_find(st, "\t ");
359 int len = ds_length(st);
364 ds_replace(st, &ds_c_str(st)[idx]);
370 /* If the last character in ST is C, removes it and returns true.
371 Otherwise, returns false without modifying ST. */
373 ds_chomp (struct string *st, char c_)
375 unsigned char c = c_;
376 if (ds_last (st) == c)
385 /* Ensures that ST can hold at least MIN_CAPACITY characters plus a null
388 ds_extend (struct string *st, size_t min_capacity)
390 if (min_capacity > st->capacity)
393 if (st->capacity < min_capacity)
394 st->capacity = min_capacity * 2;
396 st->string = xrealloc (st->string, st->capacity + 1);
400 /* Shrink ST to the minimum capacity need to contain its content. */
402 ds_shrink (struct string *st)
404 if (st->capacity != st->length)
406 st->capacity = st->length;
407 st->string = xrealloc (st->string, st->capacity + 1);
411 /* Truncates ST to at most LENGTH characters long. */
413 ds_truncate (struct string *st, size_t length)
415 if (length >= st->length)
420 /* Returns true if ST is empty, false otherwise. */
422 ds_is_empty (const struct string *st)
424 return st->length == 0;
427 /* Returns the length of ST. */
429 ds_length (const struct string *st)
434 /* Returns the allocation size of ST. */
436 ds_capacity (const struct string *st)
442 /* Returns the index of the first character in ST which
443 is an element of the set CS.
444 Returns -1 if no characters are found.
447 ds_find(const struct string *st, const char cs[])
451 for(i = 0; i < st->length ; ++i)
453 if ('\0' == st->string[i])
455 for (j = 0 ; j < strlen(cs) ; ++j)
457 if ( st->string[i] == cs[j])
464 /* Returns the index of the first character in ST which
465 is NOT an element of the set CS.
466 Returns -1 if no such character is found.
469 ds_n_find(const struct string *st, const char cs[])
473 for(i = 0; i < st->length ; ++i)
476 if ('\0' == st->string[i])
478 for (j = 0 ; j < strlen(cs) ; ++j)
480 if ( st->string[i] == cs[j])
494 /* Returns the first character in ST as a value in the range of
495 unsigned char. Returns EOF if ST is the empty string. */
497 ds_first (const struct string *st)
499 return st->length > 0 ? (unsigned char) st->string[0] : EOF;
502 /* Returns the last character in ST as a value in the range of
503 unsigned char. Returns EOF if ST is the empty string. */
505 ds_last (const struct string *st)
507 return st->length > 0 ? (unsigned char) st->string[st->length - 1] : EOF;
510 /* Returns the value of ST as a null-terminated string. */
512 ds_c_str (const struct string *st)
514 ((char *) st->string)[st->length] = '\0';
518 /* Returns the string data inside ST. */
520 ds_data (const struct string *st)
525 /* Returns a pointer to the null terminator ST.
526 This might not be an actual null character unless ds_c_str() has
527 been called since the last modification to ST. */
529 ds_end (const struct string *st)
531 return st->string + st->length;
534 /* Concatenates S onto ST. */
536 ds_puts (struct string *st, const char *s)
543 ds_extend (st, st->length + s_len);
544 strcpy (st->string + st->length, s);
548 /* Concatenates LEN characters from BUF onto ST. */
550 ds_concat (struct string *st, const char *buf, size_t len)
552 ds_extend (st, st->length + len);
553 memcpy (st->string + st->length, buf, len);
557 void ds_vprintf (struct string *st, const char *format, va_list args);
560 /* Formats FORMAT as a printf string and appends the result to ST. */
562 ds_printf (struct string *st, const char *format, ...)
566 va_start (args, format);
567 ds_vprintf(st,format,args);
572 /* Formats FORMAT as a printf string and appends the result to ST. */
574 ds_vprintf (struct string *st, const char *format, va_list args)
576 /* Fscking glibc silently changed behavior between 2.0 and 2.1.
577 Fsck fsck fsck. Before, it returned -1 on buffer overflow. Now,
578 it returns the number of characters (not bytes) that would have
585 avail = st->capacity - st->length + 1;
586 needed = vsnprintf (st->string + st->length, avail, format, args);
591 ds_extend (st, st->length + needed);
593 vsprintf (st->string + st->length, format, a1);
601 ds_extend (st, (st->capacity + 1) * 2);
602 avail = st->capacity - st->length + 1;
604 needed = vsnprintf (st->string + st->length, avail, format, a2);
610 st->length += needed;
613 /* Appends character CH to ST. */
615 ds_putc (struct string *st, int ch)
617 if (st->length == st->capacity)
618 ds_extend (st, st->length + 1);
619 st->string[st->length++] = ch;
622 /* Appends to ST a newline-terminated line read from STREAM.
623 Newline is the last character of ST on return, unless an I/O error
624 or end of file is encountered after reading some characters.
625 Returns 1 if a line is successfully read, or 0 if no characters at
626 all were read before an I/O error or end of file was
629 ds_gets (struct string *st, FILE *stream)
649 /* Reads a line from STREAM into ST, then preprocesses as follows:
651 - Splices lines terminated with `\'.
653 - Deletes comments introduced by `#' outside of single or double
656 - Trailing whitespace will be deleted.
658 Increments cust_ln as appropriate.
660 Returns nonzero only if a line was successfully read. */
662 ds_get_config_line (FILE *stream, struct string *st, struct file_locator *where)
664 /* Read the first line. */
666 where->line_number++;
667 if (!ds_gets (st, stream))
670 /* Read additional lines, if any. */
673 /* Remove trailing whitespace. */
675 char *s = ds_c_str (st);
676 size_t len = ds_length (st);
678 while (len > 0 && isspace ((unsigned char) s[len - 1]))
680 ds_truncate (st, len);
683 /* Check for trailing \. Remove if found, bail otherwise. */
684 if (ds_length (st) == 0 || ds_c_str (st)[ds_length (st) - 1] != '\\')
686 ds_truncate (st, ds_length (st) - 1);
688 /* Append another line and go around again. */
690 int success = ds_gets (st, stream);
691 where->line_number++;
697 /* Find a comment and remove. */
702 for (cp = ds_c_str (st); *cp; cp++)
707 else if (*cp == '\\')
710 else if (*cp == '\'' || *cp == '"')
714 ds_truncate (st, cp - ds_c_str (st));
722 /* Lengthed strings. */
724 /* Creates a new lengthed string LS with contents as a copy of
727 ls_create (struct fixed_string *ls, const char *s)
729 ls->length = strlen (s);
730 ls->string = xmalloc (ls->length + 1);
731 memcpy (ls->string, s, ls->length + 1);
734 /* Creates a new lengthed string LS with contents as a copy of
735 BUFFER with length LEN. */
737 ls_create_buffer (struct fixed_string *ls,
738 const char *buffer, size_t len)
741 ls->string = xmalloc (len + 1);
742 memcpy (ls->string, buffer, len);
743 ls->string[len] = '\0';
746 /* Sets the fields of LS to the specified values. */
748 ls_init (struct fixed_string *ls, const char *string, size_t length)
750 ls->string = (char *) string;
754 /* Copies the fields of SRC to DST. */
756 ls_shallow_copy (struct fixed_string *dst, const struct fixed_string *src)
761 /* Frees the memory backing LS. */
763 ls_destroy (struct fixed_string *ls)
768 /* Sets LS to a null pointer value. */
770 ls_null (struct fixed_string *ls)
775 /* Returns nonzero only if LS has a null pointer value. */
777 ls_null_p (const struct fixed_string *ls)
779 return ls->string == NULL;
782 /* Returns nonzero only if LS is a null pointer or has length 0. */
784 ls_empty_p (const struct fixed_string *ls)
786 return ls->string == NULL || ls->length == 0;
789 /* Returns the length of LS, which must not be null. */
791 ls_length (const struct fixed_string *ls)
796 /* Returns a pointer to the character string in LS. */
798 ls_c_str (const struct fixed_string *ls)
800 return (char *) ls->string;
803 /* Returns a pointer to the null terminator of the character string in
806 ls_end (const struct fixed_string *ls)
808 return (char *) (ls->string + ls->length);