X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=dump2.c;h=15670ecf4bb7c8de1ba8986290fa0fde8f53046f;hb=00357578f9bdbe00e5237bdb82dc80ec2214cbef;hp=4fd7531ab530df5860a01cb27195008f47aef06d;hpb=c4b1f46d58ad414cb60147092e4cdc3ce207db8a;p=pspp diff --git a/dump2.c b/dump2.c index 4fd7531ab5..15670ecf4b 100644 --- a/dump2.c +++ b/dump2.c @@ -7,6 +7,7 @@ #include #include #include +#include "u8-mbtouc.h" static uint8_t *data; static size_t n, pos; @@ -86,10 +87,25 @@ all_ascii(const uint8_t *p) return true; } +static bool +all_utf8(const uint8_t *p) +{ + size_t len = strlen ((char *) p); + for (size_t ofs = 0, mblen; ofs < len; ofs += mblen) + { + ucs4_t uc; + + mblen = u8_mbtouc (&uc, p + ofs, len - ofs); + if (uc < 32 || uc == 127 || uc == 0xfffd) + return false; + } + return true; +} + static char * get_fixed_string(int len, const char *where) { - if (pos + len > n || !memchr(&data[pos], 0, len) || !all_ascii(&data[pos])) + if (pos + len > n || !memchr(&data[pos], 0, len) || !all_utf8(&data[pos])) { fprintf(stderr, "%s: 0x%x: bad fixed-width string\n", where, pos); exit(1); @@ -190,7 +206,7 @@ dump_raw(FILE *stream, int start, int end, const char *separator) } static void -dump_source(int count, int n_series) +dump_source(int end, int count, int n_series, const char *name) { const union { @@ -216,17 +232,22 @@ dump_source(int count, int n_series) printf ("\n"); } - if (!n_sysmis) + if (pos >= end) return; - printf ("\n %08x:", pos); - printf (" %d", get_u32()); - printf (", \"%s\"\n", get_string()); + match_u32_assert(1); + char *name2 = get_string(); + assert(!strcmp(name, name2)); printf ("\n %08x:", pos); int n_more_series = get_u32(); + if (n_series != n_more_series) + printf("different series counts: %d %d\n", n_series, n_more_series); + assert(n_more_series <= n_series); printf (" %d series to come\n", n_more_series); + int max1 = -1; + int ofs = pos; for (int i = 0; i < n_more_series; i++) { printf ("%08x:", pos); @@ -236,21 +257,45 @@ dump_source(int count, int n_series) { int x = get_u32(); int y = get_u32(); - printf (" (%d,%d)", x, y); + printf (" (%d, %d)", x, y); + if (y > max1) + max1 = y; } printf ("\n"); } printf ("\n%08x:", pos); int n_strings = get_u32(); + assert(n_strings == max1 + 1); printf (" %d strings\n", n_strings); + + char **strings = malloc(n_strings * sizeof *strings); for (int i = 0; i < n_strings; i++) { - int x = get_u32(); + int frequency = get_u32(); char *s = get_string(); - printf ("%d: \"%s\" (%d)\n", i, s, x); + printf ("%d: \"%s\" (%d)\n", i, s, frequency); + strings[i] = s; } printf ("\n"); + + assert (pos == end); + pos = ofs; + printf("Strings:\n"); + for (int i = 0; i < n_more_series; i++) + { + printf (" \"%s\"\n", get_string()); + int n_pairs = get_u32(); + for (int j = 0; j < n_pairs; j++) + { + int x = get_u32(); + //assert (x == j); + int y = get_u32(); + printf (" %d: \"%s\"\n", x, strings[y]); + } + printf ("\n"); + } + pos = end; } int @@ -284,6 +329,7 @@ main(int argc, char **argv) pos = 0; match_byte_assert(0); + int version = data[pos]; if (!match_byte(0xaf)) match_byte_assert(0xb0); int n_sources = data[pos++]; @@ -291,19 +337,38 @@ main(int argc, char **argv) match_u32_assert(s.st_size); printf ("%d sources\n", n_sources); + + struct source + { + int offset, count, n_series; + char *name; + } + sources[n_sources]; for (int i = 0; i < n_sources; i++) { - pos = 8 + 80 * i; int count = get_u32(); int n_series = get_u32(); int offset = get_u32(); - char *name = get_fixed_string(64); - int dunno = get_u32(); + char *name = get_fixed_string(version == 0xb0 ? 64 : 28); + int dunno = version == 0xb0 ? get_u32() : 0; printf ("source %d: %d series, %d observations per series, offset %08x, \"%s\", %x\n", i, n_series, count, offset, name, dunno); - pos = offset; - dump_source(count, n_series); + sources[i].offset = offset; + sources[i].count = count; + sources[i].n_series = n_series; + sources[i].name = name; + } + + for (int i = 0; i < n_sources; i++) + { + if (pos != sources[i].offset) + { + fprintf (stderr, "pos=0x%x expected=0x%x reading source %d\n", pos, sources[i].offset, i); + exit(1); + } + dump_source(i + 1 >= n_sources ? n : sources[i + 1].offset, sources[i].count, sources[i].n_series, sources[i].name); } + assert(pos == n); return 0; }