X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=src%2Foutput%2Fspv%2Fspv-light-decoder.c;h=f1f3dba9607dc68599ceb4a3a755bd471a5754d0;hb=47af71b93ed4673d23594ed2b84743f15638f7b7;hp=cbf2aacdab096241d3dea195126eb48d8b5c34ee;hpb=f4cc5814b23b58ba474289e898bc96044c7a50b9;p=pspp diff --git a/src/output/spv/spv-light-decoder.c b/src/output/spv/spv-light-decoder.c index cbf2aacdab..f1f3dba960 100644 --- a/src/output/spv/spv-light-decoder.c +++ b/src/output/spv/spv-light-decoder.c @@ -22,6 +22,7 @@ #include #include #include +#include #include "libpspp/i18n.h" #include "libpspp/message.h" @@ -33,10 +34,21 @@ #include "gl/xalloc.h" #include "gl/xsize.h" +/* Returns a copy of S converted to UTF-8. S might be in UTF-8 already or it + might be in ENCODING (yes, this makes no sense). */ static char * -xstrdup_if_nonempty (const char *s) +to_utf8 (const char *s, const char *encoding) { - return s && s[0] ? xstrdup (s) : NULL; + size_t length = strlen (s); + return (u8_check (CHAR_CAST (const uint8_t *, s), length) + ? recode_string ("UTF-8", encoding, s, length) + : xstrdup (s)); +} + +static char * +to_utf8_if_nonempty (const char *s, const char *encoding) +{ + return s && s[0] ? to_utf8 (s, encoding) : NULL; } static void @@ -84,7 +96,7 @@ static char * WARN_UNUSED_RESULT decode_spvlb_color_string (const char *s, uint8_t def, struct cell_color *colorp) { - int r, g, b; + unsigned int r, g, b; if (!*s) r = g = b = def; else if (sscanf (s, "#%2x%2x%2x", &r, &g, &b) != 3) @@ -102,7 +114,7 @@ decode_spvlb_color_u32 (uint32_t x) static char * WARN_UNUSED_RESULT decode_spvlb_font_style (const struct spvlb_font_style *in, - struct font_style **outp) + const char *encoding, struct font_style **outp) { if (!in) { @@ -124,7 +136,7 @@ decode_spvlb_font_style (const struct spvlb_font_style *in, .underline = in->underline, .fg = { fg, fg }, .bg = { bg, bg }, - .typeface = xstrdup (in->typeface), + .typeface = to_utf8 (in->typeface, encoding), .size = in->size / 1.33, }; return NULL; @@ -220,17 +232,17 @@ decode_spvlb_cell_style (const struct spvlb_cell_style *in, static char *decode_spvlb_value ( const struct pivot_table *, const struct spvlb_value *, - struct pivot_value **) WARN_UNUSED_RESULT; + const char *encoding, struct pivot_value **) WARN_UNUSED_RESULT; static char * WARN_UNUSED_RESULT decode_spvlb_argument (const struct pivot_table *table, const struct spvlb_argument *in, - struct pivot_argument *out) + const char *encoding, struct pivot_argument *out) { if (in->value) { struct pivot_value *value; - char *error = decode_spvlb_value (table, in->value, &value); + char *error = decode_spvlb_value (table, in->value, encoding, &value); if (error) return error; @@ -244,7 +256,7 @@ decode_spvlb_argument (const struct pivot_table *table, out->values = xnmalloc (in->n_values, sizeof *out->values); for (size_t i = 0; i < in->n_values; i++) { - char *error = decode_spvlb_value (table, in->values[i], + char *error = decode_spvlb_value (table, in->values[i], encoding, &out->values[i]); if (error) { @@ -274,11 +286,12 @@ decode_spvlb_value_show (uint8_t in, enum settings_value_show *out) static char * WARN_UNUSED_RESULT decode_spvlb_value (const struct pivot_table *table, - const struct spvlb_value *in, struct pivot_value **outp) + const struct spvlb_value *in, + const char *encoding, struct pivot_value **outp) { *outp = NULL; - struct pivot_value *out = xzalloc (sizeof *out); + struct pivot_value *out = XZALLOC (struct pivot_value); const struct spvlb_value_mod *vm; char *error; @@ -289,6 +302,7 @@ decode_spvlb_value (const struct pivot_table *table, out->type = PIVOT_VALUE_NUMERIC; out->numeric.x = in->type_01.x; error = spv_decode_fmt_spec (in->type_01.format, &out->numeric.format); + out->numeric.honor_small = (in->type_01.format >> 16) == 40; if (error) return error; break; @@ -302,16 +316,18 @@ decode_spvlb_value (const struct pivot_table *table, error = decode_spvlb_value_show (in->type_02.show, &out->numeric.show); if (error) return NULL; - out->numeric.var_name = xstrdup_if_nonempty (in->type_02.var_name); - out->numeric.value_label = xstrdup_if_nonempty (in->type_02.value_label); + out->numeric.var_name = to_utf8_if_nonempty (in->type_02.var_name, + encoding); + out->numeric.value_label = to_utf8_if_nonempty (in->type_02.value_label, + encoding); break; case 3: vm = in->type_03.value_mod; out->type = PIVOT_VALUE_TEXT; - out->text.local = xstrdup (in->type_03.local); - out->text.c = xstrdup (in->type_03.c); - out->text.id = xstrdup (in->type_03.id); + out->text.local = to_utf8 (in->type_03.local, encoding); + out->text.c = to_utf8 (in->type_03.c, encoding); + out->text.id = to_utf8 (in->type_03.id, encoding); out->text.user_provided = !in->type_03.fixed; break; @@ -321,10 +337,11 @@ decode_spvlb_value (const struct pivot_table *table, error = decode_spvlb_value_show (in->type_04.show, &out->string.show); if (error) return NULL; - out->string.s = xstrdup (in->type_04.s); + out->string.s = to_utf8 (in->type_04.s, encoding); out->string.hex = (in->type_04.format >> 16) == fmt_to_io (FMT_AHEX); - out->string.var_name = xstrdup (in->type_04.var_name); - out->string.value_label = xstrdup_if_nonempty (in->type_04.value_label); + out->string.var_name = to_utf8 (in->type_04.var_name, encoding); + out->string.value_label = to_utf8_if_nonempty (in->type_04.value_label, + encoding); break; case 5: @@ -333,23 +350,24 @@ decode_spvlb_value (const struct pivot_table *table, error = decode_spvlb_value_show (in->type_05.show, &out->variable.show); if (error) return error; - out->variable.var_name = xstrdup (in->type_05.var_name); - out->variable.var_label = xstrdup_if_nonempty (in->type_05.var_label); + out->variable.var_name = to_utf8 (in->type_05.var_name, encoding); + out->variable.var_label = to_utf8_if_nonempty (in->type_05.var_label, + encoding); break; case 6: vm = in->type_06.value_mod; out->type = PIVOT_VALUE_TEXT; - out->text.local = xstrdup (in->type_06.local); - out->text.c = xstrdup (in->type_06.c); - out->text.id = xstrdup (in->type_06.id); + out->text.local = to_utf8 (in->type_06.local, encoding); + out->text.c = to_utf8 (in->type_06.c, encoding); + out->text.id = to_utf8 (in->type_06.id, encoding); out->text.user_provided = false; break; case -1: vm = in->type_else.value_mod; out->type = PIVOT_VALUE_TEMPLATE; - out->template.local = xstrdup (in->type_else.template); + out->template.local = to_utf8 (in->type_else.template, encoding); out->template.id = out->template.local; out->template.n_args = 0; out->template.args = xnmalloc (in->type_else.n_args, @@ -357,7 +375,7 @@ decode_spvlb_value (const struct pivot_table *table, for (size_t i = 0; i < in->type_else.n_args; i++) { error = decode_spvlb_argument (table, in->type_else.args[i], - &out->template.args[i]); + encoding, &out->template.args[i]); if (error) { pivot_value_destroy (out); @@ -375,17 +393,19 @@ decode_spvlb_value (const struct pivot_table *table, { if (vm->n_subscripts) { - out->n_subscripts = vm->n_subscripts; - out->subscripts = xnmalloc (vm->n_subscripts, - sizeof *out->subscripts); + struct pivot_value_ex *ex = pivot_value_ex_rw (out); + ex->n_subscripts = vm->n_subscripts; + ex->subscripts = xnmalloc (vm->n_subscripts, sizeof *ex->subscripts); for (size_t i = 0; i < vm->n_subscripts; i++) - out->subscripts[i] = xstrdup (vm->subscripts[i]); + ex->subscripts[i] = to_utf8 (vm->subscripts[i], encoding); } if (vm->n_refs) { - out->footnote_indexes = xnmalloc (vm->n_refs, - sizeof *out->footnote_indexes); + struct pivot_value_ex *ex = pivot_value_ex_rw (out); + ex->footnote_indexes = xnmalloc (vm->n_refs, + sizeof *ex->footnote_indexes); + for (size_t i = 0; i < vm->n_refs; i++) { uint16_t idx = vm->refs[i]; @@ -396,17 +416,19 @@ decode_spvlb_value (const struct pivot_table *table, idx, table->n_footnotes); } - out->footnote_indexes[out->n_footnotes++] = idx; + ex->footnote_indexes[ex->n_footnotes++] = idx; } + pivot_value_sort_footnotes (out); } if (vm->style_pair) { + struct pivot_value_ex *ex = pivot_value_ex_rw (out); error = decode_spvlb_font_style (vm->style_pair->font_style, - &out->font_style); + encoding, &ex->font_style); if (!error) error = decode_spvlb_cell_style (vm->style_pair->cell_style, - &out->cell_style); + &ex->cell_style); if (error) { pivot_value_destroy (out); @@ -418,7 +440,7 @@ decode_spvlb_value (const struct pivot_table *table, && vm->template_string->id && vm->template_string->id[0] && out->type == PIVOT_VALUE_TEMPLATE) - out->template.id = xstrdup (vm->template_string->id); + out->template.id = to_utf8 (vm->template_string->id, encoding); } *outp = out; @@ -426,7 +448,8 @@ decode_spvlb_value (const struct pivot_table *table, } static char * WARN_UNUSED_RESULT -decode_spvlb_area (const struct spvlb_area *in, struct table_area_style *out) +decode_spvlb_area (const struct spvlb_area *in, struct table_area_style *out, + const char *encoding) { char *error; @@ -466,7 +489,7 @@ decode_spvlb_area (const struct spvlb_area *in, struct table_area_style *out) .underline = in->underline, .fg = { fg0, in->alternate ? fg1 : fg0 }, .bg = { bg0, in->alternate ? bg1 : bg0 }, - .typeface = xstrdup (in->typeface), + .typeface = to_utf8 (in->typeface, encoding), .size = in->size / 1.33, }, .cell_style = { @@ -487,14 +510,16 @@ decode_spvlb_group (const struct pivot_table *, size_t n_categories, bool show_label, struct pivot_category *parent, - struct pivot_dimension *); + struct pivot_dimension *, + const char *encoding); static char * WARN_UNUSED_RESULT decode_spvlb_categories (const struct pivot_table *table, struct spvlb_category **categories, size_t n_categories, struct pivot_category *parent, - struct pivot_dimension *dimension) + struct pivot_dimension *dimension, + const char *encoding) { for (size_t i = 0; i < n_categories; i++) { @@ -503,7 +528,7 @@ decode_spvlb_categories (const struct pivot_table *table, { char *error = decode_spvlb_categories ( table, in->group->subcategories, in->group->n_subcategories, - parent, dimension); + parent, dimension, encoding); if (error) return error; @@ -511,11 +536,11 @@ decode_spvlb_categories (const struct pivot_table *table, } struct pivot_value *name; - char *error = decode_spvlb_value (table, in->name, &name); + char *error = decode_spvlb_value (table, in->name, encoding, &name); if (error) return error; - struct pivot_category *out = xzalloc (sizeof *out); + struct pivot_category *out = XZALLOC (struct pivot_category); out->name = name; out->parent = parent; out->dimension = dimension; @@ -523,7 +548,7 @@ decode_spvlb_categories (const struct pivot_table *table, { char *error = decode_spvlb_group (table, in->group->subcategories, in->group->n_subcategories, - true, out, dimension); + true, out, dimension, encoding); if (error) { pivot_category_destroy (out); @@ -553,7 +578,8 @@ decode_spvlb_group (const struct pivot_table *table, struct spvlb_category **categories, size_t n_categories, bool show_label, struct pivot_category *category, - struct pivot_dimension *dimension) + struct pivot_dimension *dimension, + const char *encoding) { category->subs = XCALLOC (n_categories, struct pivot_category *); category->n_subs = 0; @@ -561,7 +587,7 @@ decode_spvlb_group (const struct pivot_table *table, category->show_label = show_label; return decode_spvlb_categories (table, categories, n_categories, category, - dimension); + dimension, encoding); } static char * WARN_UNUSED_RESULT @@ -594,15 +620,16 @@ fill_leaves (struct pivot_category *category, static char * WARN_UNUSED_RESULT decode_spvlb_dimension (const struct pivot_table *table, const struct spvlb_dimension *in, - size_t idx, struct pivot_dimension **outp) + size_t idx, const char *encoding, + struct pivot_dimension **outp) { /* Convert most of the dimension. */ struct pivot_value *name; - char *error = decode_spvlb_value (table, in->name, &name); + char *error = decode_spvlb_value (table, in->name, encoding, &name); if (error) return error; - struct pivot_dimension *out = xzalloc (sizeof *out); + struct pivot_dimension *out = XZALLOC (struct pivot_dimension); out->level = UINT_MAX; out->top_index = idx; out->hide_all_labels = in->props->hide_all_labels; @@ -616,7 +643,7 @@ decode_spvlb_dimension (const struct pivot_table *table, }; error = decode_spvlb_group (table, in->categories, in->n_categories, !in->props->hide_dim_label, out->root, - out); + out, encoding); if (error) goto error; @@ -706,7 +733,7 @@ decode_data_index (uint64_t in, const struct pivot_table *table, size_t *out) { uint64_t remainder = in; - for (size_t i = table->n_dimensions - 1; i > 0; i--) + for (size_t i = table->n_dimensions - 1; i < table->n_dimensions; i--) { const struct pivot_dimension *d = table->dimensions[i]; if (d->n_leaves) @@ -717,16 +744,15 @@ decode_data_index (uint64_t in, const struct pivot_table *table, else out[i] = 0; } - if (remainder >= table->dimensions[0]->n_leaves) + if (remainder) return xasprintf ("out of range cell data index %"PRIu64, in); - out[0] = remainder; return NULL; } static char * WARN_UNUSED_RESULT decode_spvlb_cells (struct spvlb_cell **in, size_t n_in, - struct pivot_table *table) + struct pivot_table *table, const char *encoding) { if (!table->n_dimensions) return NULL; @@ -737,7 +763,7 @@ decode_spvlb_cells (struct spvlb_cell **in, size_t n_in, struct pivot_value *value; char *error = decode_data_index (in[i]->index, table, dindexes); if (!error) - error = decode_spvlb_value (table, in[i]->value, &value); + error = decode_spvlb_value (table, in[i]->value, encoding, &value); if (error) { free (dindexes); @@ -751,18 +777,18 @@ decode_spvlb_cells (struct spvlb_cell **in, size_t n_in, } static char * WARN_UNUSED_RESULT -decode_spvlb_footnote (const struct spvlb_footnote *in, +decode_spvlb_footnote (const struct spvlb_footnote *in, const char *encoding, size_t idx, struct pivot_table *table) { struct pivot_value *content; - char *error = decode_spvlb_value (table, in->text, &content); + char *error = decode_spvlb_value (table, in->text, encoding, &content); if (error) return error; struct pivot_value *marker = NULL; if (in->marker) { - error = decode_spvlb_value (table, in->marker, &marker); + error = decode_spvlb_value (table, in->marker, encoding, &marker); if (error) { pivot_value_destroy (content); @@ -785,19 +811,21 @@ decode_current_layer (uint64_t current_layer, struct pivot_table *table) table->current_layer = xnmalloc (axis->n_dimensions, sizeof *table->current_layer); + uint64_t remainder = current_layer; for (size_t i = 0; i < axis->n_dimensions; i++) { const struct pivot_dimension *d = axis->dimensions[i]; if (d->n_leaves) { - table->current_layer[i] = current_layer % d->n_leaves; - current_layer /= d->n_leaves; + table->current_layer[i] = remainder % d->n_leaves; + remainder /= d->n_leaves; } else table->current_layer[i] = 0; } - if (current_layer > 0) + if (remainder > 0) return xasprintf ("out of range layer data index %"PRIu64, current_layer); + return NULL; } @@ -810,12 +838,17 @@ decode_spvlb_table (const struct spvlb_table *in, struct pivot_table **outp) in->header->version); char *error = NULL; - struct pivot_table *out = xzalloc (sizeof *out); + struct pivot_table *out = XZALLOC (struct pivot_table); out->ref_cnt = 1; hmap_init (&out->cells); out->look = pivot_table_look_new_builtin_default (); out->settings = (struct fmt_settings) FMT_SETTINGS_INIT; + const struct spvlb_y1 *y1 = (in->formats->x0 ? in->formats->x0->y1 + : in->formats->x3 ? in->formats->x3->y1 + : NULL); + const char *encoding = spvlb_table_get_encoding (in); + /* Display settings. */ out->look->show_numeric_markers = !in->ts->show_alphabetic_markers; out->rotate_inner_column_labels = in->header->rotate_inner_column_labels; @@ -871,8 +904,8 @@ decode_spvlb_table (const struct spvlb_table *in, struct pivot_table **outp) &out->sizing[TABLE_HORZ].keeps, &out->sizing[TABLE_HORZ].n_keeps); - out->notes = xstrdup_if_nonempty (in->ts->notes); - out->look->name = xstrdup_if_nonempty (in->ts->table_look); + out->notes = to_utf8_if_nonempty (in->ts->notes, encoding); + out->look->name = to_utf8_if_nonempty (in->ts->table_look, encoding); /* Print settings. */ out->look->print_all_layers = in->ps->all_layers; @@ -881,7 +914,7 @@ decode_spvlb_table (const struct spvlb_table *in, struct pivot_table **outp) out->look->shrink_to_fit[TABLE_VERT] = in->ps->fit_length; out->look->top_continuation = in->ps->top_continuation; out->look->bottom_continuation = in->ps->bottom_continuation; - out->look->continuation = xstrdup (in->ps->continuation_string); + out->look->continuation = to_utf8 (in->ps->continuation_string, encoding); out->look->n_orphan_lines = in->ps->n_orphan_lines; /* Format settings. */ @@ -889,7 +922,7 @@ decode_spvlb_table (const struct spvlb_table *in, struct pivot_table **outp) if (epoch >= 1000 && epoch <= 9999) out->settings.epoch = epoch; char decimal = in->formats->y0->decimal; - if (decimal == '.' || decimal == '.') + if (decimal == '.' || decimal == ',') out->settings.decimal = decimal; else { @@ -908,16 +941,13 @@ decode_spvlb_table (const struct spvlb_table *in, struct pivot_table **outp) out->small = in->formats->x3 ? in->formats->x3->small : 0; /* Command information. */ - const struct spvlb_y1 *y1 = (in->formats->x0 ? in->formats->x0->y1 - : in->formats->x3 ? in->formats->x3->y1 - : NULL); if (y1) { - out->command_local = xstrdup (y1->command_local); - out->command_c = xstrdup (y1->command); - out->language = xstrdup (y1->language); + out->command_local = to_utf8 (y1->command_local, encoding); + out->command_c = to_utf8 (y1->command, encoding); + out->language = to_utf8 (y1->language, encoding); /* charset? */ - out->locale = xstrdup (y1->locale); + out->locale = to_utf8 (y1->locale, encoding); } /* Source information. */ @@ -925,8 +955,8 @@ decode_spvlb_table (const struct spvlb_table *in, struct pivot_table **outp) if (x3) { if (x3->dataset && x3->dataset[0] && x3->dataset[0] != 4) - out->dataset = xstrdup (x3->dataset); - out->datafile = xstrdup_if_nonempty (x3->datafile); + out->dataset = to_utf8 (x3->dataset, encoding); + out->datafile = to_utf8_if_nonempty (x3->datafile, encoding); out->date = x3->date; } @@ -948,32 +978,36 @@ decode_spvlb_table (const struct spvlb_table *in, struct pivot_table **outp) pivot_table_create_footnote__ (out, fn->n_footnotes - 1, NULL, NULL); for (size_t i = 0; i < fn->n_footnotes; i++) { - error = decode_spvlb_footnote (in->footnotes->footnotes[i], i, out); + error = decode_spvlb_footnote (in->footnotes->footnotes[i], + encoding, i, out); if (error) goto error; } } /* Title and caption. */ - error = decode_spvlb_value (out, in->titles->user_title, &out->title); + error = decode_spvlb_value (out, in->titles->user_title, encoding, + &out->title); if (error) goto error; - error = decode_spvlb_value (out, in->titles->subtype, &out->subtype); + error = decode_spvlb_value (out, in->titles->subtype, encoding, + &out->subtype); if (error) goto error; if (in->titles->corner_text) { error = decode_spvlb_value (out, in->titles->corner_text, - &out->corner_text); + encoding, &out->corner_text); if (error) goto error; } if (in->titles->caption) { - error = decode_spvlb_value (out, in->titles->caption, &out->caption); + error = decode_spvlb_value (out, in->titles->caption, encoding, + &out->caption); if (error) goto error; } @@ -982,7 +1016,8 @@ decode_spvlb_table (const struct spvlb_table *in, struct pivot_table **outp) /* Styles. */ for (size_t i = 0; i < PIVOT_N_AREAS; i++) { - error = decode_spvlb_area (in->areas->areas[i], &out->look->areas[i]); + error = decode_spvlb_area (in->areas->areas[i], &out->look->areas[i], + encoding); if (error) goto error; } @@ -999,7 +1034,7 @@ decode_spvlb_table (const struct spvlb_table *in, struct pivot_table **outp) for (size_t i = 0; i < out->n_dimensions; i++) { error = decode_spvlb_dimension (out, in->dimensions->dims[i], - i, &out->dimensions[i]); + i, encoding, &out->dimensions[i]); if (error) goto error; } @@ -1035,7 +1070,8 @@ decode_spvlb_table (const struct spvlb_table *in, struct pivot_table **outp) goto error; /* Data. */ - error = decode_spvlb_cells (in->cells->cells, in->cells->n_cells, out); + error = decode_spvlb_cells (in->cells->cells, in->cells->n_cells, out, + encoding); *outp = out; return NULL;