X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=src%2Fdata%2Fdictionary.c;h=024f97b3d5dd45b5d94d5778582456af30aa19c5;hb=a0454ef2df24d238bdfd68553462c82daf6776ae;hp=7d67defbfecfc61fa3f3637ecfbb94c127c4b75a;hpb=7731fa51f095e615975cd53d35ba3cb681b82df1;p=pspp diff --git a/src/data/dictionary.c b/src/data/dictionary.c index 7d67defbfe..024f97b3d5 100644 --- a/src/data/dictionary.c +++ b/src/data/dictionary.c @@ -1,5 +1,5 @@ /* PSPP - a program for statistical analysis. - Copyright (C) 1997-9, 2000, 2006, 2007, 2009, 2010, 2011 Free Software Foundation, Inc. + Copyright (C) 1997-9, 2000, 2006, 2007, 2009, 2010, 2011, 2012 Free Software Foundation, Inc. This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by @@ -87,16 +87,8 @@ struct dictionary static void dict_unset_split_var (struct dictionary *, struct variable *); static void dict_unset_mrset_var (struct dictionary *, struct variable *); -void -dict_set_encoding (struct dictionary *d, const char *enc) -{ - if (enc) - { - free (d->encoding); - d->encoding = xstrdup (enc); - } -} - +/* Returns the encoding for data in dictionary D. The return value is a + nonnull string that contains an IANA character set name. */ const char * dict_get_encoding (const struct dictionary *d) { @@ -171,14 +163,16 @@ dict_copy_callbacks (struct dictionary *dest, dest->cb_data = src->cb_data; } -/* Creates and returns a new dictionary. */ +/* Creates and returns a new dictionary with the specified ENCODING. */ struct dictionary * -dict_create (void) +dict_create (const char *encoding) { struct dictionary *d = xzalloc (sizeof *d); + d->encoding = xstrdup (encoding); hmap_init (&d->name_map); attrset_init (&d->attributes); + return d; } @@ -189,19 +183,16 @@ dict_create (void) dictionary. If the new dictionary won't be used to access cases produced with the old dictionary, then the new dictionary's case indexes should be compacted with - dict_compact_values to save space. */ + dict_compact_values to save space. + + Callbacks are not cloned. */ struct dictionary * dict_clone (const struct dictionary *s) { struct dictionary *d; size_t i; - d = dict_create (); - - /* Set the new dictionary's encoding early so that string length limitations - are interpreted correctly. */ - if ( s->encoding) - d->encoding = xstrdup (s->encoding); + d = dict_create (s->encoding); for (i = 0; i < s->var_cnt; i++) { @@ -288,17 +279,6 @@ dict_clear (struct dictionary *d) attrset_clear (&d->attributes); } -/* Destroys the aux data for every variable in D, by calling - var_clear_aux() for each variable. */ -void -dict_clear_aux (struct dictionary *d) -{ - int i; - - for (i = 0; i < d->var_cnt; i++) - var_clear_aux (d->var[i].var); -} - /* Clears a dictionary and destroys it. */ void dict_destroy (struct dictionary *d) @@ -310,6 +290,7 @@ dict_destroy (struct dictionary *d) d->callbacks = NULL ; dict_clear (d); + string_array_destroy (&d->documents); hmap_destroy (&d->name_map); attrset_destroy (&d->attributes); dict_clear_mrsets (d); @@ -405,7 +386,7 @@ add_var (struct dictionary *d, struct variable *v) vardict->dict = d; vardict->var = v; hmap_insert (&d->name_map, &vardict->name_node, - hash_case_string (var_get_name (v), 0)); + utf8_hash_case_string (var_get_name (v), 0)); vardict->case_index = d->next_value_idx; var_set_vardict (v, vardict); @@ -495,10 +476,10 @@ dict_lookup_var (const struct dictionary *d, const char *name) struct vardict_info *vardict; HMAP_FOR_EACH_WITH_HASH (vardict, struct vardict_info, name_node, - hash_case_string (name, 0), &d->name_map) + utf8_hash_case_string (name, 0), &d->name_map) { struct variable *var = vardict->var; - if (!strcasecmp (var_get_name (var), name)) + if (!utf8_strcasecmp (var_get_name (var), name)) return var; } @@ -605,13 +586,9 @@ dict_delete_var (struct dictionary *d, struct variable *v) { int dict_index = var_get_dict_index (v); const int case_index = var_get_case_index (v); - const int width = var_get_width (v); assert (dict_contains_var (d, v)); - /* Delete aux data. */ - var_clear_aux (v); - dict_unset_split_var (d, v); dict_unset_mrset_var (d, v); @@ -633,13 +610,14 @@ dict_delete_var (struct dictionary *d, struct variable *v) /* Free memory. */ var_clear_vardict (v); - var_destroy (v); if ( d->changed ) d->changed (d, d->changed_data); invalidate_proto (d); if (d->callbacks && d->callbacks->var_deleted ) - d->callbacks->var_deleted (d, dict_index, case_index, width, d->cb_data); + d->callbacks->var_deleted (d, v, dict_index, case_index, d->cb_data); + + var_destroy (v); } /* Deletes the COUNT variables listed in VARS from D. This is @@ -750,7 +728,7 @@ rename_var (struct variable *v, const char *new_name) struct vardict_info *vardict = var_get_vardict (v); var_clear_vardict (v); var_set_name (v, new_name); - vardict->name_node.hash = hash_case_string (new_name, 0); + vardict->name_node.hash = utf8_hash_case_string (new_name, 0); var_set_vardict (v, vardict); } @@ -761,7 +739,7 @@ void dict_rename_var (struct dictionary *d, struct variable *v, const char *new_name) { - assert (!strcasecmp (var_get_name (v), new_name) + assert (!utf8_strcasecmp (var_get_name (v), new_name) || dict_lookup_var (d, new_name) == NULL); unindex_var (d, var_get_vardict (v)); @@ -1255,15 +1233,18 @@ dict_get_label (const struct dictionary *d) return d->label; } -/* Sets D's file label to LABEL, truncating it to a maximum of 60 - characters. +/* Sets D's file label to LABEL, truncating it to at most 60 bytes in D's + encoding. Removes D's label if LABEL is null or the empty string. */ void dict_set_label (struct dictionary *d, const char *label) { free (d->label); - d->label = label != NULL && label[0] != '\0' ? xstrndup (label, 60) : NULL; + if (label == NULL || label[0] == '\0') + d->label = NULL; + else + d->label = utf8_encoding_trunc (label, d->encoding, 60); } /* Returns the documents for D, as an UTF-8 encoded string_array. The @@ -1416,7 +1397,7 @@ dict_lookup_vector (const struct dictionary *d, const char *name) { size_t i; for (i = 0; i < d->vector_cnt; i++) - if (!strcasecmp (vector_get_name (d->vector[i]), name)) + if (!utf8_strcasecmp (vector_get_name (d->vector[i]), name)) return d->vector[i]; return NULL; } @@ -1461,7 +1442,7 @@ dict_lookup_mrset_idx (const struct dictionary *dict, const char *name) size_t i; for (i = 0; i < dict->n_mrsets; i++) - if (!strcasecmp (name, dict->mrsets[i]->name)) + if (!utf8_strcasecmp (name, dict->mrsets[i]->name)) return i; return SIZE_MAX; @@ -1660,7 +1641,7 @@ struct variable * dict_create_internal_var (int case_idx, int width) { if (internal_dict == NULL) - internal_dict = dict_create (); + internal_dict = dict_create ("UTF-8"); for (;;) {