X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=src%2Fmath%2Fsort.c;h=3491a20bfd684abae50fe88f2f232d0bbe04a3e4;hb=81579d9e9f994fb2908f50af41c3eb033d216e58;hp=9e860c4657a83029fc923e835f30579b39d2ea1c;hpb=2165f59ab9eee5272b4037e45477811627cae078;p=pspp-builds.git diff --git a/src/math/sort.c b/src/math/sort.c index 9e860c46..3491a20b 100644 --- a/src/math/sort.c +++ b/src/math/sort.c @@ -1,5 +1,5 @@ /* PSPP - a program for statistical analysis. - Copyright (C) 1997-9, 2000, 2006 Free Software Foundation, Inc. + Copyright (C) 1997-9, 2000, 2006, 2009, 2011 Free Software Foundation, Inc. This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by @@ -16,21 +16,21 @@ #include -#include "sort.h" +#include "math/sort.h" #include -#include -#include -#include -#include -#include -#include -#include -#include -#include +#include "data/case.h" +#include "data/casereader.h" +#include "data/casewriter-provider.h" +#include "data/casewriter.h" +#include "data/settings.h" +#include "data/subcase.h" +#include "libpspp/array.h" +#include "libpspp/assertion.h" +#include "math/merge.h" -#include "xalloc.h" +#include "gl/xalloc.h" #include "gettext.h" #define _(msgid) gettext (msgid) @@ -41,42 +41,44 @@ int max_buffers = INT_MAX; struct sort_writer { - size_t value_cnt; + struct caseproto *proto; struct subcase ordering; struct merge *merge; struct pqueue *pqueue; struct casewriter *run; casenumber run_id; - struct ccase run_end; + struct ccase *run_end; }; static struct casewriter_class sort_casewriter_class; -static struct pqueue *pqueue_create (const struct subcase *, size_t); +static struct pqueue *pqueue_create (const struct subcase *, + const struct caseproto *); static void pqueue_destroy (struct pqueue *); static bool pqueue_is_full (const struct pqueue *); static bool pqueue_is_empty (const struct pqueue *); static void pqueue_push (struct pqueue *, struct ccase *, casenumber); -static void pqueue_pop (struct pqueue *, struct ccase *, casenumber *); +static struct ccase *pqueue_pop (struct pqueue *, casenumber *); static void output_record (struct sort_writer *); struct casewriter * -sort_create_writer (const struct subcase *ordering, size_t value_cnt) +sort_create_writer (const struct subcase *ordering, + const struct caseproto *proto) { struct sort_writer *sort; sort = xmalloc (sizeof *sort); - sort->value_cnt = value_cnt; + sort->proto = caseproto_ref (proto); subcase_clone (&sort->ordering, ordering); - sort->merge = merge_create (ordering, value_cnt); - sort->pqueue = pqueue_create (ordering, value_cnt); + sort->merge = merge_create (ordering, proto); + sort->pqueue = pqueue_create (ordering, proto); sort->run = NULL; sort->run_id = 0; - case_nullify (&sort->run_end); + sort->run_end = NULL; - return casewriter_create (value_cnt, &sort_casewriter_class, sort); + return casewriter_create (proto, &sort_casewriter_class, sort); } static void @@ -89,9 +91,9 @@ sort_casewriter_write (struct casewriter *writer UNUSED, void *sort_, if (pqueue_is_full (sort->pqueue)) output_record (sort); - next_run = (case_is_null (&sort->run_end) + next_run = (sort->run_end == NULL || subcase_compare_3way (&sort->ordering, c, - &sort->ordering, &sort->run_end) < 0); + &sort->ordering, sort->run_end) < 0); pqueue_push (sort->pqueue, c, sort->run_id + (next_run ? 1 : 0)); } @@ -104,7 +106,8 @@ sort_casewriter_destroy (struct casewriter *writer UNUSED, void *sort_) merge_destroy (sort->merge); pqueue_destroy (sort->pqueue); casewriter_destroy (sort->run); - case_destroy (&sort->run_end); + case_unref (sort->run_end); + caseproto_unref (sort->proto); free (sort); } @@ -117,7 +120,7 @@ sort_casewriter_convert_to_reader (struct casewriter *writer, void *sort_) if (sort->run == NULL && sort->run_id == 0) { /* In-core sort. */ - sort->run = mem_writer_create (casewriter_get_value_cnt (writer)); + sort->run = mem_writer_create (sort->proto); sort->run_id = 1; } while (!pqueue_is_empty (sort->pqueue)) @@ -134,12 +137,12 @@ sort_casewriter_convert_to_reader (struct casewriter *writer, void *sort_) static void output_record (struct sort_writer *sort) { - struct ccase min_case; + struct ccase *min_case; casenumber min_run_id; - pqueue_pop (sort->pqueue, &min_case, &min_run_id); + min_case = pqueue_pop (sort->pqueue, &min_run_id); #if 0 - printf ("\toutput: %f to run %d\n", case_num_idx (&min_case, 0), min_run_id); + printf ("\toutput: %f to run %d\n", case_num_idx (min_case, 0), min_run_id); #endif if (sort->run_id != min_run_id && sort->run != NULL) @@ -149,14 +152,13 @@ output_record (struct sort_writer *sort) } if (sort->run == NULL) { - sort->run = tmpfile_writer_create (sort->value_cnt); + sort->run = tmpfile_writer_create (sort->proto); sort->run_id = min_run_id; } - case_destroy (&sort->run_end); - case_clone (&sort->run_end, &min_case); - - casewriter_write (sort->run, &min_case); + case_unref (sort->run_end); + sort->run_end = case_ref (min_case); + casewriter_write (sort->run, min_case); } static struct casewriter_class sort_casewriter_class = @@ -167,19 +169,21 @@ static struct casewriter_class sort_casewriter_class = }; /* Reads all the cases from INPUT. Sorts the cases according to - ORDERING. Returns the sorted cases in a new casereader. */ + ORDERING. Returns the sorted cases in a new casereader. + INPUT is destroyed by this function. + */ struct casereader * sort_execute (struct casereader *input, const struct subcase *ordering) { struct casewriter *output = - sort_create_writer (ordering, casereader_get_value_cnt (input)); + sort_create_writer (ordering, casereader_get_proto (input)); casereader_transfer (input, output); return casewriter_make_reader (output); } /* Reads all the cases from INPUT. Sorts the cases in ascending order according to VARIABLE. Returns the sorted cases in a - new casereader. */ + new casereader. INPUT is destroyed by this function. */ struct casereader * sort_execute_1var (struct casereader *input, const struct variable *var) { @@ -204,7 +208,7 @@ struct pqueue struct pqueue_record { casenumber id; - struct ccase c; + struct ccase *c; casenumber idx; }; @@ -212,14 +216,13 @@ static int compare_pqueue_records_minheap (const void *a, const void *b, const void *pq_); static struct pqueue * -pqueue_create (const struct subcase *ordering, size_t value_cnt) +pqueue_create (const struct subcase *ordering, const struct caseproto *proto) { struct pqueue *pq; pq = xmalloc (sizeof *pq); subcase_clone (&pq->ordering, ordering); - pq->record_cap - = settings_get_workspace_cases (value_cnt); + pq->record_cap = settings_get_workspace_cases (proto); if (pq->record_cap > max_buffers) pq->record_cap = max_buffers; else if (pq->record_cap < min_buffers) @@ -238,10 +241,9 @@ pqueue_destroy (struct pqueue *pq) { while (!pqueue_is_empty (pq)) { - struct ccase c; casenumber id; - pqueue_pop (pq, &c, &id); - case_destroy (&c); + struct ccase *c = pqueue_pop (pq, &id); + case_unref (c); } subcase_destroy (&pq->ordering); free (pq->records); @@ -270,15 +272,15 @@ pqueue_push (struct pqueue *pq, struct ccase *c, casenumber id) r = &pq->records[pq->record_cnt++]; r->id = id; - case_move (&r->c, c); + r->c = c; r->idx = pq->idx++; push_heap (pq->records, pq->record_cnt, sizeof *pq->records, compare_pqueue_records_minheap, pq); } -static void -pqueue_pop (struct pqueue *pq, struct ccase *c, casenumber *id) +static struct ccase * +pqueue_pop (struct pqueue *pq, casenumber *id) { struct pqueue_record *r; @@ -289,7 +291,7 @@ pqueue_pop (struct pqueue *pq, struct ccase *c, casenumber *id) r = &pq->records[pq->record_cnt]; *id = r->id; - case_move (c, &r->c); + return r->c; } /* Compares record-run tuples A and B on id, then on case data, @@ -303,8 +305,7 @@ compare_pqueue_records_minheap (const void *a_, const void *b_, const struct pqueue *pq = pq_; int result = a->id < b->id ? -1 : a->id > b->id; if (result == 0) - result = subcase_compare_3way (&pq->ordering, &a->c, - &pq->ordering, &b->c); + result = subcase_compare_3way (&pq->ordering, a->c, &pq->ordering, b->c); if (result == 0) result = a->idx < b->idx ? -1 : a->idx > b->idx; return -result;