1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
|
/* -*- mode: c++; c-basic-offset: 2; indent-tabs-mode: nil; -*-
* vim:expandtab:shiftwidth=2:tabstop=2:smarttab:
*
* Copyright (C) 2008 Sun Microsystems, Inc.
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; version 2 of the License.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
*/
#ifndef DRIZZLED_UNIQUE_H
#define DRIZZLED_UNIQUE_H
#include <drizzled/tree.h>
/*
  Unique -- a class for eliminating duplicate values.

  All values are inserted into a TREE. If the tree becomes too big, it is
  dumped to a file. The user can request the values in sorted order, or
  just iterate through them. In the latter case, tree merging is performed
  in memory simultaneously with iteration, so it should be ~2-3x faster.
*/
namespace drizzled
{
namespace internal
{
  /* Forward declaration only: the full definition of st_io_cache is not
     needed by this header. */
  struct st_io_cache;

  /* Short alias for the forward-declared struct. */
  typedef st_io_cache IO_CACHE;
}
/**
 * Collects values in a TREE so that duplicates can be removed.
 *
 * Values are added one at a time with unique_add(); the collected set can
 * then be obtained through get() or visited through walk().
 *
 * NOTE(review): the class declares a destructor but no copy constructor or
 * copy assignment operator, so the compiler-generated copies are available.
 * Confirm that instances are never copied.
 */
class Unique : public memory::SqlAlloc
{
  /* Memory budget passed to the constructor; presumably the limit on the
     in-memory tree size -- confirm in the implementation. */
  size_t max_in_memory_size;
  /* Tree that unique_add() inserts values into. */
  TREE tree;
  /* NOTE(review): usage is not visible in this header; presumably a buffer
     of record pointers filled by unique_write_to_ptrs() -- confirm. */
  unsigned char *record_pointers;
  /* NOTE(review): presumably the size in bytes of one stored element
     (see the constructor's size_arg) -- confirm. */
  uint32_t size;

public:
  /* NOTE(review): element counter maintained by the implementation; its
     exact meaning is not visible in this header. */
  ulong elements;

  /**
   * @param comp_func                comparison function for stored values
   * @param comp_func_fixed_arg      extra argument for the comparison function
   * @param size_arg                 presumably the size of one element -- confirm
   * @param max_in_memory_size_arg   memory budget for this object
   */
  Unique(qsort_cmp2 comp_func, void *comp_func_fixed_arg,
         uint32_t size_arg, size_t max_in_memory_size_arg);
  ~Unique();

  /** Returns the element count reported by the underlying tree. */
  ulong elements_in_tree() const { return tree.elements_in_tree; }

  /**
   * Inserts the value pointed to by ptr into the tree.
   *
   * @return true when tree_insert() yields a null/zero result, false
   *         otherwise. NOTE(review): a true result presumably signals
   *         that the insert failed -- confirm against tree_insert().
   */
  inline bool unique_add(void *ptr)
  {
    return (not tree_insert(&tree, ptr, 0, tree.custom_arg));
  }

  bool get(Table *table);

  static double get_use_cost(uint32_t *buffer, uint32_t nkeys, uint32_t key_size,
                             size_t max_in_memory_size);

  /**
   * Computes a buffer size in bytes: one uint32_t for each
   * (nkeys / max_elems_in_tree) chunk, plus one more.
   *
   * @param nkeys          number of keys
   * @param key_size       size of a single key in bytes
   * @param sortbuff_size  size of the sort buffer in bytes
   * @return sizeof(uint32_t) * (1 + nkeys / max_elems_in_tree), as an int
   */
  inline static int get_cost_calc_buff_size(ulong nkeys, uint32_t key_size,
                                            size_t sortbuff_size)
  {
    /* The "1 +" keeps the divisor below from ever being zero.
       The 'register' specifier was dropped: it was removed in C++17. */
    const size_t max_elems_in_tree=
      (1 + sortbuff_size / ALIGN_SIZE(sizeof(TREE_ELEMENT)+key_size));
    return static_cast<int>(sizeof(uint32_t)*(1 + nkeys/max_elems_in_tree));
  }

  void reset();
  bool walk(tree_walk_action action, void *walk_action_arg);

  /* Free functions that need access to the private members above. */
  friend int unique_write_to_file(unsigned char* key, uint32_t count, Unique *unique);
  friend int unique_write_to_ptrs(unsigned char* key, uint32_t count, Unique *unique);
};
} /* namespace drizzled */
#endif /* DRIZZLED_UNIQUE_H */
|