ha_tokudb.h 9.27 KB
Newer Older
1
#ifdef USE_PRAGMA_INTERFACE
2
#pragma interface               /* gcc class implementation */
3 4 5 6 7
#endif

#include <db.h>

typedef struct st_tokudb_share {
8 9 10 11 12 13
    char *table_name;
    uint table_name_length, use_count;
    pthread_mutex_t mutex;
    THR_LOCK lock;

    ulonglong auto_ident;
14
    ulonglong last_auto_increment;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
15 16 17 18 19 20 21
    DB *status_block;
    //
    // DB that is indexed on the primary key
    //
    DB *file;
    //
    // array of all DB's that make up table, includes DB that
Zardosht Kasheff's avatar
Zardosht Kasheff committed
22 23
    // is indexed on the primary key, add 1 in case primary
    // key is hidden
Zardosht Kasheff's avatar
Zardosht Kasheff committed
24
    //
Zardosht Kasheff's avatar
Zardosht Kasheff committed
25 26
    DB *key_file[MAX_KEY +1];
    u_int32_t key_type[MAX_KEY +1];
27 28 29
    uint status, version;
    uint ref_length;
    bool fixed_length_primary_key, fixed_length_row;
30 31 32

} TOKUDB_SHARE;

Zardosht Kasheff's avatar
Zardosht Kasheff committed
33 34 35 36 37
typedef struct st_prim_key_part_info {
    uint offset;
    uint part_index;
} PRIM_KEY_PART_INFO;

Zardosht Kasheff's avatar
Zardosht Kasheff committed
38 39 40 41 42
typedef enum {
    lock_read = 0,
    lock_write
} TABLE_LOCK_TYPE;

43
class ha_tokudb : public handler {
44
private:
45 46 47
    THR_LOCK_DATA lock;         ///< MySQL lock
    TOKUDB_SHARE *share;        ///< Shared lock info

Zardosht Kasheff's avatar
Zardosht Kasheff committed
48 49 50 51 52 53 54 55 56
    //
    // last key returned by ha_tokudb's cursor
    //
    DBT last_key;
    //
    // current row pointed to by ha_tokudb's cursor
    // TODO: make sure current_row gets set properly
    //
    DBT current_row;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
57 58 59
    //
    // pointer used for multi_alloc of key_buff, key_buff2, primary_key_buff
    //
60
    void *alloc_ptr;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
61 62 63 64 65
    //
    // buffer used to temporarily store a "packed row" 
    // data pointer of a DBT will end up pointing to this
    // see pack_row for usage
    //
66
    uchar *rec_buff;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90
    //
    // number of bytes allocated in rec_buff
    //
    ulong alloced_rec_buff_length;
    //
    // buffer used to temporarily store a "packed key" 
    // data pointer of a DBT will end up pointing to this
    //
    uchar *key_buff; 
    //
    // buffer used to temporarily store a "packed key" 
    // data pointer of a DBT will end up pointing to this
    // This is used in functions that require the packing
    // of more than one key
    //
    uchar *key_buff2; 
    //
    // buffer used to temporarily store a "packed key" 
    // data pointer of a DBT will end up pointing to this
    // currently this is only used for a primary key in
    // the function update_row, hence the name. It 
    // does not carry any state throughout the class.
    //
    uchar *primary_key_buff;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
91 92 93 94

    //
    // transaction used by ha_tokudb's cursor
    //
95
    DB_TXN *transaction;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
96

Zardosht Kasheff's avatar
Zardosht Kasheff committed
97 98 99
    //
    // instance of cursor being used for init_xxx and rnd_xxx functions
    //
100
    DBC *cursor;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
101 102 103
    //
    // flags that are returned in table_flags()
    //
104
    ulong int_table_flags;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
105 106 107 108 109 110 111 112 113 114 115
    //
    // index into key_file that holds DB* that is indexed on
    // the primary_key. this->key_file[primary_index] == this->file
    //
    uint primary_key;
    uint last_dup_key;
    //
    // if set to 0, then the primary key is not hidden
    // if non-zero (not necessarily 1), primary key is hidden
    //
    uint hidden_primary_key;
116
    bool key_read, using_ignore;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
117

Zardosht Kasheff's avatar
Zardosht Kasheff committed
118 119 120 121 122 123 124
    //
    // After a cursor encounters an error, the cursor will be unusable
    // In case MySQL attempts to do a cursor operation (such as rnd_next
    // or index_prev), we will gracefully return this error instead of crashing
    //
    int last_cursor_error;

Zardosht Kasheff's avatar
Zardosht Kasheff committed
125 126 127 128 129
    //
    // For instances where we successfully prelock a range or a table,
    // we set this to TRUE so that successive cursor calls can know
    // know to limit the locking overhead in a call to the fractal tree
    //
Zardosht Kasheff's avatar
Zardosht Kasheff committed
130
    bool range_lock_grabbed;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
131

Zardosht Kasheff's avatar
Zardosht Kasheff committed
132
    PRIM_KEY_PART_INFO* primary_key_offsets;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
133

134 135 136 137 138
    bool fix_rec_buff_for_blob(ulong length);
#define TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH 5 // QQQ why 5?
    uchar current_ident[TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH];

    ulong max_row_length(const uchar * buf);
Zardosht Kasheff's avatar
Zardosht Kasheff committed
139
    int pack_row(DBT * row, const uchar * record);
Zardosht Kasheff's avatar
Zardosht Kasheff committed
140
    void unpack_row(uchar * record, DBT * row, DBT* key);
141
    void unpack_key(uchar * record, DBT * key, uint index);
Zardosht Kasheff's avatar
Zardosht Kasheff committed
142 143
    DBT* create_dbt_key_from_key(DBT * key, KEY* key_info, uchar * buff, const uchar * record, int key_length = MAX_KEY_LENGTH);
    DBT *create_dbt_key_from_table(DBT * key, uint keynr, uchar * buff, const uchar * record, int key_length = MAX_KEY_LENGTH);
144 145
    DBT *pack_key(DBT * key, uint keynr, uchar * buff, const uchar * key_ptr, uint key_length);
    int remove_key(DB_TXN * trans, uint keynr, const uchar * record, DBT * prim_key);
Zardosht Kasheff's avatar
Zardosht Kasheff committed
146
    int remove_keys(DB_TXN * trans, const uchar * record, DBT * prim_key, key_map * keys);
147 148 149 150 151
    int restore_keys(DB_TXN * trans, key_map * changed_keys, uint primary_key, const uchar * old_row, DBT * old_key, const uchar * new_row, DBT * new_key);
    int key_cmp(uint keynr, const uchar * old_row, const uchar * new_row);
    int update_primary_key(DB_TXN * trans, bool primary_key_changed, const uchar * old_row, DBT * old_key, const uchar * new_row, DBT * prim_key, bool local_using_ignore);
    int read_row(int error, uchar * buf, uint keynr, DBT * row, DBT * key, bool);
    DBT *get_pos(DBT * to, uchar * pos);
Zardosht Kasheff's avatar
Zardosht Kasheff committed
152 153
 
    int open_secondary_table(DB** ptr, KEY* key_info, const char* name, int mode, u_int32_t* key_type);
Zardosht Kasheff's avatar
Zardosht Kasheff committed
154
    int acquire_table_lock (DB_TXN* trans, TABLE_LOCK_TYPE lt);
Zardosht Kasheff's avatar
Zardosht Kasheff committed
155
    int estimate_num_rows(DB* db, u_int64_t* num_rows);
Zardosht Kasheff's avatar
Zardosht Kasheff committed
156
 
157 158 159 160 161
public:
    ha_tokudb(handlerton * hton, TABLE_SHARE * table_arg);
    ~ha_tokudb() {
    } 
    const char *table_type() const {
162
        return "TOKUDB";
163 164
    } 
    const char *index_type(uint inx) {
165 166 167
        return "BTREE";
    }
    const char **bas_ext() const;
Zardosht Kasheff's avatar
Zardosht Kasheff committed
168 169 170 171 172

    //
    // Returns a bit mask of capabilities of storage engine. Capabilities 
    // defined in sql/handler.h
    //
173 174
    ulonglong table_flags(void) const {
        return int_table_flags;
175 176
    } 
    ulong index_flags(uint inx, uint part, bool all_parts) const;
177

Zardosht Kasheff's avatar
Zardosht Kasheff committed
178 179 180
    //
    // Returns limit on the number of keys imposed by tokudb.
    //
181
    uint max_supported_keys() const {
Zardosht Kasheff's avatar
Zardosht Kasheff committed
182
        return MAX_KEY;
183
    } 
Zardosht Kasheff's avatar
Zardosht Kasheff committed
184

185
    uint extra_rec_buf_length() const {
186
        return TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH;
187 188
    } 
    ha_rows estimate_rows_upper_bound();
Zardosht Kasheff's avatar
Zardosht Kasheff committed
189 190 191 192

    //
    // Returns the limit on the key length imposed by tokudb.
    //
193 194
    uint max_supported_key_length() const {
        return UINT_MAX32;
195
    } 
Zardosht Kasheff's avatar
Zardosht Kasheff committed
196 197 198 199

    //
    // Returns limit on key part length imposed by tokudb.
    //
200
    uint max_supported_key_part_length() const {
201
        return UINT_MAX32;
202 203
    } 
    const key_map *keys_to_use_for_scanning() {
204 205 206 207
        return &key_map_full;
    }

    double scan_time();
Zardosht Kasheff's avatar
Zardosht Kasheff committed
208
    double read_time(uint index, uint ranges, ha_rows rows);
209 210 211 212 213 214

    int open(const char *name, int mode, uint test_if_locked);
    int close(void);
    int create(const char *name, TABLE * form, HA_CREATE_INFO * create_info);
    int delete_table(const char *name);
    int rename_table(const char *from, const char *to);
215
#if 0
216 217 218
    int analyze(THD * thd, HA_CHECK_OPT * check_opt);
    int optimize(THD * thd, HA_CHECK_OPT * check_opt);
    int check(THD * thd, HA_CHECK_OPT * check_opt);
219
#endif
220 221 222 223
    int write_row(uchar * buf);
    int update_row(const uchar * old_data, uchar * new_data);
    int delete_row(const uchar * buf);

Zardosht Kasheff's avatar
Zardosht Kasheff committed
224
    int prepare_index_scan();
225 226 227 228
    int index_init(uint index, bool sorted);
    int index_end();
    int index_read(uchar * buf, const uchar * key, uint key_len, enum ha_rkey_function find_flag);
    int index_read_idx(uchar * buf, uint index, const uchar * key, uint key_len, enum ha_rkey_function find_flag);
229
#if 0
230
    int index_read_last(uchar * buf, const uchar * key, uint key_len);
231
#endif
232 233 234 235 236 237 238 239 240 241 242
    int index_next(uchar * buf);
    int index_next_same(uchar * buf, const uchar * key, uint keylen);
    int index_prev(uchar * buf);
    int index_first(uchar * buf);
    int index_last(uchar * buf);

    int rnd_init(bool scan);
    int rnd_end();
    int rnd_next(uchar * buf);
    int rnd_pos(uchar * buf, uchar * pos);

Zardosht Kasheff's avatar
Zardosht Kasheff committed
243 244 245 246 247 248
    int read_range_first(const key_range *start_key,
                                 const key_range *end_key,
                                 bool eq_range, bool sorted);
    int read_range_next();


249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277
    void position(const uchar * record);
    int info(uint);
    int extra(enum ha_extra_function operation);
    int reset(void);
    int external_lock(THD * thd, int lock_type);
    int start_stmt(THD * thd, thr_lock_type lock_type);

    ha_rows records_in_range(uint inx, key_range * min_key, key_range * max_key);

    THR_LOCK_DATA **store_lock(THD * thd, THR_LOCK_DATA ** to, enum thr_lock_type lock_type);

    void get_status();
    inline void get_auto_primary_key(uchar * to) {
        pthread_mutex_lock(&share->mutex);
        share->auto_ident++;
        int5store(to, share->auto_ident);
        pthread_mutex_unlock(&share->mutex);
    }
    virtual void get_auto_increment(ulonglong offset, ulonglong increment, ulonglong nb_desired_values, ulonglong * first_value, ulonglong * nb_reserved_values);
    void print_error(int error, myf errflag);
    uint8 table_cache_type() {
        return HA_CACHE_TBL_TRANSACT;
    }
    bool primary_key_is_clustered() {
        return true;
    }
    int cmp_ref(const uchar * ref1, const uchar * ref2);
    bool check_if_incompatible_data(HA_CREATE_INFO * info, uint table_changes);

Zardosht Kasheff's avatar
Zardosht Kasheff committed
278 279 280 281
    int add_index(TABLE *table_arg, KEY *key_info, uint num_of_keys);
    int prepare_drop_index(TABLE *table_arg, uint *key_num, uint num_of_keys);
    int final_drop_index(TABLE *table_arg);

282
private:
283
    int __close(int mutex_is_locked);
284
    int read_last();
285
    ulong field_offset(Field *);
286
};