ha_innodb.cc 237 KB
Newer Older
osku's avatar
osku committed
1 2 3 4
/* Copyright (C) 2000-2005 MySQL AB & Innobase Oy

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
marko's avatar
marko committed
5
   the Free Software Foundation; version 2 of the License.
osku's avatar
osku committed
6 7 8

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
9
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.	 See the
osku's avatar
osku committed
10 11 12 13
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software
14
   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307	 USA */
osku's avatar
osku committed
15 16 17

/* This file defines the InnoDB handler: the interface between MySQL and InnoDB
NOTE: You can only use noninlined InnoDB functions in this file, because we
vasil's avatar
vasil committed
18
have disabled the InnoDB inlining in this file. */
osku's avatar
osku committed
19 20

/* TODO list for the InnoDB handler in 5.0:
21
  - Remove the flag trx->active_trans and look at trx->conc_state
osku's avatar
osku committed
22 23 24 25 26 27 28 29 30 31
  - fix savepoint functions to use savepoint storage area
  - Find out what kind of problems the OS X case-insensitivity causes to
    table and database names; should we 'normalize' the names like we do
    in Windows?
*/

#ifdef USE_PRAGMA_IMPLEMENTATION
#pragma implementation				// gcc: Class implementation
#endif

marko's avatar
marko committed
32
#include <mysql_priv.h>
33
#include <mysqld_error.h>
osku's avatar
osku committed
34 35 36 37 38 39 40

#include <m_ctype.h>
#include <hash.h>
#include <myisampack.h>
#include <mysys_err.h>
#include <my_sys.h>
#include "ha_innodb.h"
41 42
#include <mysql/plugin.h>

43
#ifndef MYSQL_SERVER
44 45 46 47
/* This is needed because of Bug #3596.  Let us hope that pthread_mutex_t
is defined the same in both builds: the MySQL server and the InnoDB plugin. */
extern pthread_mutex_t LOCK_thread_count;
#endif /* MYSQL_SERVER */
osku's avatar
osku committed
48

49 50 51 52 53 54 55 56 57
/** to protect innobase_open_files */
static pthread_mutex_t innobase_share_mutex;
/** to force correct commit order in binlog */
static pthread_mutex_t prepare_commit_mutex;
static ulong commit_threads = 0;
static pthread_mutex_t commit_threads_m;
static pthread_cond_t commit_cond;
static pthread_mutex_t commit_cond_m;
static bool innodb_inited = 0;
osku's avatar
osku committed
58

59 60 61 62
/*
  This needs to exist until the query cache callback is removed
  or learns to pass hton.
*/
63
static handlerton *innodb_hton_ptr;
64

osku's avatar
osku committed
65 66 67 68
#define INSIDE_HA_INNOBASE_CC

/* Include necessary InnoDB headers */
extern "C" {
69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92
#include "../storage/innobase/include/univ.i"
#include "../storage/innobase/include/os0file.h"
#include "../storage/innobase/include/os0thread.h"
#include "../storage/innobase/include/srv0start.h"
#include "../storage/innobase/include/srv0srv.h"
#include "../storage/innobase/include/trx0roll.h"
#include "../storage/innobase/include/trx0trx.h"
#include "../storage/innobase/include/trx0sys.h"
#include "../storage/innobase/include/mtr0mtr.h"
#include "../storage/innobase/include/row0ins.h"
#include "../storage/innobase/include/row0mysql.h"
#include "../storage/innobase/include/row0sel.h"
#include "../storage/innobase/include/row0upd.h"
#include "../storage/innobase/include/log0log.h"
#include "../storage/innobase/include/lock0lock.h"
#include "../storage/innobase/include/dict0crea.h"
#include "../storage/innobase/include/btr0cur.h"
#include "../storage/innobase/include/btr0btr.h"
#include "../storage/innobase/include/fsp0fsp.h"
#include "../storage/innobase/include/sync0sync.h"
#include "../storage/innobase/include/fil0fil.h"
#include "../storage/innobase/include/trx0xa.h"
#include "../storage/innobase/include/thr0loc.h"
#include "../storage/innobase/include/ha_prototypes.h"
osku's avatar
osku committed
93 94
}

95 96 97 98
static const long AUTOINC_OLD_STYLE_LOCKING = 0;
static const long AUTOINC_NEW_STYLE_LOCKING = 1;
static const long AUTOINC_NO_LOCKING = 2;

99
static long innobase_mirrored_log_groups, innobase_log_files_in_group,
100 101 102
	innobase_log_buffer_size, innobase_buffer_pool_awe_mem_mb,
	innobase_additional_mem_pool_size, innobase_file_io_threads,
	innobase_lock_wait_timeout, innobase_force_recovery,
103
	innobase_open_files, innobase_autoinc_lock_mode;
104

105
static long long innobase_buffer_pool_size, innobase_log_file_size;
osku's avatar
osku committed
106 107 108

/* The default values for the following char* start-up parameters
are determined in innobase_init below: */
109

110 111 112
static char*	innobase_data_home_dir			= NULL;
static char*	innobase_data_file_path			= NULL;
static char*	innobase_log_group_home_dir		= NULL;
osku's avatar
osku committed
113 114
/* The following has a misleading name: starting from 4.0.5, this also
affects Windows: */
115
static char*	innobase_unix_file_flush_method		= NULL;
osku's avatar
osku committed
116 117 118 119

/* Below we have boolean-valued start-up parameters, and their default
values */

120 121 122 123 124 125 126 127 128 129 130 131
static ulong	innobase_fast_shutdown			= 1;
#ifdef UNIV_LOG_ARCHIVE
static my_bool	innobase_log_archive			= FALSE;
static char*	innobase_log_arch_dir			= NULL;
#endif /* UNIV_LOG_ARCHIVE */
static my_bool	innobase_use_doublewrite		= TRUE;
static my_bool	innobase_use_checksums			= TRUE;
static my_bool	innobase_file_per_table			= FALSE;
static my_bool	innobase_locks_unsafe_for_binlog	= FALSE;
static my_bool	innobase_rollback_on_timeout		= FALSE;
static my_bool	innobase_create_status_file		= FALSE;
static my_bool innobase_stats_on_metadata		= TRUE;
vasil's avatar
vasil committed
132
static my_bool	innobase_adaptive_hash_index	= TRUE;
osku's avatar
osku committed
133

134
static char*	internal_innobase_data_file_path	= NULL;
osku's avatar
osku committed
135 136 137 138 139 140 141

/* The following counter is used to convey information to InnoDB
about server activity: in selects it is not sensible to call
srv_active_wake_master_thread after each fetch or search, we only do
it every INNOBASE_WAKE_INTERVAL'th step. */

#define INNOBASE_WAKE_INTERVAL	32
marko's avatar
marko committed
142
static ulong	innobase_active_counter	= 0;
osku's avatar
osku committed
143

144
static HASH	innobase_open_tables;
osku's avatar
osku committed
145

146
#ifdef __NETWARE__	/* some special cleanup for NetWare */
osku's avatar
osku committed
147 148 149
bool nw_panic = FALSE;
#endif

150
static uchar* innobase_get_key(INNOBASE_SHARE *share, size_t *length,
151
	my_bool not_used __attribute__((unused)));
osku's avatar
osku committed
152 153
static INNOBASE_SHARE *get_share(const char *table_name);
static void free_share(INNOBASE_SHARE *share);
154 155 156 157 158 159 160 161 162 163
static int innobase_close_connection(handlerton *hton, THD* thd);
static int innobase_commit(handlerton *hton, THD* thd, bool all);
static int innobase_rollback(handlerton *hton, THD* thd, bool all);
static int innobase_rollback_to_savepoint(handlerton *hton, THD* thd, 
           void *savepoint);
static int innobase_savepoint(handlerton *hton, THD* thd, void *savepoint);
static int innobase_release_savepoint(handlerton *hton, THD* thd, 
           void *savepoint);
static handler *innobase_create_handler(handlerton *hton,
                                        TABLE_SHARE *table,
marko's avatar
marko committed
164
                                        MEM_ROOT *mem_root);
osku's avatar
osku committed
165

166
static const char innobase_hton_name[]= "InnoDB";
osku's avatar
osku committed
167

168 169 170 171 172 173 174 175 176 177 178

static MYSQL_THDVAR_BOOL(support_xa, PLUGIN_VAR_OPCMDARG,
  "Enable InnoDB support for the XA two-phase commit",
  /* check_func */ NULL, /* update_func */ NULL,
  /* default */ TRUE);

static MYSQL_THDVAR_BOOL(table_locks, PLUGIN_VAR_OPCMDARG,
  "Enable InnoDB locking in LOCK TABLES",
  /* check_func */ NULL, /* update_func */ NULL,
  /* default */ TRUE);

179 180 181
/*
  Handlerton callback that constructs the InnoDB handler object for a table.

  @param hton      handlerton passed through to the ha_innobase constructor
  @param table     table share passed through to the ha_innobase constructor
  @param mem_root  memory root used by the placement-new allocation

  @return the newly constructed ha_innobase, as a handler pointer
*/
static handler *innobase_create_handler(handlerton *hton,
                                        TABLE_SHARE *table,
                                        MEM_ROOT *mem_root)
{
  return new (mem_root) ha_innobase(hton, table);
}

186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318
/***********************************************************************
This function is used to prepare X/Open XA distributed transaction   */
static
int
innobase_xa_prepare(
/*================*/
			/* out: 0 or error number */
	handlerton* hton,
	THD*	thd,	/* in: handle to the MySQL thread of the user
			whose XA transaction should be prepared */
	bool	all);	/* in: TRUE - commit transaction
			FALSE - the current SQL statement ended */
/***********************************************************************
This function is used to recover X/Open XA distributed transactions   */
static
int
innobase_xa_recover(
/*================*/
				/* out: number of prepared transactions
				stored in xid_list */
	handlerton* hton,
	XID*	xid_list,	/* in/out: prepared transactions */
	uint	len);		/* in: number of slots in xid_list */
/***********************************************************************
This function is used to commit one X/Open XA distributed transaction
which is in the prepared state */
static
int
innobase_commit_by_xid(
/*===================*/
			/* out: 0 or error number */
	handlerton* hton,
	XID*	xid);	/* in: X/Open XA transaction identification */
/***********************************************************************
This function is used to rollback one X/Open XA distributed transaction
which is in the prepared state */
static
int
innobase_rollback_by_xid(
/*=====================*/
			/* out: 0 or error number */
	handlerton* hton,
	XID	*xid);	/* in: X/Open XA transaction identification */
/***********************************************************************
Create a consistent view for a cursor based on current transaction
which is created if the corresponding MySQL thread still lacks one.
This consistent view is then used inside of MySQL when accessing records
using a cursor. */
static
void*
innobase_create_cursor_view(
/*========================*/
				/* out: pointer to cursor view or NULL */
	handlerton*	hton,	/* in: innobase hton */
	THD*		thd);	/* in: user thread handle */
/***********************************************************************
Set the given consistent cursor view to a transaction which is created
if the corresponding MySQL thread still lacks one. If the given
consistent cursor view is NULL global read view of a transaction is
restored to a transaction read view. */
static
void
innobase_set_cursor_view(
/*=====================*/
	handlerton* hton,
	THD*	thd,	/* in: user thread handle */
	void*	curview);/* in: Consistent cursor view to be set */
/***********************************************************************
Close the given consistent cursor view of a transaction and restore
global read view to a transaction read view. Transaction is created if the
corresponding MySQL thread still lacks one. */
static
void
innobase_close_cursor_view(
/*=======================*/
	handlerton* hton,
	THD*	thd,	/* in: user thread handle */
	void*	curview);/* in: Consistent read view to be closed */
/*********************************************************************
Removes all tables in the named database inside InnoDB. The function
returns nothing (void). */
static
void
innobase_drop_database(
/*===================*/
	handlerton* hton, /* in: handlerton of Innodb */
	char*	path);	/* in: database path; inside InnoDB the name
			of the last directory in the path is used as
			the database name: for example, in 'mysql/data/test'
			the database name is 'test' */
/***********************************************************************
Closes an InnoDB database. */
static
int
innobase_end(handlerton *hton, ha_panic_function type);

/*********************************************************************
Creates an InnoDB transaction struct for the thd if it does not yet have one.
Starts a new InnoDB transaction if a transaction is not yet started, and
assigns a new snapshot for a consistent read if the transaction does not yet
have one. */
static
int
innobase_start_trx_and_assign_read_view(
/*====================================*/
			/* out: 0 */
	handlerton* hton, /* in: Innodb handlerton */ 
	THD*	thd);	/* in: MySQL thread handle of the user for whom
			the transaction should be started and the
			consistent read snapshot assigned */
/********************************************************************
Flushes InnoDB logs to disk and makes a checkpoint. Really, a commit flushes
the logs, and the name of this function should be innobase_checkpoint. */
static
bool
innobase_flush_logs(
/*================*/
				/* out: TRUE if error */
	handlerton*	hton);	/* in: InnoDB handlerton */

/****************************************************************************
Implements the SHOW INNODB STATUS command. Sends the output of the InnoDB
Monitor to the client. */
static
bool
innodb_show_status(
/*===============*/
	handlerton*	hton,	/* in: the innodb handlerton */
	THD*	thd,	/* in: the MySQL query thread of the caller */
	stat_print_fn *stat_print);
static
bool innobase_show_status(handlerton *hton, THD* thd, 
                          stat_print_fn* stat_print,
                          enum ha_stat_type stat_type);
osku's avatar
osku committed
319

osku's avatar
osku committed
320 321
/*********************************************************************
Commits a transaction in an InnoDB database. */
322
static
osku's avatar
osku committed
323 324 325 326 327
void
innobase_commit_low(
/*================*/
	trx_t*	trx);	/* in: transaction handle */

328
/* Table of InnoDB status variables: each row gives the variable name, the
address of the corresponding field of export_vars, and the SHOW_* type used
to display it. The table is terminated by a row whose name is NullS.
Note that row_lock_time is the only SHOW_LONGLONG entry; the
buffer_pool_pages_latched row exists only in UNIV_DEBUG builds. */
static SHOW_VAR innodb_status_variables[]= {
  {"buffer_pool_pages_data",
  (char*) &export_vars.innodb_buffer_pool_pages_data,	  SHOW_LONG},
  {"buffer_pool_pages_dirty",
  (char*) &export_vars.innodb_buffer_pool_pages_dirty,	  SHOW_LONG},
  {"buffer_pool_pages_flushed",
  (char*) &export_vars.innodb_buffer_pool_pages_flushed,  SHOW_LONG},
  {"buffer_pool_pages_free",
  (char*) &export_vars.innodb_buffer_pool_pages_free,	  SHOW_LONG},
#ifdef UNIV_DEBUG
  {"buffer_pool_pages_latched",
  (char*) &export_vars.innodb_buffer_pool_pages_latched,  SHOW_LONG},
#endif /* UNIV_DEBUG */
  {"buffer_pool_pages_misc",
  (char*) &export_vars.innodb_buffer_pool_pages_misc,	  SHOW_LONG},
  {"buffer_pool_pages_total",
  (char*) &export_vars.innodb_buffer_pool_pages_total,	  SHOW_LONG},
  {"buffer_pool_read_ahead_rnd",
  (char*) &export_vars.innodb_buffer_pool_read_ahead_rnd, SHOW_LONG},
  {"buffer_pool_read_ahead_seq",
  (char*) &export_vars.innodb_buffer_pool_read_ahead_seq, SHOW_LONG},
  {"buffer_pool_read_requests",
  (char*) &export_vars.innodb_buffer_pool_read_requests,  SHOW_LONG},
  {"buffer_pool_reads",
  (char*) &export_vars.innodb_buffer_pool_reads,	  SHOW_LONG},
  {"buffer_pool_wait_free",
  (char*) &export_vars.innodb_buffer_pool_wait_free,	  SHOW_LONG},
  {"buffer_pool_write_requests",
  (char*) &export_vars.innodb_buffer_pool_write_requests, SHOW_LONG},
  {"data_fsyncs",
  (char*) &export_vars.innodb_data_fsyncs,		  SHOW_LONG},
  {"data_pending_fsyncs",
  (char*) &export_vars.innodb_data_pending_fsyncs,	  SHOW_LONG},
  {"data_pending_reads",
  (char*) &export_vars.innodb_data_pending_reads,	  SHOW_LONG},
  {"data_pending_writes",
  (char*) &export_vars.innodb_data_pending_writes,	  SHOW_LONG},
  {"data_read",
  (char*) &export_vars.innodb_data_read,		  SHOW_LONG},
  {"data_reads",
  (char*) &export_vars.innodb_data_reads,		  SHOW_LONG},
  {"data_writes",
  (char*) &export_vars.innodb_data_writes,		  SHOW_LONG},
  {"data_written",
  (char*) &export_vars.innodb_data_written,		  SHOW_LONG},
  {"dblwr_pages_written",
  (char*) &export_vars.innodb_dblwr_pages_written,	  SHOW_LONG},
  {"dblwr_writes",
  (char*) &export_vars.innodb_dblwr_writes,		  SHOW_LONG},
  {"log_waits",
  (char*) &export_vars.innodb_log_waits,		  SHOW_LONG},
  {"log_write_requests",
  (char*) &export_vars.innodb_log_write_requests,	  SHOW_LONG},
  {"log_writes",
  (char*) &export_vars.innodb_log_writes,		  SHOW_LONG},
  {"os_log_fsyncs",
  (char*) &export_vars.innodb_os_log_fsyncs,		  SHOW_LONG},
  {"os_log_pending_fsyncs",
  (char*) &export_vars.innodb_os_log_pending_fsyncs,	  SHOW_LONG},
  {"os_log_pending_writes",
  (char*) &export_vars.innodb_os_log_pending_writes,	  SHOW_LONG},
  {"os_log_written",
  (char*) &export_vars.innodb_os_log_written,		  SHOW_LONG},
  {"page_size",
  (char*) &export_vars.innodb_page_size,		  SHOW_LONG},
  {"pages_created",
  (char*) &export_vars.innodb_pages_created,		  SHOW_LONG},
  {"pages_read",
  (char*) &export_vars.innodb_pages_read,		  SHOW_LONG},
  {"pages_written",
  (char*) &export_vars.innodb_pages_written,		  SHOW_LONG},
  {"row_lock_current_waits",
  (char*) &export_vars.innodb_row_lock_current_waits,	  SHOW_LONG},
  {"row_lock_time",
  (char*) &export_vars.innodb_row_lock_time,		  SHOW_LONGLONG},
  {"row_lock_time_avg",
  (char*) &export_vars.innodb_row_lock_time_avg,	  SHOW_LONG},
  {"row_lock_time_max",
  (char*) &export_vars.innodb_row_lock_time_max,	  SHOW_LONG},
  {"row_lock_waits",
  (char*) &export_vars.innodb_row_lock_waits,		  SHOW_LONG},
  {"rows_deleted",
  (char*) &export_vars.innodb_rows_deleted,		  SHOW_LONG},
  {"rows_inserted",
  (char*) &export_vars.innodb_rows_inserted,		  SHOW_LONG},
  {"rows_read",
  (char*) &export_vars.innodb_rows_read,		  SHOW_LONG},
  {"rows_updated",
  (char*) &export_vars.innodb_rows_updated,		  SHOW_LONG},
  {NullS, NullS, SHOW_LONG}
};
osku's avatar
osku committed
419 420 421

/* General functions */

422 423 424 425 426 427 428 429 430 431 432 433 434
/**********************************************************************
Returns true if the thread is the replication thread on the slave
server. Used in srv_conc_enter_innodb() to determine if the thread
should be allowed to enter InnoDB - the replication thread is treated
differently than other threads. Also used in
srv_conc_force_exit_innodb(). The answer is obtained from
thd_slave_thread() and converted to ibool. */
extern "C"
ibool
thd_is_replication_slave_thread(
/*============================*/
			/* out: true if thd is the replication thread */
	void*	thd)	/* in: thread handle (THD*) */
{
	return((ibool) thd_slave_thread((THD*) thd));
}

osku's avatar
osku committed
438 439 440 441 442 443 444 445 446
/**********************************************************************
Save some CPU by testing the value of srv_thread_concurrency in inline
functions: srv_conc_enter_innodb() is called only when
srv_thread_concurrency is nonzero. */
inline
void
innodb_srv_conc_enter_innodb(
/*=========================*/
	trx_t*	trx)	/* in: transaction handle */
{
	if (UNIV_LIKELY(!srv_thread_concurrency)) {

		/* srv_thread_concurrency is zero: skip the call */
		return;
	}

	srv_conc_enter_innodb(trx);
}

/**********************************************************************
Save some CPU by testing the value of srv_thread_concurrency in inline
functions: srv_conc_exit_innodb() is called only when
srv_thread_concurrency is nonzero. */
inline
void
innodb_srv_conc_exit_innodb(
/*========================*/
	trx_t*	trx)	/* in: transaction handle */
{
	if (UNIV_LIKELY(!srv_thread_concurrency)) {

		/* srv_thread_concurrency is zero: skip the call */
		return;
	}

	srv_conc_exit_innodb(trx);
}

/**********************************************************************
Gives up the per-statement resources a transaction may be holding: the
search latch, if trx->has_search_latch is set, and the InnoDB thread FIFO
ticket, if trx->declared_to_be_inside_innodb is set. These should be
released at each SQL statement end, and also when mysqld passes the control
to the client. It does no harm to release these also in the middle of an
SQL statement. */
inline
void
innobase_release_stat_resources(
/*============================*/
	trx_t*	trx)	/* in: transaction object */
{
	/* First the search latch, if this transaction reserved it */
	if (trx->has_search_latch) {
		trx_search_latch_release_if_reserved(trx);
	}

	if (!trx->declared_to_be_inside_innodb) {
		/* Not declared to be inside InnoDB: no ticket to give back */

		return;
	}

	/* Release our possible ticket in the FIFO */
	srv_conc_force_exit_innodb(trx);
}

494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509
/**********************************************************************
Tells whether the transaction this thread is processing has edited
non-transactional tables, as reported by thd_non_transactional_update().
Used by the deadlock detector when deciding which transaction to rollback
in case of a deadlock - we try to avoid rolling back transactions that
have edited non-transactional tables. */
extern "C"
ibool
thd_has_edited_nontrans_tables(
/*===========================*/
			/* out: true if non-transactional tables have
			been edited */
	void*	thd)	/* in: thread handle (THD*) */
{
	THD*	mysql_thd = (THD*) thd;

	return((ibool) thd_non_transactional_update(mysql_thd));
}

510 511 512 513 514 515 516 517 518 519 520 521
/**********************************************************************
Tells whether the thread is executing a SELECT statement, i.e. whether
thd_sql_command() reports SQLCOM_SELECT for it. */
extern "C"
ibool
thd_is_select(
/*==========*/
				/* out: true if thd is executing SELECT */
	const void*	thd)	/* in: thread handle (THD*) */
{
	const THD*	mysql_thd = (const THD*) thd;

	return(thd_sql_command(mysql_thd) == SQLCOM_SELECT);
}

522 523 524 525 526 527
/************************************************************************
Obtain the InnoDB transaction of a MySQL thread. The result is a reference
to the trx_t* stored at the location returned by
thd_ha_data(thd, innodb_hton_ptr), so the caller can both read and assign
the pointer through it. */
inline
trx_t*&
thd_to_trx(
/*=======*/
			/* out: reference to transaction pointer */
	THD*	thd)	/* in: MySQL thread */
{
	return(*(trx_t**) thd_ha_data(thd, innodb_hton_ptr));
}

osku's avatar
osku committed
534 535 536 537
/************************************************************************
Call this function when mysqld passes control to the client. That is to
avoid deadlocks on the adaptive hash S-latch possibly held by thd. For more
documentation, see handler.cc. */
538
static
osku's avatar
osku committed
539
int
osku's avatar
osku committed
540 541
innobase_release_temporary_latches(
/*===============================*/
542 543 544
				/* out: 0 */
	handlerton*	hton,	/* in: handlerton */
	THD*		thd)	/* in: MySQL thread */
osku's avatar
osku committed
545 546 547
{
	trx_t*	trx;

548 549
	DBUG_ASSERT(hton == innodb_hton_ptr);

osku's avatar
osku committed
550
	if (!innodb_inited) {
551

osku's avatar
osku committed
552
		return 0;
osku's avatar
osku committed
553 554
	}

555
	trx = thd_to_trx(thd);
osku's avatar
osku committed
556 557

	if (trx) {
558
		innobase_release_stat_resources(trx);
osku's avatar
osku committed
559
	}
osku's avatar
osku committed
560
	return 0;
osku's avatar
osku committed
561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595
}

/************************************************************************
Bumps innobase_active_counter and, on every INNOBASE_WAKE_INTERVALth
call, invokes srv_active_wake_master_thread(). This function should be used
when a single database operation may introduce a small need for
server utility activity, like checkpointing. */
inline
void
innobase_active_small(void)
/*=======================*/
{
	innobase_active_counter++;

	if ((innobase_active_counter % INNOBASE_WAKE_INTERVAL) != 0) {
		/* Not yet a multiple of the wake interval */

		return;
	}

	srv_active_wake_master_thread();
}

/************************************************************************
Converts an InnoDB error code to a MySQL error code and also tells to MySQL
about a possible transaction rollback inside InnoDB caused by a lock wait
timeout or a deadlock. */
static
int
convert_error_code_to_mysql(
/*========================*/
			/* out: MySQL error code */
	int	error,	/* in: InnoDB error code */
	THD*	thd)	/* in: user thread handle or NULL */
{
	if (error == DB_SUCCESS) {

		return(0);

596
	} else if (error == (int) DB_DUPLICATE_KEY) {
osku's avatar
osku committed
597

598
		return(HA_ERR_FOUND_DUPP_KEY);
osku's avatar
osku committed
599

600
	} else if (error == (int) DB_FOREIGN_DUPLICATE_KEY) {
601 602 603

		return(HA_ERR_FOREIGN_DUPLICATE_KEY);

604
	} else if (error == (int) DB_RECORD_NOT_FOUND) {
osku's avatar
osku committed
605

606
		return(HA_ERR_NO_ACTIVE_RECORD);
osku's avatar
osku committed
607

608
	} else if (error == (int) DB_ERROR) {
osku's avatar
osku committed
609

610
		return(-1); /* unspecified error */
osku's avatar
osku committed
611

612 613 614 615
	} else if (error == (int) DB_DEADLOCK) {
		/* Since we rolled back the whole transaction, we must
		tell it also to MySQL so that MySQL knows to empty the
		cached binlog for this transaction */
osku's avatar
osku committed
616

617 618 619
		if (thd) {
			thd_mark_transaction_to_rollback(thd, TRUE);
		}
osku's avatar
osku committed
620

621 622
		return(HA_ERR_LOCK_DEADLOCK);
	} else if (error == (int) DB_LOCK_WAIT_TIMEOUT) {
osku's avatar
osku committed
623 624 625 626 627

		/* Starting from 5.0.13, we let MySQL just roll back the
		latest SQL statement in a lock wait timeout. Previously, we
		rolled back the whole transaction. */

628 629 630 631
		if (thd) {
			thd_mark_transaction_to_rollback(
				thd, (bool)row_rollback_on_timeout);
		}
osku's avatar
osku committed
632

633
		return(HA_ERR_LOCK_WAIT_TIMEOUT);
osku's avatar
osku committed
634

635
	} else if (error == (int) DB_NO_REFERENCED_ROW) {
osku's avatar
osku committed
636

637
		return(HA_ERR_NO_REFERENCED_ROW);
osku's avatar
osku committed
638

639
	} else if (error == (int) DB_ROW_IS_REFERENCED) {
osku's avatar
osku committed
640

641
		return(HA_ERR_ROW_IS_REFERENCED);
osku's avatar
osku committed
642

643
	} else if (error == (int) DB_CANNOT_ADD_CONSTRAINT) {
osku's avatar
osku committed
644

645
		return(HA_ERR_CANNOT_ADD_FOREIGN);
osku's avatar
osku committed
646

647
	} else if (error == (int) DB_CANNOT_DROP_CONSTRAINT) {
osku's avatar
osku committed
648

649
		return(HA_ERR_ROW_IS_REFERENCED); /* TODO: This is a bit
osku's avatar
osku committed
650 651
						misleading, a new MySQL error
						code should be introduced */
652
	} else if (error == (int) DB_COL_APPEARS_TWICE_IN_INDEX) {
osku's avatar
osku committed
653

654
		return(HA_ERR_CRASHED);
osku's avatar
osku committed
655

656
	} else if (error == (int) DB_OUT_OF_FILE_SPACE) {
osku's avatar
osku committed
657

658
		return(HA_ERR_RECORD_FILE_FULL);
osku's avatar
osku committed
659

660
	} else if (error == (int) DB_TABLE_IS_BEING_USED) {
osku's avatar
osku committed
661

662
		return(HA_ERR_WRONG_COMMAND);
osku's avatar
osku committed
663

664
	} else if (error == (int) DB_TABLE_NOT_FOUND) {
osku's avatar
osku committed
665

666
		return(HA_ERR_NO_SUCH_TABLE);
osku's avatar
osku committed
667

668
	} else if (error == (int) DB_TOO_BIG_RECORD) {
osku's avatar
osku committed
669

670
		return(HA_ERR_TO_BIG_ROW);
osku's avatar
osku committed
671

672
	} else if (error == (int) DB_CORRUPTION) {
osku's avatar
osku committed
673

674 675
		return(HA_ERR_CRASHED);
	} else if (error == (int) DB_NO_SAVEPOINT) {
osku's avatar
osku committed
676

677 678
		return(HA_ERR_NO_SAVEPOINT);
	} else if (error == (int) DB_LOCK_TABLE_FULL) {
marko's avatar
marko committed
679 680 681 682
 		/* Since we rolled back the whole transaction, we must
 		tell it also to MySQL so that MySQL knows to empty the
 		cached binlog for this transaction */

683 684 685
		if (thd) {
			thd_mark_transaction_to_rollback(thd, TRUE);
		}
marko's avatar
marko committed
686 687

    		return(HA_ERR_LOCK_TABLE_FULL);
688 689 690 691 692 693 694 695 696 697 698 699 700 701
	} else if (error == DB_TOO_MANY_CONCURRENT_TRXS) {

		/* Once MySQL add the appropriate code to errmsg.txt then
		we can get rid of this #ifdef. NOTE: The code checked by
		the #ifdef is the suggested name for the error condition
		and the actual error code name could very well be different.
		This will require some monitoring, ie. the status
		of this request on our part.*/
#ifdef ER_TOO_MANY_CONCURRENT_TRXS
		return(ER_TOO_MANY_CONCURRENT_TRXS);
#else
		return(HA_ERR_RECORD_FILE_FULL);
#endif

702 703 704
	} else if (error == DB_UNSUPPORTED) {

		return(HA_ERR_UNSUPPORTED);
marko's avatar
marko committed
705 706 707
    	} else {
    		return(-1);			// Unknown error
    	}
osku's avatar
osku committed
708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746
}

/*****************************************************************
If you want to print a thd that is not associated with the current thread,
you must call this function before reserving the InnoDB kernel_mutex, to
protect MySQL from setting thd->query NULL. If you print a thd of the current
thread, we know that MySQL cannot modify thd->query, and it is not necessary
to call this. Call innobase_mysql_end_print_arbitrary_thd() after you release
the kernel_mutex.
NOTE that /mysql/innobase/lock/lock0lock.c must contain the prototype for this
function! */
extern "C"
void
innobase_mysql_prepare_print_arbitrary_thd(void)
/*============================================*/
{
	/* Acquire LOCK_thread_count; the matching release is done by
	innobase_mysql_end_print_arbitrary_thd(). */
	VOID(pthread_mutex_lock(&LOCK_thread_count));
}

/*****************************************************************
Releases the mutex reserved by innobase_mysql_prepare_print_arbitrary_thd().
NOTE that /mysql/innobase/lock/lock0lock.c must contain the prototype for this
function! */
extern "C"
void
innobase_mysql_end_print_arbitrary_thd(void)
/*========================================*/
{
	/* Release LOCK_thread_count, which was acquired by
	innobase_mysql_prepare_print_arbitrary_thd(). */
	VOID(pthread_mutex_unlock(&LOCK_thread_count));
}

/*****************************************************************
Prints info of a THD object (== user session thread) to the given file.
NOTE that /mysql/innobase/trx/trx0trx.c must contain the prototype for
this function! */
extern "C"
void
innobase_mysql_print_thd(
/*=====================*/
747 748
	FILE*	f,		/* in: output stream */
	void*	input_thd,	/* in: pointer to a MySQL THD object */
osku's avatar
osku committed
749 750 751
	uint	max_query_len)	/* in: max query length to print, or 0 to
				   use the default max length */
{
752 753
	THD*	thd;
	char	buffer[1024];
osku's avatar
osku committed
754

755 756 757
	thd = (THD*) input_thd;
	fputs(thd_security_context(thd, buffer, sizeof(buffer), 
				   max_query_len), f);
osku's avatar
osku committed
758 759 760 761 762 763 764
	putc('\n', f);
}

/**********************************************************************
Get the variable length bounds of the given character set.

NOTE that the exact prototype of this function has to be in
765
/innobase/include/data0type.ic! */
osku's avatar
osku committed
766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788
extern "C"
void
innobase_get_cset_width(
/*====================*/
	ulint	cset,		/* in: MySQL charset-collation code */
	ulint*	mbminlen,	/* out: minimum length of a char (in bytes) */
	ulint*	mbmaxlen)	/* out: maximum length of a char (in bytes) */
{
	CHARSET_INFO*	cs;

	ut_ad(cset < 256);
	ut_ad(mbminlen);
	ut_ad(mbmaxlen);

	cs = all_charsets[cset];

	if (cs == NULL) {
		/* No charset is registered under this code; the only
		code for which that is tolerated is 0, and both widths
		are then reported as 0. */
		ut_a(cset == 0);

		*mbmaxlen = 0;
		*mbminlen = 0;

		return;
	}

	*mbminlen = cs->mbminlen;
	*mbmaxlen = cs->mbmaxlen;
}

789 790 791 792 793 794 795 796 797 798 799 800 801 802 803
/**********************************************************************
Converts an identifier to a table name.

NOTE that the exact prototype of this function has to be in
/innobase/dict/dict0dict.c! */
extern "C"
void
innobase_convert_from_table_id(
/*===========================*/
	char*		to,	/* out: converted identifier */
	const char*	from,	/* in: identifier to convert */
	ulint		len)	/* in: length of 'to', in bytes */
{
	uint	errors;

804
	strconvert(thd_charset(current_thd), from,
marko's avatar
marko committed
805
		   &my_charset_filename, to, (uint) len, &errors);
806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822
}

/**********************************************************************
Converts an identifier to UTF-8.

NOTE that the exact prototype of this function has to be in
/innobase/dict/dict0dict.c! */
extern "C"
void
innobase_convert_from_id(
/*=====================*/
	char*		to,	/* out: converted identifier */
	const char*	from,	/* in: identifier to convert */
	ulint		len)	/* in: length of 'to', in bytes */
{
	uint	errors;

823
	strconvert(thd_charset(current_thd), from,
marko's avatar
marko committed
824
		   system_charset_info, to, (uint) len, &errors);
825 826
}

osku's avatar
osku committed
827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856
/**********************************************************************
Compares NUL-terminated UTF-8 strings case insensitively.

NOTE that the exact prototype of this function has to be in
/innobase/dict/dict0dict.c! */
extern "C"
int
innobase_strcasecmp(
/*================*/
				/* out: 0 if a=b, <0 if a<b, >0 if a>b */
	const char*	a,	/* in: first string to compare */
	const char*	b)	/* in: second string to compare */
{
	/* The comparison is delegated to my_strcasecmp() using
	system_charset_info. */
	const int	cmp = my_strcasecmp(system_charset_info, a, b);

	return(cmp);
}

/**********************************************************************
Makes all characters in a NUL-terminated UTF-8 string lower case.

NOTE that the exact prototype of this function has to be in
/innobase/dict/dict0dict.c! */
extern "C"
void
innobase_casedn_str(
/*================*/
	char*	a)	/* in/out: string to put in lower case */
{
	my_casedn_str(system_charset_info, a);
}

857 858 859 860 861 862 863 864 865 866 867 868
/**************************************************************************
Determines the connection character set.

NOTE that the exact prototype of this function has to be in
/innobase/dict/dict0dict.c! */
extern "C"
struct charset_info_st*
innobase_get_charset(
/*=================*/
				/* out: connection character set */
	void*	mysql_thd)	/* in: MySQL thread handle */
{
869
	return(thd_charset((THD*) mysql_thd));
870 871
}

osku's avatar
osku committed
872 873 874 875 876 877 878 879
/*************************************************************************
Creates a temporary file. */
extern "C"
int
innobase_mysql_tmpfile(void)
/*========================*/
			/* out: temporary file descriptor, or < 0 on error */
{
880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901
	int	fd2 = -1;
	File	fd = mysql_tmpfile("ib");
	if (fd >= 0) {
		/* Copy the file descriptor, so that the additional resources
		allocated by create_temp_file() can be freed by invoking
		my_close().

		Because the file descriptor returned by this function
		will be passed to fdopen(), it will be closed by invoking
		fclose(), which in turn will invoke close() instead of
		my_close(). */
		fd2 = dup(fd);
		if (fd2 < 0) {
			DBUG_PRINT("error",("Got error %d on dup",fd2));
			my_errno=errno;
			my_error(EE_OUT_OF_FILERESOURCES,
				 MYF(ME_BELL+ME_WAITTANG),
				 "ib*", my_errno);
		}
		my_close(fd, MYF(MY_WME));
	}
	return(fd2);
osku's avatar
osku committed
902 903
}

904 905 906 907 908 909 910 911 912 913 914 915 916 917 918
/*************************************************************************
Wrapper around MySQL's copy_and_convert function, see it for
documentation. */
extern "C"
ulint
innobase_convert_string(
/*====================*/
	void*		to,
	ulint		to_length,
	CHARSET_INFO*	to_cs,
	const void*	from,
	ulint		from_length,
	CHARSET_INFO*	from_cs,
	uint*		errors)
{
	/* Narrow the InnoDB-side argument types to the ones that
	copy_and_convert() is called with, and pass its result back. */
	char*		dst	= (char*) to;
	const char*	src	= (const char*) from;
	ulint		n_conv;

	n_conv = copy_and_convert(dst, (uint32) to_length, to_cs,
				  src, (uint32) from_length, from_cs,
				  errors);

	return(n_conv);
}

osku's avatar
osku committed
924 925 926 927 928 929 930 931 932 933 934
/*************************************************************************
Gets the InnoDB transaction handle for a MySQL handler object, creates
an InnoDB transaction struct if the corresponding MySQL thread struct still
lacks one. */
static
trx_t*
check_trx_exists(
/*=============*/
			/* out: InnoDB transaction handle */
	THD*	thd)	/* in: user thread handle */
{
	/* trx is a reference to the pointer returned by thd_to_trx(), so
	assigning to it below also updates that pointer. */
	trx_t*&	trx = thd_to_trx(thd);

	ut_ad(thd == current_thd);

	if (trx != NULL) {
		/* An existing handle must carry the expected magic
		number; anything else is treated as memory corruption. */
		if (trx->magic_n != TRX_MAGIC_N) {
			mem_analyze_corruption(trx);

			ut_error;
		}
	} else {
		DBUG_ASSERT(thd != NULL);

		/* No transaction yet for this thd: allocate one and link
		it to the thd */
		trx = trx_allocate_for_mysql();

		trx->mysql_thd = thd;
		trx->mysql_query_str = thd_query(thd);

		/* Update the info whether we should skip XA steps that eat
		CPU time */
		trx->support_xa = THDVAR(thd, support_xa);
	}

	/* Copy the foreign key and unique check options of the thd into
	the transaction on every call */
	trx->check_foreigns =
		thd_test_options(thd, OPTION_NO_FOREIGN_KEY_CHECKS)
		? FALSE : TRUE;

	trx->check_unique_secondary =
		thd_test_options(thd, OPTION_RELAXED_UNIQUE_CHECKS)
		? FALSE : TRUE;

	return(trx);
}


/*************************************************************************
Construct ha_innobase handler. */

976 977
ha_innobase::ha_innobase(handlerton *hton, TABLE_SHARE *table_arg)
	: handler(hton, table_arg),
	  /* Flag bits stored in int_table_flags, one per line */
	  int_table_flags(HA_REC_NOT_IN_SEQ
			  | HA_NULL_IN_KEY
			  | HA_CAN_INDEX_BLOBS
			  | HA_CAN_SQL_HANDLER
			  | HA_PRIMARY_KEY_REQUIRED_FOR_POSITION
			  | HA_PRIMARY_KEY_IN_READ_INDEX
			  | HA_BINLOG_ROW_CAPABLE
			  | HA_CAN_GEOMETRY
			  | HA_PARTIAL_COLUMN_READ
			  | HA_TABLE_SCAN_ON_INDEX),
	  start_of_scan(0),
	  num_write_row(0)
{
	/* All members are set up in the initializer list above */
}

/*************************************************************************
Updates the user_thd field in a handle and also allocates a new InnoDB
transaction handle if needed, and updates the transaction fields in the
prebuilt struct. */
inline
int
ha_innobase::update_thd(
/*====================*/
			/* out: 0 or error code */
	THD*	thd)	/* in: thd to use the handle */
{
	/* Fetch the transaction of thd; check_trx_exists() allocates
	one if thd does not have it yet */
	trx_t* const	trx = check_trx_exists(thd);

	/* Repoint the prebuilt struct only when it refers to a
	different transaction */
	if (trx != prebuilt->trx) {
		row_update_prebuilt_trx(prebuilt, trx);
	}

	user_thd = thd;

	/* This implementation always returns 0 */
	return(0);
}

/*************************************************************************
Registers that InnoDB takes part in an SQL statement, so that MySQL knows to
roll back the statement if the statement results in an error. This MUST be
called for every SQL statement that may be rolled back by MySQL. Calling this
several times to register the same statement is allowed, too. */
inline
void
innobase_register_stmt(
/*===================*/
1025
        handlerton*	hton,	/* in: Innobase hton */
osku's avatar
osku committed
1026 1027
	THD*	thd)	/* in: MySQL thd (connection) object */
{
1028
	/* Register the statement */
1029
	trans_register_ha(thd, FALSE, hton);
osku's avatar
osku committed
1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042
}

/*************************************************************************
Registers an InnoDB transaction in MySQL, so that the MySQL XA code knows
to call the InnoDB prepare and commit, or rollback for the transaction. This
MUST be called for every transaction for which the user may call commit or
rollback. Calling this several times to register the same transaction is
allowed, too.
This function also registers the current SQL statement. */
inline
void
innobase_register_trx_and_stmt(
/*===========================*/
1043
        handlerton *hton, /* in: Innobase handlerton */
osku's avatar
osku committed
1044 1045 1046 1047 1048
	THD*	thd)	/* in: MySQL thd (connection) object */
{
	/* NOTE that actually innobase_register_stmt() registers also
	the transaction in the AUTOCOMMIT=1 mode. */

1049
	innobase_register_stmt(hton, thd);
osku's avatar
osku committed
1050

1051
	if (thd_test_options(thd, OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN)) {
osku's avatar
osku committed
1052

1053
		/* No autocommit mode, register for a transaction */
1054
		trans_register_ha(thd, TRUE, hton);
1055
	}
osku's avatar
osku committed
1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118
}

/*   BACKGROUND INFO: HOW THE MYSQL QUERY CACHE WORKS WITH INNODB
     ------------------------------------------------------------

1) The use of the query cache for TBL is disabled when there is an
uncommitted change to TBL.

2) When a change to TBL commits, InnoDB stores the current value of
its global trx id counter, let us denote it by INV_TRX_ID, to the table object
in the InnoDB data dictionary, and does only allow such transactions whose
id <= INV_TRX_ID to use the query cache.

3) When InnoDB does an INSERT/DELETE/UPDATE to a table TBL, or an implicit
modification because of an ON DELETE CASCADE, we invalidate the MySQL query
cache of TBL immediately.

How this is implemented inside InnoDB:

1) Since every modification always sets an IX type table lock on the InnoDB
table, it is easy to check if there can be uncommitted modifications for a
table: just check if there are locks in the lock list of the table.

2) When a transaction inside InnoDB commits, it reads the global trx id
counter and stores the value INV_TRX_ID to the tables on which it had a lock.

3) If there is an implicit table change from ON DELETE CASCADE or SET NULL,
InnoDB calls an invalidate method for the MySQL query cache for that table.

How this is implemented inside sql_cache.cc:

1) The query cache for an InnoDB table TBL is invalidated immediately at an
INSERT/UPDATE/DELETE, just like in the case of MyISAM. No need to delay
invalidation to the transaction commit.

2) To store or retrieve a value from the query cache of an InnoDB table TBL,
any query must first ask InnoDB's permission. We must pass the thd as a
parameter because InnoDB will look at the trx id, if any, associated with
that thd.

3) Use of the query cache for InnoDB tables is now allowed also when
AUTOCOMMIT==0 or we are inside BEGIN ... COMMIT. Thus transactions no longer
put restrictions on the use of the query cache.
*/

/**********************************************************************
The MySQL query cache uses this to check from InnoDB if the query cache at
the moment is allowed to operate on an InnoDB table. The SQL query must
be a non-locking SELECT.

The query cache is allowed to operate on certain query only if this function
returns TRUE for all tables in the query.

If thd is not in the autocommit state, this function also starts a new
transaction for thd if there is no active trx yet, and assigns a consistent
read view to it if there is no read view yet.

Why a deadlock of threads is not possible: the query cache calls this function
at the start of a SELECT processing. Then the calling thread cannot be
holding any InnoDB semaphores. The calling thread is holding the
query cache mutex, and this function will reserve the InnoDB kernel mutex.
Thus, the 'rank' in sync0sync.h of the MySQL query cache mutex is above
the InnoDB kernel mutex. */
marko's avatar
marko committed
1119
static
osku's avatar
osku committed
1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134
my_bool
innobase_query_caching_of_table_permitted(
/*======================================*/
				/* out: TRUE if permitted, FALSE if not;
				note that the value FALSE does not mean
				we should invalidate the query cache:
				invalidation is called explicitly */
	THD*	thd,		/* in: thd of the user who is trying to
				store a result to the query cache or
				retrieve it */
	char*	full_name,	/* in: concatenation of database name,
				the null character '\0', and the table
				name */
	uint	full_name_len,	/* in: length of the full name, i.e.
				len(dbname) + len(tablename) + 1 */
1135
	ulonglong *unused)	/* unused for this engine */
osku's avatar
osku committed
1136 1137 1138 1139 1140 1141 1142
{
	ibool	is_autocommit;
	trx_t*	trx;
	char	norm_name[1000];

	ut_a(full_name_len < 999);

1143
	trx = check_trx_exists(thd);
1144 1145

	if (trx->isolation_level == TRX_ISO_SERIALIZABLE) {
osku's avatar
osku committed
1146 1147
		/* In the SERIALIZABLE mode we add LOCK IN SHARE MODE to every
		plain SELECT if AUTOCOMMIT is not on. */
1148

osku's avatar
osku committed
1149 1150 1151 1152 1153 1154 1155
		return((my_bool)FALSE);
	}

	if (trx->has_search_latch) {
		sql_print_error("The calling thread is holding the adaptive "
				"search, latch though calling "
				"innobase_query_caching_of_table_permitted.");
jan's avatar
jan committed
1156

jan's avatar
jan committed
1157
		mutex_enter_noninline(&kernel_mutex);
jan's avatar
jan committed
1158
		trx_print(stderr, trx, 1024);
jan's avatar
jan committed
1159
		mutex_exit_noninline(&kernel_mutex);
osku's avatar
osku committed
1160 1161 1162 1163
	}

	innobase_release_stat_resources(trx);

1164
	if (!thd_test_options(thd, OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN)) {
osku's avatar
osku committed
1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192

		is_autocommit = TRUE;
	} else {
		is_autocommit = FALSE;

	}

	if (is_autocommit && trx->n_mysql_tables_in_use == 0) {
		/* We are going to retrieve the query result from the query
		cache. This cannot be a store operation to the query cache
		because then MySQL would have locks on tables already.

		TODO: if the user has used LOCK TABLES to lock the table,
		then we open a transaction in the call of row_.. below.
		That trx can stay open until UNLOCK TABLES. The same problem
		exists even if we do not use the query cache. MySQL should be
		modified so that it ALWAYS calls some cleanup function when
		the processing of a query ends!

		We can imagine we instantaneously serialize this consistent
		read trx to the current trx id counter. If trx2 would have
		changed the tables of a query result stored in the cache, and
		trx2 would have already committed, making the result obsolete,
		then trx2 would have already invalidated the cache. Thus we
		can trust the result in the cache is ok for this query. */

		return((my_bool)TRUE);
	}
1193

osku's avatar
osku committed
1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206
	/* Normalize the table name to InnoDB format */

	memcpy(norm_name, full_name, full_name_len);

	norm_name[strlen(norm_name)] = '/'; /* InnoDB uses '/' as the
					    separator between db and table */
	norm_name[full_name_len] = '\0';
#ifdef __WIN__
	innobase_casedn_str(norm_name);
#endif
	/* The call of row_search_.. will start a new transaction if it is
	not yet started */

1207
	if (trx->active_trans == 0) {
osku's avatar
osku committed
1208

1209
		innobase_register_trx_and_stmt(innodb_hton_ptr, thd);
1210 1211
		trx->active_trans = 1;
	}
osku's avatar
osku committed
1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246

	if (row_search_check_if_query_cache_permitted(trx, norm_name)) {

		/* printf("Query cache for %s permitted\n", norm_name); */

		return((my_bool)TRUE);
	}

	/* printf("Query cache for %s NOT permitted\n", norm_name); */

	return((my_bool)FALSE);
}

/*********************************************************************
Invalidates the MySQL query cache for the table.
NOTE that the exact prototype of this function has to be in
/innobase/row/row0ins.c! */
extern "C"
void
innobase_invalidate_query_cache(
/*============================*/
	trx_t*	trx,		/* in: transaction which modifies the table */
	char*	full_name,	/* in: concatenation of database name, null
				char '\0', table name, null char'\0';
				NOTE that in Windows this is always
				in LOWER CASE! */
	ulint	full_name_len)	/* in: full name length where also the null
				chars count */
{
	/* Note that the sync0sync.h rank of the query cache mutex is just
	above the InnoDB kernel mutex. The caller of this function must not
	have latches of a lower rank. */

#ifdef HAVE_QUERY_CACHE
	THD*	thd = (THD*) trx->mysql_thd;

	/* Argument TRUE below means we are using transactions */
	mysql_query_cache_invalidate4(thd,
				      (const char*) full_name,
				      (uint32) full_name_len,
				      TRUE);
#endif
}

/*********************************************************************
1255
Display an SQL identifier. */
osku's avatar
osku committed
1256
extern "C"
1257 1258 1259 1260
void
innobase_print_identifier(
/*======================*/
	FILE*		f,	/* in: output stream */
osku's avatar
osku committed
1261
	trx_t*		trx,	/* in: transaction */
1262 1263
	ibool		table_id,/* in: TRUE=print a table name,
				FALSE=print other identifier */
osku's avatar
osku committed
1264 1265 1266
	const char*	name,	/* in: name to print */
	ulint		namelen)/* in: length of name */
{
1267 1268 1269 1270 1271 1272 1273 1274 1275 1276
	const char*	s	= name;
	char*		qname	= NULL;
	int		q;

	if (table_id) {
		/* Decode the table name.  The filename_to_tablename()
		function expects a NUL-terminated string.  The input and
		output strings buffers must not be shared.  The function
		only produces more output when the name contains other
		characters than [0-9A-Z_a-z]. */
marko's avatar
marko committed
1277
          char*	temp_name = (char*) my_malloc((uint) namelen + 1, MYF(MY_WME));
marko's avatar
marko committed
1278 1279
          uint	qnamelen = (uint) (namelen
                                   + (1 + sizeof srv_mysql50_table_name_prefix));
1280 1281

		if (temp_name) {
marko's avatar
marko committed
1282
                  qname = (char*) my_malloc(qnamelen, MYF(MY_WME));
1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293
			if (qname) {
				memcpy(temp_name, name, namelen);
				temp_name[namelen] = 0;
				s = qname;
				namelen = filename_to_tablename(temp_name,
						qname, qnamelen);
			}
			my_free(temp_name, MYF(0));
		}
	}

osku's avatar
osku committed
1294
	if (!trx || !trx->mysql_thd) {
1295 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313 1314

		q = '"';
	} else {
		q = get_quote_char_for_identifier((THD*) trx->mysql_thd,
						s, (int) namelen);
	}

	if (q == EOF) {
		fwrite(s, 1, namelen, f);
	} else {
		const char*	e = s + namelen;
		putc(q, f);
		while (s < e) {
			int	c = *s++;
			if (c == q) {
				putc(c, f);
			}
			putc(c, f);
		}
		putc(q, f);
osku's avatar
osku committed
1315
	}
1316 1317

	my_free(qname, MYF(MY_ALLOW_ZERO_PTR));
osku's avatar
osku committed
1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328
}

/**************************************************************************
Determines if the currently running transaction has been interrupted. */
extern "C"
ibool
trx_is_interrupted(
/*===============*/
			/* out: TRUE if interrupted */
	trx_t*	trx)	/* in: transaction */
{
	/* A missing transaction, or one without a MySQL thd, is reported
	as not interrupted */
	if (!trx || !trx->mysql_thd) {

		return(FALSE);
	}

	return(thd_killed((THD*) trx->mysql_thd) ? TRUE : FALSE);
}

1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344
/******************************************************************
Resets some fields of a prebuilt struct. The template is used in fast
retrieval of just those column values MySQL needs in its processing. */
static
void
reset_template(
/*===========*/
	row_prebuilt_t*	prebuilt)	/* in/out: prebuilt struct */
{
	/* Both fields are cleared to 0; the two assignments are
	independent of each other. */
	prebuilt->read_just_key = 0;
	prebuilt->keep_other_fields_on_keyread = 0;
}

osku's avatar
osku committed
1345 1346 1347 1348 1349 1350 1351 1352 1353 1354 1355
/*********************************************************************
Call this when you have opened a new table handle in HANDLER, before you
call index_read_idx() etc. Actually, we can let the cursor stay open even
over a transaction commit! Then you should call this before every operation,
fetch next etc. This function inits the necessary things even after a
transaction commit. */

void
ha_innobase::init_table_handle_for_HANDLER(void)
/*============================================*/
{
1356 1357 1358 1359
	/* If current thd does not yet have a trx struct, create one.
	If the current handle does not yet have a prebuilt struct, create
	one. Update the trx pointers in the prebuilt struct. Normally
	this operation is done in external_lock. */
osku's avatar
osku committed
1360

1361
	update_thd(ha_thd());
osku's avatar
osku committed
1362

1363 1364
	/* Initialize the prebuilt struct much like it would be inited in
	external_lock */
osku's avatar
osku committed
1365 1366 1367

	innobase_release_stat_resources(prebuilt->trx);

1368
	/* If the transaction is not started yet, start it */
osku's avatar
osku committed
1369

1370
	trx_start_if_not_started_noninline(prebuilt->trx);
osku's avatar
osku committed
1371

1372
	/* Assign a read view if the transaction does not have it yet */
osku's avatar
osku committed
1373

1374
	trx_assign_read_view(prebuilt->trx);
osku's avatar
osku committed
1375 1376 1377

	/* Set the MySQL flag to mark that there is an active transaction */

1378
	if (prebuilt->trx->active_trans == 0) {
osku's avatar
osku committed
1379

1380
		innobase_register_trx_and_stmt(ht, user_thd);
osku's avatar
osku committed
1381

1382 1383
		prebuilt->trx->active_trans = 1;
	}
osku's avatar
osku committed
1384

1385 1386
	/* We did the necessary inits in this function, no need to repeat them
	in row_search_for_mysql */
osku's avatar
osku committed
1387

1388
	prebuilt->sql_stat_start = FALSE;
osku's avatar
osku committed
1389

1390 1391
	/* We let HANDLER always to do the reads as consistent reads, even
	if the trx isolation level would have been specified as SERIALIZABLE */
osku's avatar
osku committed
1392

1393 1394
	prebuilt->select_lock_type = LOCK_NONE;
	prebuilt->stored_select_lock_type = LOCK_NONE;
osku's avatar
osku committed
1395

1396
	/* Always fetch all columns in the index record */
osku's avatar
osku committed
1397

1398
	prebuilt->hint_need_to_fetch_extra_cols = ROW_RETRIEVE_ALL_COLS;
osku's avatar
osku committed
1399

1400
	/* We want always to fetch all columns in the whole row? Or do
osku's avatar
osku committed
1401 1402 1403
	we???? */

	prebuilt->used_in_HANDLER = TRUE;
1404
	reset_template(prebuilt);
osku's avatar
osku committed
1405 1406 1407 1408
}

/*************************************************************************
Opens an InnoDB database. */
1409
static
marko's avatar
marko committed
1410
int
1411 1412 1413 1414
innobase_init(
/*==========*/
			/* out: 0 on success, error code on failure */
	void	*p)	/* in: InnoDB handlerton */
osku's avatar
osku committed
1415 1416 1417 1418
{
	static char	current_dir[3];		/* Set if using current lib */
	int		err;
	bool		ret;
1419
	char		*default_path;
osku's avatar
osku committed
1420

1421
	DBUG_ENTER("innobase_init");
1422
        handlerton *innobase_hton= (handlerton *)p;
1423
        innodb_hton_ptr = innobase_hton;
marko's avatar
marko committed
1424

1425
        innobase_hton->state = SHOW_OPTION_YES;
marko's avatar
marko committed
1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448
        innobase_hton->db_type= DB_TYPE_INNODB;
        innobase_hton->savepoint_offset=sizeof(trx_named_savept_t);
        innobase_hton->close_connection=innobase_close_connection;
        innobase_hton->savepoint_set=innobase_savepoint;
        innobase_hton->savepoint_rollback=innobase_rollback_to_savepoint;
        innobase_hton->savepoint_release=innobase_release_savepoint;
        innobase_hton->commit=innobase_commit;
        innobase_hton->rollback=innobase_rollback;
        innobase_hton->prepare=innobase_xa_prepare;
        innobase_hton->recover=innobase_xa_recover;
        innobase_hton->commit_by_xid=innobase_commit_by_xid;
        innobase_hton->rollback_by_xid=innobase_rollback_by_xid;
        innobase_hton->create_cursor_read_view=innobase_create_cursor_view;
        innobase_hton->set_cursor_read_view=innobase_set_cursor_view;
        innobase_hton->close_cursor_read_view=innobase_close_cursor_view;
        innobase_hton->create=innobase_create_handler;
        innobase_hton->drop_database=innobase_drop_database;
        innobase_hton->panic=innobase_end;
        innobase_hton->start_consistent_snapshot=innobase_start_trx_and_assign_read_view;
        innobase_hton->flush_logs=innobase_flush_logs;
        innobase_hton->show_status=innobase_show_status;
        innobase_hton->flags=HTON_NO_FLAGS;
        innobase_hton->release_temporary_latches=innobase_release_temporary_latches;
marko's avatar
marko committed
1449

osku's avatar
osku committed
1450 1451
	ut_a(DATA_MYSQL_TRUE_VARCHAR == (ulint)MYSQL_TYPE_VARCHAR);

1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469
#ifdef UNIV_DEBUG
	static const char	test_filename[] = "-@";
	char			test_tablename[sizeof test_filename
				+ sizeof srv_mysql50_table_name_prefix];
	if ((sizeof test_tablename) - 1
			!= filename_to_tablename(test_filename, test_tablename,
			sizeof test_tablename)
			|| strncmp(test_tablename,
			srv_mysql50_table_name_prefix,
			sizeof srv_mysql50_table_name_prefix)
			|| strcmp(test_tablename
			+ sizeof srv_mysql50_table_name_prefix,
			test_filename)) {
		sql_print_error("tablename encoding has been changed");
		goto error;
	}
#endif /* UNIV_DEBUG */

1470 1471 1472 1473 1474 1475 1476
	/* Check that values don't overflow on 32-bit systems. */
	if (sizeof(ulint) == 4) {
		if (innobase_buffer_pool_size > UINT_MAX32) {
			sql_print_error(
				"innobase_buffer_pool_size can't be over 4GB"
				" on 32-bit systems");

osku's avatar
osku committed
1477
			goto error;
1478 1479 1480 1481 1482 1483 1484
		}

		if (innobase_log_file_size > UINT_MAX32) {
			sql_print_error(
				"innobase_log_file_size can't be over 4GB"
				" on 32-bit systems");

osku's avatar
osku committed
1485
			goto error;
1486 1487 1488
		}
	}

1489
	os_innodb_umask = (ulint)my_umask;
osku's avatar
osku committed
1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500

	/* First calculate the default path for innodb_data_home_dir etc.,
	in case the user has not given any value.

	Note that when using the embedded server, the datadirectory is not
	necessarily the current directory of this program. */

	if (mysqld_embedded) {
		default_path = mysql_real_data_home;
		fil_path_to_mysql_datadir = mysql_real_data_home;
	} else {
1501 1502 1503 1504 1505
		/* It's better to use current lib, to keep paths short */
		current_dir[0] = FN_CURLIB;
		current_dir[1] = FN_LIBCHAR;
		current_dir[2] = 0;
		default_path = current_dir;
osku's avatar
osku committed
1506 1507 1508 1509 1510
	}

	ut_a(default_path);

	if (specialflag & SPECIAL_NO_PRIOR) {
1511
		srv_set_thread_priorities = FALSE;
osku's avatar
osku committed
1512
	} else {
1513 1514
		srv_set_thread_priorities = TRUE;
		srv_query_thread_priority = QUERY_PRIOR;
osku's avatar
osku committed
1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 1525 1526 1527
	}

	/* Set InnoDB initialization parameters according to the values
	read from MySQL .cnf file */

	/*--------------- Data files -------------------------*/

	/* The default dir for data files is the datadir of MySQL */

	srv_data_home = (innobase_data_home_dir ? innobase_data_home_dir :
			 default_path);

	/* Set default InnoDB data file size to 10 MB and let it be
1528
	auto-extending. Thus users can use InnoDB in >= 4.0 without having
osku's avatar
osku committed
1529 1530 1531
	to specify any startup options. */

	if (!innobase_data_file_path) {
1532
		innobase_data_file_path = (char*) "ibdata1:10M:autoextend";
osku's avatar
osku committed
1533 1534 1535 1536 1537 1538 1539 1540 1541 1542 1543 1544 1545 1546 1547 1548 1549
	}

	/* Since InnoDB edits the argument in the next call, we make another
	copy of it: */

	internal_innobase_data_file_path = my_strdup(innobase_data_file_path,
						   MYF(MY_FAE));

	ret = (bool) srv_parse_data_file_paths_and_sizes(
				internal_innobase_data_file_path,
				&srv_data_file_names,
				&srv_data_file_sizes,
				&srv_data_file_is_raw_partition,
				&srv_n_data_files,
				&srv_auto_extend_last_data_file,
				&srv_last_file_size_max);
	if (ret == FALSE) {
1550
		sql_print_error(
osku's avatar
osku committed
1551
			"InnoDB: syntax error in innodb_data_file_path");
1552
		my_free(internal_innobase_data_file_path,
osku's avatar
osku committed
1553
						MYF(MY_ALLOW_ZERO_PTR));
1554
		goto error;
osku's avatar
osku committed
1555 1556 1557 1558 1559
	}

	/* -------------- Log files ---------------------------*/

	/* The default dir for log files is the datadir of MySQL */
1560

osku's avatar
osku committed
1561
	if (!innobase_log_group_home_dir) {
1562
		innobase_log_group_home_dir = default_path;
osku's avatar
osku committed
1563 1564
	}

1565
#ifdef UNIV_LOG_ARCHIVE
osku's avatar
osku committed
1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578 1579 1580 1581 1582
	/* Since innodb_log_arch_dir has no relevance under MySQL,
	starting from 4.0.6 we always set it the same as
	innodb_log_group_home_dir: */

	innobase_log_arch_dir = innobase_log_group_home_dir;

	srv_arch_dir = innobase_log_arch_dir;
#endif /* UNIV_LOG_ARCHIVE */

	ret = (bool)
		srv_parse_log_group_home_dirs(innobase_log_group_home_dir,
						&srv_log_group_home_dirs);

	if (ret == FALSE || innobase_mirrored_log_groups != 1) {
	  sql_print_error("syntax error in innodb_log_group_home_dir, or a "
			  "wrong number of mirrored log groups");

1583
		my_free(internal_innobase_data_file_path,
osku's avatar
osku committed
1584
						MYF(MY_ALLOW_ZERO_PTR));
1585
		goto error;
osku's avatar
osku committed
1586 1587 1588 1589 1590 1591 1592 1593 1594 1595 1596 1597 1598 1599 1600
	}

	/* --------------------------------------------------*/

	srv_file_flush_method_str = innobase_unix_file_flush_method;

	srv_n_log_groups = (ulint) innobase_mirrored_log_groups;
	srv_n_log_files = (ulint) innobase_log_files_in_group;
	srv_log_file_size = (ulint) innobase_log_file_size;

#ifdef UNIV_LOG_ARCHIVE
	srv_log_archive_on = (ulint) innobase_log_archive;
#endif /* UNIV_LOG_ARCHIVE */
	srv_log_buffer_size = (ulint) innobase_log_buffer_size;

1601 1602 1603 1604
	/* We set srv_pool_size here in units of 1 kB. InnoDB internally
	changes the value so that it becomes the number of database pages. */

	if (innobase_buffer_pool_awe_mem_mb == 0) {
1605
		srv_pool_size = (ulint)(innobase_buffer_pool_size / 1024);
1606 1607 1608 1609 1610 1611 1612 1613 1614 1615 1616
	} else {
		srv_use_awe = TRUE;
		srv_pool_size = (ulint)
				(1024 * innobase_buffer_pool_awe_mem_mb);
		srv_awe_window_size = (ulint) innobase_buffer_pool_size;

		/* Note that what the user specified as
		innodb_buffer_pool_size is actually the AWE memory window
		size in this case, and the real buffer pool size is
		determined by .._awe_mem_mb. */
	}
osku's avatar
osku committed
1617 1618 1619 1620 1621 1622 1623 1624 1625 1626 1627

	srv_mem_pool_size = (ulint) innobase_additional_mem_pool_size;

	srv_n_file_io_threads = (ulint) innobase_file_io_threads;

	srv_lock_wait_timeout = (ulint) innobase_lock_wait_timeout;
	srv_force_recovery = (ulint) innobase_force_recovery;

	srv_use_doublewrite_buf = (ibool) innobase_use_doublewrite;
	srv_use_checksums = (ibool) innobase_use_checksums;

1628 1629 1630 1631
#ifdef HAVE_LARGE_PAGES
        if ((os_use_large_pages = (ibool) my_use_large_pages))
		os_large_page_size = (ulint) opt_large_page_size;
#endif
1632

osku's avatar
osku committed
1633 1634
	row_rollback_on_timeout = (ibool) innobase_rollback_on_timeout;

osku's avatar
osku committed
1635
	srv_file_per_table = (ibool) innobase_file_per_table;
1636
	srv_locks_unsafe_for_binlog = (ibool) innobase_locks_unsafe_for_binlog;
osku's avatar
osku committed
1637 1638 1639 1640

	srv_max_n_open_files = (ulint) innobase_open_files;
	srv_innodb_status = (ibool) innobase_create_status_file;

marko's avatar
marko committed
1641 1642
	srv_stats_on_metadata = (ibool) innobase_stats_on_metadata;

1643
	srv_use_adaptive_hash_indexes =
vasil's avatar
vasil committed
1644
		(ibool) innobase_adaptive_hash_index;
1645

osku's avatar
osku committed
1646 1647 1648 1649 1650 1651 1652 1653 1654
	srv_print_verbose_log = mysqld_embedded ? 0 : 1;

	/* Store the default charset-collation number of this MySQL
	installation */

	data_mysql_default_charset_coll = (ulint)default_charset_info->number;

	ut_a(DATA_MYSQL_LATIN1_SWEDISH_CHARSET_COLL ==
					my_charset_latin1.number);
1655
	ut_a(DATA_MYSQL_BINARY_CHARSET_COLL == my_charset_bin.number);
osku's avatar
osku committed
1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 1666

	/* Store the latin1_swedish_ci character ordering table to InnoDB. For
	non-latin1_swedish_ci charsets we use the MySQL comparison functions,
	and consequently we do not need to know the ordering internally in
	InnoDB. */

	ut_a(0 == strcmp((char*)my_charset_latin1.name,
						(char*)"latin1_swedish_ci"));
	memcpy(srv_latin1_ordering, my_charset_latin1.sort_order, 256);

	/* Since we in this module access directly the fields of a trx
1667
	struct, and due to different headers and flags it might happen that
osku's avatar
osku committed
1668 1669 1670 1671 1672 1673 1674 1675 1676
	mutex_t has a different size in this module and in InnoDB
	modules, we check at run time that the size is the same in
	these compilation modules. */

	srv_sizeof_trx_t_in_ha_innodb_cc = sizeof(trx_t);

	err = innobase_start_or_create_for_mysql();

	if (err != DB_SUCCESS) {
1677
		my_free(internal_innobase_data_file_path,
osku's avatar
osku committed
1678
						MYF(MY_ALLOW_ZERO_PTR));
1679
		goto error;
osku's avatar
osku committed
1680 1681 1682
	}

	(void) hash_init(&innobase_open_tables,system_charset_info, 32, 0, 0,
1683 1684 1685 1686 1687 1688
					(hash_get_key) innobase_get_key, 0, 0);
	pthread_mutex_init(&innobase_share_mutex, MY_MUTEX_INIT_FAST);
	pthread_mutex_init(&prepare_commit_mutex, MY_MUTEX_INIT_FAST);
	pthread_mutex_init(&commit_threads_m, MY_MUTEX_INIT_FAST);
	pthread_mutex_init(&commit_cond_m, MY_MUTEX_INIT_FAST);
	pthread_cond_init(&commit_cond, NULL);
osku's avatar
osku committed
1689 1690 1691 1692
	innodb_inited= 1;

	DBUG_RETURN(FALSE);
error:
1693
	DBUG_RETURN(TRUE);
osku's avatar
osku committed
1694 1695 1696 1697
}

/***********************************************************************
Closes an InnoDB database. */
1698
static
osku's avatar
osku committed
1699
int
1700
innobase_end(handlerton *hton, ha_panic_function type)
osku's avatar
osku committed
1701 1702 1703 1704 1705 1706 1707
/*==============*/
				/* out: TRUE if error */
{
	int	err= 0;

	DBUG_ENTER("innobase_end");

1708
#ifdef __NETWARE__	/* some special cleanup for NetWare */
osku's avatar
osku committed
1709 1710 1711 1712 1713 1714
	if (nw_panic) {
		set_panic_flag_for_netware();
	}
#endif
	if (innodb_inited) {

1715 1716 1717 1718
		srv_fast_shutdown = (ulint) innobase_fast_shutdown;
		innodb_inited = 0;
		if (innobase_shutdown_for_mysql() != DB_SUCCESS) {
			err = 1;
osku's avatar
osku committed
1719
		}
1720 1721
		hash_free(&innobase_open_tables);
		my_free(internal_innobase_data_file_path,
osku's avatar
osku committed
1722
						MYF(MY_ALLOW_ZERO_PTR));
1723 1724 1725 1726 1727
		pthread_mutex_destroy(&innobase_share_mutex);
		pthread_mutex_destroy(&prepare_commit_mutex);
		pthread_mutex_destroy(&commit_threads_m);
		pthread_mutex_destroy(&commit_cond_m);
		pthread_cond_destroy(&commit_cond);
osku's avatar
osku committed
1728 1729
	}

1730
	DBUG_RETURN(err);
osku's avatar
osku committed
1731 1732 1733 1734 1735
}

/********************************************************************
Flushes InnoDB logs to disk and makes a checkpoint. Really, a commit flushes
the logs, and the name of this function should be innobase_checkpoint. */
1736
static
osku's avatar
osku committed
1737
bool
1738
innobase_flush_logs(handlerton *hton)
osku's avatar
osku committed
1739 1740 1741
/*=====================*/
				/* out: TRUE if error */
{
1742
	bool	result = 0;
osku's avatar
osku committed
1743

1744
	DBUG_ENTER("innobase_flush_logs");
osku's avatar
osku committed
1745 1746 1747

	log_buffer_flush_to_disk();

1748
	DBUG_RETURN(result);
osku's avatar
osku committed
1749 1750 1751 1752
}

/*********************************************************************
Commits a transaction in an InnoDB database. */
1753
static
osku's avatar
osku committed
1754 1755 1756 1757 1758
void
innobase_commit_low(
/*================*/
	trx_t*	trx)	/* in: transaction handle */
{
1759
	if (trx->conc_state == TRX_NOT_STARTED) {
osku's avatar
osku committed
1760

1761 1762
		return;
	}
osku's avatar
osku committed
1763 1764 1765 1766 1767 1768 1769 1770 1771

	trx_commit_for_mysql(trx);
}

/*********************************************************************
Creates an InnoDB transaction struct for the thd if it does not yet have one.
Starts a new InnoDB transaction if a transaction is not yet started. And
assigns a new snapshot for a consistent read if the transaction does not yet
have one. */
1772
static
osku's avatar
osku committed
1773 1774 1775 1776
int
innobase_start_trx_and_assign_read_view(
/*====================================*/
			/* out: 0 */
1777
        handlerton *hton, /* in: Innodb handlerton */ 
osku's avatar
osku committed
1778 1779 1780 1781 1782
	THD*	thd)	/* in: MySQL thread handle of the user for whom
			the transaction should be committed */
{
	trx_t*	trx;

1783
	DBUG_ENTER("innobase_start_trx_and_assign_read_view");
osku's avatar
osku committed
1784 1785 1786

	/* Create a new trx struct for thd, if it does not yet have one */

1787
	trx = check_trx_exists(thd);
osku's avatar
osku committed
1788 1789 1790 1791 1792 1793 1794 1795 1796 1797 1798 1799 1800 1801 1802 1803 1804

	/* This is just to play safe: release a possible FIFO ticket and
	search latch. Since we will reserve the kernel mutex, we have to
	release the search system latch first to obey the latching order. */

	innobase_release_stat_resources(trx);

	/* If the transaction is not started yet, start it */

	trx_start_if_not_started_noninline(trx);

	/* Assign a read view if the transaction does not have it yet */

	trx_assign_read_view(trx);

	/* Set the MySQL flag to mark that there is an active transaction */

1805
	if (trx->active_trans == 0) {
1806
		innobase_register_trx_and_stmt(hton, current_thd);
1807 1808
		trx->active_trans = 1;
	}
osku's avatar
osku committed
1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820

	DBUG_RETURN(0);
}

/*********************************************************************
Commits a transaction in an InnoDB database or marks an SQL statement
ended. */
static
int
innobase_commit(
/*============*/
			/* out: 0 */
1821 1822
        handlerton *hton, /* in: Innodb handlerton */ 
	THD* 	thd,	/* in: MySQL thread handle of the user for whom
osku's avatar
osku committed
1823
			the transaction should be committed */
1824 1825
	bool	all)	/* in:	TRUE - commit transaction
				FALSE - the current SQL statement ended */
osku's avatar
osku committed
1826 1827 1828
{
	trx_t*		trx;

1829 1830
	DBUG_ENTER("innobase_commit");
	DBUG_PRINT("trans", ("ending transaction"));
osku's avatar
osku committed
1831

1832
	trx = check_trx_exists(thd);
osku's avatar
osku committed
1833 1834

	/* Update the info whether we should skip XA steps that eat CPU time */
1835
	trx->support_xa = THDVAR(thd, support_xa);
osku's avatar
osku committed
1836

1837 1838
	/* Since we will reserve the kernel mutex, we have to release
	the search system latch first to obey the latching order. */
osku's avatar
osku committed
1839

1840
	if (trx->has_search_latch) {
1841
		trx_search_latch_release_if_reserved(trx);
1842 1843 1844
	}

	/* The flag trx->active_trans is set to 1 in
osku's avatar
osku committed
1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858

	1. ::external_lock(),
	2. ::start_stmt(),
	3. innobase_query_caching_of_table_permitted(),
	4. innobase_savepoint(),
	5. ::init_table_handle_for_HANDLER(),
	6. innobase_start_trx_and_assign_read_view(),
	7. ::transactional_table_lock()

	and it is only set to 0 in a commit or a rollback. If it is 0 we know
	there cannot be resources to be freed and we could return immediately.
	For the time being, we play safe and do the cleanup though there should
	be nothing to clean up. */

1859 1860 1861 1862 1863
	if (trx->active_trans == 0
		&& trx->conc_state != TRX_NOT_STARTED) {

		sql_print_error("trx->active_trans == 0, but"
			" trx->conc_state != TRX_NOT_STARTED");
osku's avatar
osku committed
1864
	}
1865
	if (all
1866
		|| (!thd_test_options(thd, OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN))) {
1867 1868

		/* We were instructed to commit the whole transaction, or
osku's avatar
osku committed
1869 1870
		this is an SQL statement end and autocommit is on */

1871 1872 1873
		/* We need current binlog position for ibbackup to work.
		Note, the position is current because of
		prepare_commit_mutex */
osku's avatar
osku committed
1874
retry:
1875 1876 1877 1878 1879 1880 1881 1882 1883 1884 1885 1886 1887 1888 1889 1890
		if (srv_commit_concurrency > 0) {
			pthread_mutex_lock(&commit_cond_m);
			commit_threads++;

			if (commit_threads > srv_commit_concurrency) {
				commit_threads--;
				pthread_cond_wait(&commit_cond,
					&commit_cond_m);
				pthread_mutex_unlock(&commit_cond_m);
				goto retry;
			}
			else {
				pthread_mutex_unlock(&commit_cond_m);
			}
		}

1891 1892
		trx->mysql_log_file_name = mysql_bin_log_file_name();
		trx->mysql_log_offset = (ib_longlong) mysql_bin_log_file_pos();
osku's avatar
osku committed
1893 1894 1895

		innobase_commit_low(trx);

1896
		if (srv_commit_concurrency > 0) {
1897 1898 1899 1900 1901 1902 1903 1904 1905 1906 1907 1908 1909
			pthread_mutex_lock(&commit_cond_m);
			commit_threads--;
			pthread_cond_signal(&commit_cond);
			pthread_mutex_unlock(&commit_cond_m);
		}

		if (trx->active_trans == 2) {

			pthread_mutex_unlock(&prepare_commit_mutex);
		}

		trx->active_trans = 0;

osku's avatar
osku committed
1910
	} else {
1911
		/* We just mark the SQL statement ended and do not do a
osku's avatar
osku committed
1912 1913
		transaction commit */

marko's avatar
marko committed
1914 1915 1916 1917
		/* If we had reserved the auto-inc lock for some
		table in this SQL statement we release it now */

		row_unlock_table_autoinc_for_mysql(trx);
1918

osku's avatar
osku committed
1919 1920 1921 1922 1923 1924 1925
		/* Store the current undo_no of the transaction so that we
		know where to roll back if we have to roll back the next
		SQL statement */

		trx_mark_sql_stat_end(trx);
	}

1926 1927
	trx->n_autoinc_rows = 0; /* Reset the number AUTO-INC rows required */

1928
	if (trx->declared_to_be_inside_innodb) {
1929
		/* Release our possible ticket in the FIFO */
osku's avatar
osku committed
1930

1931
		srv_conc_force_exit_innodb(trx);
1932
	}
1933 1934 1935

	/* Tell the InnoDB server that there might be work for utility
	threads: */
osku's avatar
osku committed
1936 1937 1938 1939 1940 1941 1942
	srv_active_wake_master_thread();

	DBUG_RETURN(0);
}

/*********************************************************************
Rolls back a transaction or the latest SQL statement. */
1943 1944
static
int
osku's avatar
osku committed
1945 1946 1947
innobase_rollback(
/*==============*/
			/* out: 0 or error number */
1948
        handlerton *hton, /* in: Innodb handlerton */ 
osku's avatar
osku committed
1949 1950
	THD*	thd,	/* in: handle to the MySQL thread of the user
			whose transaction should be rolled back */
1951 1952
	bool	all)	/* in:	TRUE - commit transaction
				FALSE - the current SQL statement ended */
osku's avatar
osku committed
1953 1954 1955 1956 1957 1958 1959
{
	int	error = 0;
	trx_t*	trx;

	DBUG_ENTER("innobase_rollback");
	DBUG_PRINT("trans", ("aborting transaction"));

1960
	trx = check_trx_exists(thd);
osku's avatar
osku committed
1961 1962

	/* Update the info whether we should skip XA steps that eat CPU time */
1963
	trx->support_xa = THDVAR(thd, support_xa);
osku's avatar
osku committed
1964 1965 1966 1967 1968 1969 1970

	/* Release a possible FIFO ticket and search latch. Since we will
	reserve the kernel mutex, we have to release the search system latch
	first to obey the latching order. */

	innobase_release_stat_resources(trx);

marko's avatar
marko committed
1971 1972 1973
	/* If we had reserved the auto-inc lock for some table (if
	we come here to roll back the latest SQL statement) we
	release it now before a possibly lengthy rollback */
1974

marko's avatar
marko committed
1975
	row_unlock_table_autoinc_for_mysql(trx);
osku's avatar
osku committed
1976

1977
	if (all
1978
		|| !thd_test_options(thd, OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN)) {
osku's avatar
osku committed
1979 1980

		error = trx_rollback_for_mysql(trx);
1981
		trx->active_trans = 0;
osku's avatar
osku committed
1982 1983 1984 1985 1986 1987 1988 1989 1990
	} else {
		error = trx_rollback_last_sql_stat_for_mysql(trx);
	}

	DBUG_RETURN(convert_error_code_to_mysql(error, NULL));
}

/*********************************************************************
Rolls back a transaction */
1991
static
osku's avatar
osku committed
1992 1993 1994 1995 1996 1997 1998 1999 2000 2001 2002 2003 2004 2005 2006 2007 2008
int
innobase_rollback_trx(
/*==================*/
			/* out: 0 or error number */
	trx_t*	trx)	/*  in: transaction */
{
	int	error = 0;

	DBUG_ENTER("innobase_rollback_trx");
	DBUG_PRINT("trans", ("aborting transaction"));

	/* Release a possible FIFO ticket and search latch. Since we will
	reserve the kernel mutex, we have to release the search system latch
	first to obey the latching order. */

	innobase_release_stat_resources(trx);

marko's avatar
marko committed
2009 2010 2011
	/* If we had reserved the auto-inc lock for some table (if
	we come here to roll back the latest SQL statement) we
	release it now before a possibly lengthy rollback */
2012

marko's avatar
marko committed
2013
	row_unlock_table_autoinc_for_mysql(trx);
osku's avatar
osku committed
2014 2015 2016 2017 2018 2019 2020 2021

	error = trx_rollback_for_mysql(trx);

	DBUG_RETURN(convert_error_code_to_mysql(error, NULL));
}

/*********************************************************************
Rolls back a transaction to a savepoint. */
2022 2023
static
int
osku's avatar
osku committed
2024 2025 2026 2027
innobase_rollback_to_savepoint(
/*===========================*/
				/* out: 0 if success, HA_ERR_NO_SAVEPOINT if
				no savepoint with the given name */
2028
        handlerton *hton,       /* in: Innodb handlerton */ 
osku's avatar
osku committed
2029 2030
	THD*	thd,		/* in: handle to the MySQL thread of the user
				whose transaction should be rolled back */
2031
	void*	savepoint)	/* in: savepoint data */
osku's avatar
osku committed
2032
{
2033 2034 2035 2036
	ib_longlong	mysql_binlog_cache_pos;
	int		error = 0;
	trx_t*		trx;
	char		name[64];
osku's avatar
osku committed
2037 2038 2039

	DBUG_ENTER("innobase_rollback_to_savepoint");

2040
	trx = check_trx_exists(thd);
osku's avatar
osku committed
2041 2042 2043 2044 2045 2046 2047

	/* Release a possible FIFO ticket and search latch. Since we will
	reserve the kernel mutex, we have to release the search system latch
	first to obey the latching order. */

	innobase_release_stat_resources(trx);

2048
	/* TODO: use provided savepoint data area to store savepoint data */
osku's avatar
osku committed
2049

2050
	longlong2str((ulint)savepoint, name, 36);
osku's avatar
osku committed
2051

2052
	error = (int) trx_rollback_to_savepoint_for_mysql(trx, name,
osku's avatar
osku committed
2053 2054 2055 2056 2057 2058 2059 2060 2061 2062 2063 2064
						&mysql_binlog_cache_pos);
	DBUG_RETURN(convert_error_code_to_mysql(error, NULL));
}

/*********************************************************************
Release transaction savepoint name. */
static
int
innobase_release_savepoint(
/*=======================*/
				/* out: 0 if success, HA_ERR_NO_SAVEPOINT if
				no savepoint with the given name */
2065
        handlerton*	hton,	/* in: handlerton for Innodb */
osku's avatar
osku committed
2066 2067
	THD*	thd,		/* in: handle to the MySQL thread of the user
				whose transaction should be rolled back */
2068
	void*	savepoint)	/* in: savepoint data */
osku's avatar
osku committed
2069
{
2070 2071 2072
	int		error = 0;
	trx_t*		trx;
	char		name[64];
osku's avatar
osku committed
2073 2074 2075

	DBUG_ENTER("innobase_release_savepoint");

2076
	trx = check_trx_exists(thd);
osku's avatar
osku committed
2077

2078
	/* TODO: use provided savepoint data area to store savepoint data */
osku's avatar
osku committed
2079

2080
	longlong2str((ulint)savepoint, name, 36);
osku's avatar
osku committed
2081 2082 2083 2084 2085 2086 2087 2088 2089 2090 2091 2092 2093

	error = (int) trx_release_savepoint_for_mysql(trx, name);

	DBUG_RETURN(convert_error_code_to_mysql(error, NULL));
}

/*********************************************************************
Sets a transaction savepoint. */
static
int
innobase_savepoint(
/*===============*/
				/* out: always 0, that is, always succeeds */
2094
	handlerton*	hton,   /* in: handle to the Innodb handlerton */
osku's avatar
osku committed
2095
	THD*	thd,		/* in: handle to the MySQL thread */
2096
	void*	savepoint)	/* in: savepoint data */
osku's avatar
osku committed
2097 2098 2099 2100 2101 2102
{
	int	error = 0;
	trx_t*	trx;

	DBUG_ENTER("innobase_savepoint");

2103 2104 2105 2106 2107
	/*
	  In the autocommit mode there is no sense to set a savepoint
	  (unless we are in sub-statement), so SQL layer ensures that
	  this method is never called in such situation.
	*/
2108 2109
#ifdef MYSQL_SERVER /* plugins cannot access thd->in_sub_stmt */
	DBUG_ASSERT(thd_test_options(thd, OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN) ||
2110
		thd->in_sub_stmt);
2111
#endif /* MYSQL_SERVER */
osku's avatar
osku committed
2112

2113
	trx = check_trx_exists(thd);
osku's avatar
osku committed
2114 2115 2116 2117 2118 2119 2120

	/* Release a possible FIFO ticket and search latch. Since we will
	reserve the kernel mutex, we have to release the search system latch
	first to obey the latching order. */

	innobase_release_stat_resources(trx);

2121 2122
	/* cannot happen outside of transaction */
	DBUG_ASSERT(trx->active_trans);
osku's avatar
osku committed
2123

2124 2125 2126
	/* TODO: use provided savepoint data area to store savepoint data */
	char name[64];
	longlong2str((ulint)savepoint,name,36);
osku's avatar
osku committed
2127

2128
	error = (int) trx_savepoint_for_mysql(trx, name, (ib_longlong)0);
osku's avatar
osku committed
2129 2130 2131 2132 2133 2134 2135 2136 2137 2138 2139

	DBUG_RETURN(convert_error_code_to_mysql(error, NULL));
}

/*********************************************************************
Frees a possible InnoDB trx object associated with the current THD. */
static
int
innobase_close_connection(
/*======================*/
			/* out: 0 or error number */
2140
        handlerton*	hton,	/* in:  innobase handlerton */
osku's avatar
osku committed
2141 2142 2143 2144 2145
	THD*	thd)	/* in: handle to the MySQL thread of the user
			whose resources should be free'd */
{
	trx_t*	trx;

2146 2147 2148
	DBUG_ENTER("innobase_close_connection");
	DBUG_ASSERT(hton == innodb_hton_ptr);
	trx = thd_to_trx(thd);
osku's avatar
osku committed
2149 2150 2151

	ut_a(trx);

2152 2153 2154 2155 2156
	if (trx->active_trans == 0
		&& trx->conc_state != TRX_NOT_STARTED) {

		sql_print_error("trx->active_trans == 0, but"
			" trx->conc_state != TRX_NOT_STARTED");
osku's avatar
osku committed
2157 2158 2159 2160
	}


	if (trx->conc_state != TRX_NOT_STARTED &&
2161 2162 2163 2164 2165 2166 2167
		global_system_variables.log_warnings) {
		sql_print_warning(
			"MySQL is closing a connection that has an active "
			"InnoDB transaction.  %lu row modifications will "
			"roll back.",
			(ulong) trx->undo_no.low);
	}
osku's avatar
osku committed
2168 2169 2170

	innobase_rollback_trx(trx);

2171
	thr_local_free(trx->mysql_thread_id);
2172
	trx_free_for_mysql(trx);
osku's avatar
osku committed
2173

2174
	DBUG_RETURN(0);
osku's avatar
osku committed
2175 2176 2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189
}


/*****************************************************************************
** InnoDB database tables
*****************************************************************************/

/********************************************************************
Get the record format from the data dictionary. */
enum row_type
ha_innobase::get_row_type() const
/*=============================*/
			/* out: ROW_TYPE_REDUNDANT or ROW_TYPE_COMPACT */
{
	if (prebuilt && prebuilt->table) {
2190
		if (dict_table_is_comp_noninline(prebuilt->table)) {
osku's avatar
osku committed
2191 2192 2193 2194 2195 2196 2197 2198 2199
			return(ROW_TYPE_COMPACT);
		} else {
			return(ROW_TYPE_REDUNDANT);
		}
	}
	ut_ad(0);
	return(ROW_TYPE_NOT_USED);
}

2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214


/********************************************************************
Get the table flags to use for the statement. HA_BINLOG_STMT_CAPABLE is
added to int_table_flags only when the isolation level of the current
thread is above ISO_READ_COMMITTED. */
handler::Table_flags
ha_innobase::table_flags() const
{
	/* The isolation level is taken from the thread rather than from
	prebuilt, because this function is (also) called before prebuilt
	is inited. */
	ulong const	isolation_level = thd_tx_isolation(current_thd);

	Table_flags	flags = int_table_flags;

	if (!(isolation_level <= ISO_READ_COMMITTED)) {
		flags = int_table_flags | HA_BINLOG_STMT_CAPABLE;
	}

	return flags;
}

osku's avatar
osku committed
2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281 2282 2283 2284 2285
/********************************************************************
File extensions used by InnoDB: only ".ibd", the extension of a
single-table tablespace. The list is terminated by NullS. */
static const char* ha_innobase_exts[] = { ".ibd", NullS };

/********************************************************************
Gives the file extension of an InnoDB single-table tablespace. */
const char**
ha_innobase::bas_ext() const
/*========================*/
				/* out: NullS-terminated array of file
				extension strings */
{
	return(ha_innobase_exts);
}


/*********************************************************************
Normalizes a table name string. The normalized form is the database
name, a '/', and the table name, for example test/mytable. The input is
scanned from its end: the last path component is taken as the table name
and the component before it as the database name; both '/' and '\\' are
accepted as separators. On Windows the result is also converted to lower
case. The caller must supply a norm_name buffer that is large enough. */
static
void
normalize_table_name(
/*=================*/
	char*		norm_name,	/* out: normalized name as a
					null-terminated string */
	const char*	name)		/* in: table name string */
{
	char*	cursor;
	char*	table_start;
	char*	db_start;

	/* Walk backwards from the last character to the separator in front
	of the table name */
	for (cursor = strend(name) - 1;
	     cursor >= name && *cursor != '\\' && *cursor != '/';
	     cursor--) {
		/* empty */
	}

	table_start = cursor + 1;

	/* There has to be a database component in front of the separator */
	DBUG_ASSERT(cursor > name);

	/* Step over the separator and keep walking back to the separator
	(or start of string) in front of the database name */
	for (cursor--;
	     cursor >= name && *cursor != '\\' && *cursor != '/';
	     cursor--) {
		/* empty */
	}

	db_start = cursor + 1;

	/* Copy "<db><sep><table>" including the terminating NUL ... */
	memcpy(norm_name, db_start, strlen(name) + 1 - (db_start - name));

	/* ... and force the separator between the two parts to '/' */
	norm_name[table_start - db_start - 1] = '/';

#ifdef __WIN__
	innobase_casedn_str(norm_name);
#endif
}

/*********************************************************************
Creates and opens a handle to a table which already exists in an InnoDB
database. */

int
ha_innobase::open(
/*==============*/
					/* out: 1 if error, 0 if success */
	const char*	name,		/* in: table name */
2286 2287
	int		mode,		/* in: not used */
	uint		test_if_locked)	/* in: not used */
osku's avatar
osku committed
2288 2289
{
	dict_table_t*	ib_table;
2290
	char		norm_name[1000];
osku's avatar
osku committed
2291
	THD*		thd;
inaam's avatar
inaam committed
2292 2293
	ulint		retries = 0;
	char*		is_part = NULL;
osku's avatar
osku committed
2294 2295 2296 2297 2298 2299

	DBUG_ENTER("ha_innobase::open");

	UT_NOT_USED(mode);
	UT_NOT_USED(test_if_locked);

2300
	thd = ha_thd();
2301 2302 2303 2304 2305 2306 2307 2308

	/* Under some cases MySQL seems to call this function while
	holding btr_search_latch. This breaks the latching order as
	we acquire dict_sys->mutex below and leads to a deadlock. */
	if (thd != NULL) {
		innobase_release_temporary_latches(ht, thd);
	}

osku's avatar
osku committed
2309 2310 2311 2312 2313 2314 2315 2316 2317 2318 2319 2320 2321 2322 2323 2324 2325
	normalize_table_name(norm_name, name);

	user_thd = NULL;

	if (!(share=get_share(name))) {

		DBUG_RETURN(1);
	}

	/* Create buffers for packing the fields of a record. Why
	table->reclength did not work here? Obviously, because char
	fields when packed actually became 1 byte longer, when we also
	stored the string length as the first byte. */

	upd_and_key_val_buff_len =
				table->s->reclength + table->s->max_key_length
							+ MAX_REF_PARTS * 3;
2326
	if (!(uchar*) my_multi_malloc(MYF(MY_WME),
2327 2328 2329 2330
			&upd_buff, upd_and_key_val_buff_len,
			&key_val_buff, upd_and_key_val_buff_len,
			NullS)) {
		free_share(share);
osku's avatar
osku committed
2331

2332 2333
		DBUG_RETURN(1);
	}
osku's avatar
osku committed
2334

inaam's avatar
inaam committed
2335 2336 2337 2338 2339 2340 2341
	/* We look for pattern #P# to see if the table is partitioned
	MySQL table. The retry logic for partitioned tables is a
	workaround for http://bugs.mysql.com/bug.php?id=33349. Look
	at support issue https://support.mysql.com/view.php?id=21080
	for more details. */
	is_part = strstr(norm_name, "#P#");
retry:
osku's avatar
osku committed
2342
	/* Get pointer to a table object in InnoDB dictionary cache */
2343
	ib_table = dict_table_get(norm_name, TRUE);
inaam's avatar
inaam committed
2344
	
2345
	if (NULL == ib_table) {
inaam's avatar
inaam committed
2346 2347 2348 2349 2350 2351 2352 2353 2354 2355 2356 2357
		if (is_part && retries < 10) {
			++retries;
			os_thread_sleep(100000);
			goto retry;
		}

		if (is_part) {
			sql_print_error("Failed to open table %s after "
					"%lu attemtps.\n", norm_name,
					retries);
		}

2358 2359 2360 2361 2362 2363 2364 2365 2366 2367 2368 2369
		sql_print_error("Cannot find or open table %s from\n"
				"the internal data dictionary of InnoDB "
				"though the .frm file for the\n"
				"table exists. Maybe you have deleted and "
				"recreated InnoDB data\n"
				"files but have forgotten to delete the "
				"corresponding .frm files\n"
				"of InnoDB tables, or you have moved .frm "
				"files to another database?\n"
				"or, the table contains indexes that this "
				"version of the engine\n"
				"doesn't support.\n"
2370
				"See http://dev.mysql.com/doc/refman/5.1/en/innodb-troubleshooting.html\n"
osku's avatar
osku committed
2371 2372
				"how you can resolve the problem.\n",
				norm_name);
2373
		free_share(share);
marko's avatar
marko committed
2374
		my_free(upd_buff, MYF(0));
2375
		my_errno = ENOENT;
osku's avatar
osku committed
2376

2377 2378
		DBUG_RETURN(HA_ERR_NO_SUCH_TABLE);
	}
osku's avatar
osku committed
2379

2380
	if (ib_table->ibd_file_missing && !thd_tablespace_op(thd)) {
osku's avatar
osku committed
2381 2382 2383 2384 2385
		sql_print_error("MySQL is trying to open a table handle but "
				"the .ibd file for\ntable %s does not exist.\n"
				"Have you deleted the .ibd file from the "
				"database directory under\nthe MySQL datadir, "
				"or have you used DISCARD TABLESPACE?\n"
2386
				"See http://dev.mysql.com/doc/refman/5.1/en/innodb-troubleshooting.html\n"
osku's avatar
osku committed
2387 2388
				"how you can resolve the problem.\n",
				norm_name);
2389
		free_share(share);
marko's avatar
marko committed
2390
		my_free(upd_buff, MYF(0));
2391
		my_errno = ENOENT;
osku's avatar
osku committed
2392 2393

		dict_table_decrement_handle_count(ib_table);
2394 2395
		DBUG_RETURN(HA_ERR_NO_SUCH_TABLE);
	}
osku's avatar
osku committed
2396

osku's avatar
osku committed
2397
	prebuilt = row_create_prebuilt(ib_table);
osku's avatar
osku committed
2398

osku's avatar
osku committed
2399
	prebuilt->mysql_row_len = table->s->reclength;
osku's avatar
osku committed
2400 2401 2402

	/* Looks like MySQL-3.23 sometimes has primary key number != 0 */

2403
	primary_key = table->s->primary_key;
osku's avatar
osku committed
2404 2405 2406 2407
	key_used_on_scan = primary_key;

	/* Allocate a buffer for a 'row reference'. A row reference is
	a string of bytes of length ref_length which uniquely specifies
2408 2409 2410
	a row in our table. Note that MySQL may also compare two row
	references for equality by doing a simple memcmp on the strings
	of length ref_length! */
osku's avatar
osku committed
2411

2412 2413
	if (!row_table_got_default_clust_index(ib_table)) {
		if (primary_key >= MAX_KEY) {
osku's avatar
osku committed
2414 2415 2416 2417
		  sql_print_error("Table %s has a primary key in InnoDB data "
				  "dictionary, but not in MySQL!", name);
		}

osku's avatar
osku committed
2418 2419
		prebuilt->clust_index_was_generated = FALSE;

2420
		/* MySQL allocates the buffer for ref. key_info->key_length
osku's avatar
osku committed
2421 2422 2423 2424
		includes space for all key columns + one byte for each column
		that may be NULL. ref_length must be as exact as possible to
		save space, because all row reference buffers are allocated
		based on ref_length. */
2425 2426

		ref_length = table->key_info[primary_key].key_length;
osku's avatar
osku committed
2427
	} else {
2428
		if (primary_key != MAX_KEY) {
osku's avatar
osku committed
2429 2430 2431 2432 2433 2434 2435 2436 2437 2438 2439
		  sql_print_error("Table %s has no primary key in InnoDB data "
				  "dictionary, but has one in MySQL! If you "
				  "created the table with a MySQL version < "
				  "3.23.54 and did not define a primary key, "
				  "but defined a unique key with all non-NULL "
				  "columns, then MySQL internally treats that "
				  "key as the primary key. You can fix this "
				  "error by dump + DROP + CREATE + reimport "
				  "of the table.", name);
		}

osku's avatar
osku committed
2440
		prebuilt->clust_index_was_generated = TRUE;
osku's avatar
osku committed
2441

2442
		ref_length = DATA_ROW_ID_LEN;
osku's avatar
osku committed
2443 2444 2445 2446 2447 2448 2449 2450

		/* If we automatically created the clustered index, then
		MySQL does not know about it, and MySQL must NOT be aware
		of the index used on scan, to make it avoid checking if we
		update the column of the index. That is why we assert below
		that key_used_on_scan is the undefined value MAX_KEY.
		The column is the row id in the automatical generation case,
		and it will never be updated anyway. */
2451

osku's avatar
osku committed
2452
		if (key_used_on_scan != MAX_KEY) {
2453 2454 2455 2456
			sql_print_warning(
				"Table %s key_used_on_scan is %lu even "
				"though there is no primary key inside "
				"InnoDB.", name, (ulong) key_used_on_scan);
osku's avatar
osku committed
2457 2458 2459
		}
	}

marko's avatar
marko committed
2460
	stats.block_size = 16 * 1024;	/* Index block size in InnoDB: used by MySQL
osku's avatar
osku committed
2461 2462 2463 2464 2465
				in query optimization */

	/* Init table lock structure */
	thr_lock_data_init(&share->lock,&lock,(void*) 0);

2466
	info(HA_STATUS_NO_LOCK | HA_STATUS_VARIABLE | HA_STATUS_CONST);
osku's avatar
osku committed
2467

2468
	DBUG_RETURN(0);
osku's avatar
osku committed
2469 2470
}

2471 2472 2473 2474 2475 2476
/**********************************************************************
Reports the longest key part length this handler accepts, which is one
less than DICT_MAX_INDEX_COL_LEN. */
uint
ha_innobase::max_supported_key_part_length() const
/*==============================================*/
				/* out: DICT_MAX_INDEX_COL_LEN - 1 */
{
	const uint	longest_part = DICT_MAX_INDEX_COL_LEN - 1;

	return(longest_part);
}

osku's avatar
osku committed
2477 2478 2479 2480 2481 2482 2483 2484
/**********************************************************************
Closes a handle to an InnoDB table. */

int
ha_innobase::close(void)
/*====================*/
				/* out: 0 */
{
2485 2486
	THD*	thd;

2487
	DBUG_ENTER("ha_innobase::close");
osku's avatar
osku committed
2488

2489 2490 2491 2492
	thd = current_thd;  // avoid calling current_thd twice, it may be slow
	if (thd != NULL) {
		innobase_release_temporary_latches(ht, thd);
	}
vasil's avatar
vasil committed
2493

osku's avatar
osku committed
2494
	row_prebuilt_free(prebuilt);
osku's avatar
osku committed
2495

marko's avatar
marko committed
2496
	my_free(upd_buff, MYF(0));
2497
	free_share(share);
osku's avatar
osku committed
2498 2499 2500 2501 2502 2503

	/* Tell InnoDB server that there might be work for
	utility threads: */

	srv_active_wake_master_thread();

2504
	DBUG_RETURN(0);
osku's avatar
osku committed
2505 2506 2507 2508 2509 2510 2511 2512 2513 2514 2515 2516 2517 2518
}

/* The following accessor functions should really be inside MySQL code! */

/******************************************************************
Computes where a field starts inside a MySQL row, measured from the
beginning of table->record[0]. */
inline
uint
get_field_offset(
/*=============*/
			/* out: offset */
	TABLE*	table,	/* in: MySQL table object */
	Field*	field)	/* in: MySQL field object */
{
	uint	offset;

	/* Distance between the field data pointer and the row start */
	offset = (uint) (field->ptr - table->record[0]);

	return(offset);
}

/******************************************************************
Checks if a field in a record is SQL NULL. Uses the record format
information in table to track the null bit in record. */
marko's avatar
marko committed
2525
static inline
osku's avatar
osku committed
2526 2527 2528 2529 2530 2531 2532 2533 2534 2535 2536 2537 2538 2539 2540 2541 2542 2543 2544 2545 2546 2547 2548 2549 2550 2551 2552 2553 2554 2555 2556 2557 2558 2559 2560 2561 2562 2563 2564 2565 2566 2567 2568 2569 2570 2571 2572 2573 2574 2575 2576 2577 2578 2579 2580 2581 2582 2583 2584 2585 2586 2587 2588 2589 2590 2591 2592 2593
uint
field_in_record_is_null(
/*====================*/
			/* out: 1 if NULL, 0 otherwise */
	TABLE*	table,	/* in: MySQL table object */
	Field*	field,	/* in: MySQL field object */
	char*	record)	/* in: a row in MySQL format */
{
	int	null_offset;

	if (!field->null_ptr) {

		return(0);
	}

	null_offset = (uint) ((char*) field->null_ptr
					- (char*) table->record[0]);

	if (record[null_offset] & field->null_bit) {

		return(1);
	}

	return(0);
}

/******************************************************************
Marks a field as SQL NULL in the given record by switching on its null
bit. The position of the null byte is derived from table->record[0] and
field->null_ptr. */
inline
void
set_field_in_record_to_null(
/*========================*/
	TABLE*	table,	/* in: MySQL table object */
	Field*	field,	/* in: MySQL field object */
	char*	record)	/* in: a row in MySQL format */
{
	const int	null_byte_pos = (uint) ((char*) field->null_ptr
					- (char*) table->record[0]);

	record[null_byte_pos] |= field->null_bit;
}

extern "C" {
/*****************************************************************
InnoDB uses this function to compare two data fields for which the data type
is such that we must use MySQL code to compare them. NOTE that the prototype
of this function is in rem0cmp.c in InnoDB source code! If you change this
function, remember to update the prototype there! */

int
innobase_mysql_cmp(
/*===============*/
					/* out: 1, 0, -1, if a is greater,
					equal, less than b, respectively */
	int		mysql_type,	/* in: MySQL type */
	uint		charset_number,	/* in: number of the charset */
	unsigned char*	a,		/* in: data field */
	unsigned int	a_length,	/* in: data field length,
					not UNIV_SQL_NULL */
	unsigned char*	b,		/* in: data field */
	unsigned int	b_length)	/* in: data field length,
					not UNIV_SQL_NULL */
{
	CHARSET_INFO*		charset;
	enum_field_types	mysql_tp;
2594
	int			ret;
osku's avatar
osku committed
2595 2596 2597 2598 2599 2600 2601 2602

	DBUG_ASSERT(a_length != UNIV_SQL_NULL);
	DBUG_ASSERT(b_length != UNIV_SQL_NULL);

	mysql_tp = (enum_field_types) mysql_type;

	switch (mysql_tp) {

2603
	case MYSQL_TYPE_BIT:
osku's avatar
osku committed
2604 2605
	case MYSQL_TYPE_STRING:
	case MYSQL_TYPE_VAR_STRING:
marko's avatar
marko committed
2606 2607 2608 2609
	case MYSQL_TYPE_TINY_BLOB:
	case MYSQL_TYPE_MEDIUM_BLOB:
	case MYSQL_TYPE_BLOB:
	case MYSQL_TYPE_LONG_BLOB:
2610
	case MYSQL_TYPE_VARCHAR:
osku's avatar
osku committed
2611 2612 2613 2614 2615 2616 2617 2618 2619 2620 2621 2622 2623 2624 2625 2626 2627 2628 2629 2630 2631
		/* Use the charset number to pick the right charset struct for
		the comparison. Since the MySQL function get_charset may be
		slow before Bar removes the mutex operation there, we first
		look at 2 common charsets directly. */

		if (charset_number == default_charset_info->number) {
			charset = default_charset_info;
		} else if (charset_number == my_charset_latin1.number) {
			charset = &my_charset_latin1;
		} else {
			charset = get_charset(charset_number, MYF(MY_WME));

			if (charset == NULL) {
			  sql_print_error("InnoDB needs charset %lu for doing "
					  "a comparison, but MySQL cannot "
					  "find that charset.",
					  (ulong) charset_number);
				ut_a(0);
			}
		}

2632 2633 2634 2635
		/* Starting from 4.1.3, we use strnncollsp() in comparisons of
		non-latin1_swedish_ci strings. NOTE that the collation order
		changes then: 'b\0\0...' is ordered BEFORE 'b  ...'. Users
		having indexes on such data need to rebuild their tables! */
osku's avatar
osku committed
2636

2637 2638 2639
		ret = charset->coll->strnncollsp(charset,
				  a, a_length,
						 b, b_length, 0);
osku's avatar
osku committed
2640
		if (ret < 0) {
2641
			return(-1);
osku's avatar
osku committed
2642
		} else if (ret > 0) {
2643
			return(1);
osku's avatar
osku committed
2644
		} else {
2645 2646
			return(0);
		}
osku's avatar
osku committed
2647 2648 2649 2650 2651 2652 2653 2654 2655 2656 2657 2658 2659 2660 2661 2662 2663 2664 2665 2666 2667 2668 2669 2670 2671 2672
	default:
		assert(0);
	}

	return(0);
}
}

/******************************************************************
Maps the type of a MySQL field to the InnoDB main type ('mtype'). The
distinction between MySQL's old <= 4.1 VARCHAR and the new true VARCHAR
in >= 5.0.3 is not made here; InnoDB expresses it in the 'prtype'. */
inline
ulint
get_innobase_type_from_mysql_type(
/*==============================*/
				/* out: DATA_BINARY, DATA_VARCHAR, ... */
	ulint*	unsigned_flag,	/* out: DATA_UNSIGNED if an 'unsigned type';
				at least ENUM and SET, and unsigned integer
				types are 'unsigned types' */
	Field*	field)		/* in: MySQL field */
{
	/* The MySQL type code has to fit in 8 bits: ibuf relies on this, and
	so does the code that ORs DATA_NOT_NULL to the type */

	DBUG_ASSERT((ulint)MYSQL_TYPE_STRING < 256);
	DBUG_ASSERT((ulint)MYSQL_TYPE_VAR_STRING < 256);
	DBUG_ASSERT((ulint)MYSQL_TYPE_DOUBLE < 256);
	DBUG_ASSERT((ulint)MYSQL_TYPE_FLOAT < 256);
	DBUG_ASSERT((ulint)MYSQL_TYPE_DECIMAL < 256);

	*unsigned_flag = (field->flags & UNSIGNED_FLAG) ? DATA_UNSIGNED : 0;

	const enum_field_types	real_tp = field->real_type();

	if (real_tp == MYSQL_TYPE_ENUM || real_tp == MYSQL_TYPE_SET) {

		/* field->type() claims a string type for ENUM and SET, but
		the value is stored internally as an unsigned integer code.
		MySQL leaves its own unsigned flag at zero for them, so the
		flag is forced here. */

		*unsigned_flag = DATA_UNSIGNED;

		return(DATA_INT);
	}

	switch (field->type()) {
		/* NOTE that we only allow string types in DATA_MYSQL and
		DATA_VARMYSQL */
	case MYSQL_TYPE_VAR_STRING: /* old <= 4.1 VARCHAR */
	case MYSQL_TYPE_VARCHAR:    /* new >= 5.0.3 true VARCHAR */
		if (field->binary()) {

			return(DATA_BINARY);
		}

		if (0 == strcmp(field->charset()->name,
				"latin1_swedish_ci")) {

			return(DATA_VARCHAR);
		}

		return(DATA_VARMYSQL);

	case MYSQL_TYPE_BIT:
	case MYSQL_TYPE_STRING:
		if (field->binary()) {

			return(DATA_FIXBINARY);
		}

		if (0 == strcmp(field->charset()->name,
				"latin1_swedish_ci")) {

			return(DATA_CHAR);
		}

		return(DATA_MYSQL);

	case MYSQL_TYPE_NEWDECIMAL:
		return(DATA_FIXBINARY);

	case MYSQL_TYPE_LONG:
	case MYSQL_TYPE_LONGLONG:
	case MYSQL_TYPE_TINY:
	case MYSQL_TYPE_SHORT:
	case MYSQL_TYPE_INT24:
	case MYSQL_TYPE_DATE:
	case MYSQL_TYPE_DATETIME:
	case MYSQL_TYPE_YEAR:
	case MYSQL_TYPE_NEWDATE:
	case MYSQL_TYPE_TIME:
	case MYSQL_TYPE_TIMESTAMP:
		return(DATA_INT);

	case MYSQL_TYPE_FLOAT:
		return(DATA_FLOAT);

	case MYSQL_TYPE_DOUBLE:
		return(DATA_DOUBLE);

	case MYSQL_TYPE_DECIMAL:
		return(DATA_DECIMAL);

	case MYSQL_TYPE_GEOMETRY:
	case MYSQL_TYPE_TINY_BLOB:
	case MYSQL_TYPE_MEDIUM_BLOB:
	case MYSQL_TYPE_BLOB:
	case MYSQL_TYPE_LONG_BLOB:
		return(DATA_BLOB);

	default:
		assert(0);
	}

	return(0);
}

/***********************************************************************
Stores an unsigned integer value < 64k into 2 bytes, least significant
byte first. */
inline
void
innobase_write_to_2_little_endian(
/*==============================*/
	byte*	buf,	/* in: where to store */
	ulint	val)	/* in: value to write, must be < 64k */
{
	ut_a(val <= 0xFFFF);

	const byte	low_byte	= (byte)(val & 0xFF);
	const byte	high_byte	= (byte)(val >> 8);

	buf[0] = low_byte;
	buf[1] = high_byte;
}

/***********************************************************************
Decodes an unsigned integer value < 64k from 2 bytes that hold it least
significant byte first. */
inline
uint
innobase_read_from_2_little_endian(
/*===============================*/
				/* out: value */
	const uchar*	buf)	/* in: from where to read */
{
	const ulint	low_byte	= (ulint) buf[0];
	const ulint	high_byte	= (ulint) buf[1];

	return (uint) (low_byte + (high_byte << 8));
}

/***********************************************************************
Stores a key value for a row to a buffer. The first buff_len bytes of buff
are zero-filled, and then the value of every key part of index keynr is
taken from record and appended to buff in the MySQL key value format that
is described at the start of the function body. Before returning, the
function asserts that no more than buff_len bytes were produced. */

uint
ha_innobase::store_key_val_for_row(
/*===============================*/
				/* out: key value length as stored in buff */
2794
	uint		keynr,	/* in: key number */
osku's avatar
osku committed
2795 2796 2797
	char*		buff,	/* in/out: buffer for the key value (in MySQL
				format) */
	uint		buff_len,/* in: buffer length */
2798
	const uchar*	record)/* in: row in MySQL format */
osku's avatar
osku committed
2799
{
2800 2801 2802
	KEY*		key_info	= table->key_info + keynr;
	KEY_PART_INFO*	key_part	= key_info->key_part;
	KEY_PART_INFO*	end		= key_part + key_info->key_parts;
osku's avatar
osku committed
2803 2804 2805 2806 2807
	char*		buff_start	= buff;
	enum_field_types mysql_type;
	Field*		field;
	ibool		is_null;

2808
	DBUG_ENTER("store_key_val_for_row");
osku's avatar
osku committed
2809 2810 2811 2812 2813 2814 2815 2816 2817 2818 2819 2820 2821 2822 2823 2824 2825 2826 2827 2828 2829 2830 2831 2832 2833 2834 2835 2836

	/* The format for storing a key field in MySQL is the following:

	1. If the column can be NULL, then in the first byte we put 1 if the
	field value is NULL, 0 otherwise.

	2. If the column is of a BLOB type (it must be a column prefix field
	in this case), then we put the length of the data in the field to the
	next 2 bytes, in the little-endian format. If the field is SQL NULL,
	then these 2 bytes are set to 0. Note that the length of data in the
	field is <= column prefix length.

	3. In a column prefix field, prefix_len next bytes are reserved for
	data. In a normal field the max field length next bytes are reserved
	for data. For a VARCHAR(n) the max field length is n. If the stored
	value is the SQL NULL then these data bytes are set to 0.

	4. We always use a 2 byte length for a true >= 5.0.3 VARCHAR. Note that
	in the MySQL row format, the length is stored in 1 or 2 bytes,
	depending on the maximum allowed length. But in the MySQL key value
	format, the length always takes 2 bytes.

	We have to zero-fill the buffer so that MySQL is able to use a
	simple memcmp to compare two key values to determine if they are
	equal. MySQL does this to compare contents of two 'ref' values. */

	bzero(buff, buff_len);

2837 2838
	/* buff is advanced past each key part as it is written; buff_start
	keeps the beginning so that the total length can be computed */
	for (; key_part != end; key_part++) {
		is_null = FALSE;
osku's avatar
osku committed
2839

2840 2841
		/* A nonzero null_bit means the key part is nullable and
		gets a leading NULL indicator byte */
		if (key_part->null_bit) {
			if (record[key_part->null_offset]
osku's avatar
osku committed
2842 2843 2844
						& key_part->null_bit) {
				*buff = 1;
				is_null = TRUE;
2845
			} else {
osku's avatar
osku committed
2846 2847 2848
				*buff = 0;
			}
			buff++;
2849
		}
osku's avatar
osku committed
2850 2851 2852 2853 2854 2855 2856 2857 2858 2859

		field = key_part->field;
		mysql_type = field->type();

		if (mysql_type == MYSQL_TYPE_VARCHAR) {
						/* >= 5.0.3 true VARCHAR */
			ulint	lenlen;
			ulint	len;
			byte*	data;
			ulint	key_len;
2860
			ulint	true_len;
osku's avatar
osku committed
2861 2862 2863
			CHARSET_INFO*	cs;
			int	error=0;

2864 2865
			key_len = key_part->length;

osku's avatar
osku committed
2866
			if (is_null) {
2867
				/* Skip the 2 length bytes and the reserved
				data bytes; they stay zero from the bzero()
				call above */
				buff += key_len + 2;
2868

osku's avatar
osku committed
2869 2870
				continue;
			}
2871
			cs = field->charset();
osku's avatar
osku committed
2872 2873 2874 2875

			lenlen = (ulint)
				(((Field_varstring*)field)->length_bytes);

2876
			data = row_mysql_read_true_varchar(&len,
osku's avatar
osku committed
2877 2878 2879 2880
				(byte*) (record
				+ (ulint)get_field_offset(table, field)),
				lenlen);

2881 2882
			true_len = len;

2883 2884 2885
			/* For multi byte character sets we need to calculate
			the true length of the key */

2886
			/* NOTE(review): well_formed_len() is given a limit of
			key_len / mbmaxlen characters; presumably it returns
			the byte length of the well-formed prefix within that
			limit - confirm against the charset API. The value
			stored in 'error' is not inspected afterwards. */
			if (len > 0 && cs->mbmaxlen > 1) {
2887 2888
				true_len = (ulint) cs->cset->well_formed_len(cs,
						(const char *) data,
2889
						(const char *) data + len,
marko's avatar
marko committed
2890 2891
                                                (uint) (key_len /
                                                        cs->mbmaxlen),
2892 2893 2894
						&error);
			}

osku's avatar
osku committed
2895 2896 2897
			/* In a column prefix index, we may need to truncate
			the stored value: */

2898 2899
			if (true_len > key_len) {
				true_len = key_len;
osku's avatar
osku committed
2900 2901 2902 2903 2904
			}

			/* The length in a key value is always stored in 2
			bytes */

2905
			row_mysql_store_true_var_len((byte*)buff, true_len, 2);
osku's avatar
osku committed
2906 2907
			buff += 2;

2908
			memcpy(buff, data, true_len);
osku's avatar
osku committed
2909 2910 2911 2912 2913 2914 2915

			/* Note that we always reserve the maximum possible
			length of the true VARCHAR in the key value, though
			only len first bytes after the 2 length bytes contain
			actual data. The rest of the space was reset to zero
			in the bzero() call above. */

2916
			buff += key_len;
osku's avatar
osku committed
2917

marko's avatar
marko committed
2918 2919 2920 2921
		} else if (mysql_type == MYSQL_TYPE_TINY_BLOB
			|| mysql_type == MYSQL_TYPE_MEDIUM_BLOB
			|| mysql_type == MYSQL_TYPE_BLOB
			|| mysql_type == MYSQL_TYPE_LONG_BLOB) {
osku's avatar
osku committed
2922 2923 2924

			CHARSET_INFO*	cs;
			ulint		key_len;
2925
			ulint		true_len;
osku's avatar
osku committed
2926
			int		error=0;
2927 2928
			ulint		blob_len;
			byte*		blob_data;
osku's avatar
osku committed
2929 2930 2931

			/* A BLOB key part must be a column prefix */
			ut_a(key_part->key_part_flag & HA_PART_KEY_SEG);

2932 2933
			key_len = key_part->length;

2934
			if (is_null) {
2935
				/* Skip the 2 length bytes and the reserved
				prefix bytes; they stay zero from the bzero()
				call above */
				buff += key_len + 2;
2936

osku's avatar
osku committed
2937 2938
				continue;
			}
2939

2940 2941
			cs = field->charset();

2942
			blob_data = row_mysql_read_blob_ref(&blob_len,
osku's avatar
osku committed
2943 2944 2945 2946
				(byte*) (record
				+ (ulint)get_field_offset(table, field)),
					(ulint) field->pack_length());

2947 2948
			true_len = blob_len;

osku's avatar
osku committed
2949
			/* The field offset computed from the field object
			must agree with the offset kept in the key part */
			ut_a(get_field_offset(table, field)
2950
				== key_part->offset);
osku's avatar
osku committed
2951

2952 2953
			/* For multi byte character sets we need to calculate
			the true length of the key */
2954

2955
			if (blob_len > 0 && cs->mbmaxlen > 1) {
2956 2957
				true_len = (ulint) cs->cset->well_formed_len(cs,
						(const char *) blob_data,
2958
						(const char *) blob_data
2959
							+ blob_len,
marko's avatar
marko committed
2960 2961
                                                (uint) (key_len /
                                                        cs->mbmaxlen),
2962 2963 2964
						&error);
			}

osku's avatar
osku committed
2965 2966 2967 2968
			/* All indexes on BLOB and TEXT are column prefix
			indexes, and we may need to truncate the data to be
			stored in the key value: */

2969 2970
			if (true_len > key_len) {
				true_len = key_len;
osku's avatar
osku committed
2971 2972 2973 2974 2975 2976
			}

			/* MySQL reserves 2 bytes for the length and the
			storage of the number is little-endian */

			innobase_write_to_2_little_endian(
2977
					(byte*)buff, true_len);
osku's avatar
osku committed
2978 2979
			buff += 2;

2980
			memcpy(buff, blob_data, true_len);
osku's avatar
osku committed
2981 2982 2983 2984

			/* Note that we always reserve the maximum possible
			length of the BLOB prefix in the key value. */

2985
			buff += key_len;
osku's avatar
osku committed
2986 2987 2988 2989 2990 2991 2992
		} else {
			/* Here we handle all other data types except the
			true VARCHAR, BLOB and TEXT. Note that the column
			value we store may be also in a column prefix
			index. */

			CHARSET_INFO*		cs;
2993 2994
			ulint			true_len;
			ulint			key_len;
2995
			const uchar*		src_start;
osku's avatar
osku committed
2996
			int			error=0;
2997 2998 2999
			enum_field_types	real_type;

			key_len = key_part->length;
osku's avatar
osku committed
3000

3001
			if (is_null) {
3002
				 /* No length bytes in this format: skip only
				 the reserved data bytes */
				 buff += key_len;
3003

osku's avatar
osku committed
3004 3005 3006 3007
				 continue;
			}

			src_start = record + key_part->offset;
3008 3009 3010 3011
			real_type = field->real_type();
			/* Unless shortened below, all key_len bytes are
			copied and no padding is added */
			true_len = key_len;

			/* Character set for the field is defined only
3012
			to fields whose type is string and real field
3013 3014 3015
			type is not enum or set. For these fields check
			if character set is multi byte. */

marko's avatar
marko committed
3016 3017
			if (real_type != MYSQL_TYPE_ENUM
				&& real_type != MYSQL_TYPE_SET
3018 3019 3020 3021 3022
				&& ( mysql_type == MYSQL_TYPE_VAR_STRING
					|| mysql_type == MYSQL_TYPE_STRING)) {

				cs = field->charset();

3023
				/* For multi byte character sets we need to
3024 3025 3026 3027
				calculate the true length of the key */

				if (key_len > 0 && cs->mbmaxlen > 1) {

3028
					true_len = (ulint)
3029 3030
						cs->cset->well_formed_len(cs,
							(const char *)src_start,
3031
							(const char *)src_start
3032
								+ key_len,
marko's avatar
marko committed
3033 3034
                                                        (uint) (key_len /
                                                                cs->mbmaxlen),
3035 3036
							&error);
				}
osku's avatar
osku committed
3037 3038
			}

3039 3040
			memcpy(buff, src_start, true_len);
			buff += true_len;
osku's avatar
osku committed
3041

3042 3043 3044
			/* Pad the unused space with spaces. Note that no
			padding is ever needed for UCS-2 because in MySQL,
			all UCS2 characters are 2 bytes, as MySQL does not
3045 3046
			support surrogate pairs, which are needed to represent
			characters in the range U+10000 to U+10FFFF. */
osku's avatar
osku committed
3047

3048 3049 3050 3051
			if (true_len < key_len) {
				ulint pad_len = key_len - true_len;
				memset(buff, ' ', pad_len);
				buff += pad_len;
osku's avatar
osku committed
3052 3053
			}
		}
3054
	}
osku's avatar
osku committed
3055 3056 3057 3058 3059 3060 3061 3062 3063

	/* This check runs only after all the writes have been done */
	ut_a(buff <= buff_start + buff_len);

	DBUG_RETURN((uint)(buff - buff_start));
}

/******************************************************************
Builds a 'template' to the prebuilt struct. The template is used in fast
retrieval of just those column values MySQL needs in its processing.

The function first settles the effective template type and the index the
template is built against, then walks over all columns of the MySQL table
and fills one mysql_row_templ_t entry for every column that has to be
fetched. The results are stored in prebuilt->mysql_template,
prebuilt->n_template, prebuilt->mysql_prefix_len,
prebuilt->need_to_access_clustered and prebuilt->templ_contains_blob. */
3064
static
osku's avatar
osku committed
3065
void
3066
build_template(
osku's avatar
osku committed
3067
/*===========*/
3068
	row_prebuilt_t*	prebuilt,	/* in/out: prebuilt struct */
osku's avatar
osku committed
3069 3070 3071 3072
	THD*		thd,		/* in: current user thread, used
					only if templ_type is
					ROW_MYSQL_REC_FIELDS */
	TABLE*		table,		/* in: MySQL table */
marko's avatar
marko committed
3073
	uint		templ_type)	/* in: ROW_MYSQL_WHOLE_ROW or
osku's avatar
osku committed
3074 3075 3076 3077 3078 3079 3080 3081 3082 3083 3084 3085 3086 3087 3088 3089 3090 3091 3092
					ROW_MYSQL_REC_FIELDS */
{
	dict_index_t*	index;
	dict_index_t*	clust_index;
	mysql_row_templ_t* templ;
	Field*		field;
	ulint		n_fields;
	ulint		n_requested_fields	= 0;
	ibool		fetch_all_in_key	= FALSE;
	ibool		fetch_primary_key_cols	= FALSE;
	ulint		i;
	/* byte offset of the end of last requested column */
	ulint		mysql_prefix_len	= 0;

	if (prebuilt->select_lock_type == LOCK_X) {
		/* We always retrieve the whole clustered index record if we
		use exclusive row level locks, for example, if the read is
		done in an UPDATE statement. */

3093
		templ_type = ROW_MYSQL_WHOLE_ROW;
osku's avatar
osku committed
3094 3095 3096
	}

	if (templ_type == ROW_MYSQL_REC_FIELDS) {
3097 3098
		if (prebuilt->hint_need_to_fetch_extra_cols
			== ROW_RETRIEVE_ALL_COLS) {
osku's avatar
osku committed
3099

3100 3101
			/* We know we must at least fetch all columns in the
			key, or all columns in the table */
osku's avatar
osku committed
3102

3103 3104 3105 3106 3107 3108 3109
			if (prebuilt->read_just_key) {
				/* MySQL has instructed us that it is enough
				to fetch the columns in the key; looks like
				MySQL can set this flag also when there is
				only a prefix of the column in the key: in
				that case we retrieve the whole column from
				the clustered index */
osku's avatar
osku committed
3110

3111 3112 3113 3114 3115 3116 3117 3118 3119 3120 3121 3122 3123 3124
				fetch_all_in_key = TRUE;
			} else {
				templ_type = ROW_MYSQL_WHOLE_ROW;
			}
		} else if (prebuilt->hint_need_to_fetch_extra_cols
			== ROW_RETRIEVE_PRIMARY_KEY) {
			/* We must at least fetch all primary key cols. Note
			   that if the clustered index was internally generated
			   by InnoDB on the row id (no primary key was
			   defined), then row_search_for_mysql() will always
			   retrieve the row id to a special buffer in the
			   prebuilt struct. */

			fetch_primary_key_cols = TRUE;
osku's avatar
osku committed
3125 3126 3127 3128 3129 3130 3131 3132 3133 3134 3135 3136 3137 3138 3139 3140 3141 3142 3143 3144 3145 3146 3147 3148 3149 3150 3151 3152 3153 3154 3155 3156 3157 3158 3159 3160 3161 3162 3163 3164 3165 3166 3167 3168 3169 3170 3171 3172 3173 3174 3175 3176 3177 3178 3179 3180 3181
		}
	}

	clust_index = dict_table_get_first_index_noninline(prebuilt->table);

	/* A whole-row template is always built against the clustered index;
	a per-field template is built against the index in use */
	if (templ_type == ROW_MYSQL_REC_FIELDS) {
		index = prebuilt->index;
	} else {
		index = clust_index;
	}

	if (index == clust_index) {
		prebuilt->need_to_access_clustered = TRUE;
	} else {
		prebuilt->need_to_access_clustered = FALSE;
		/* Below we check column by column if we need to access
		the clustered index */
	}

	n_fields = (ulint)table->s->fields; /* number of columns */

	/* The template array is allocated only if the prebuilt struct does
	not have one yet; it has room for every column of the table */
	if (!prebuilt->mysql_template) {
		prebuilt->mysql_template = (mysql_row_templ_t*)
						mem_alloc_noninline(
					n_fields * sizeof(mysql_row_templ_t));
	}

	prebuilt->template_type = templ_type;
	prebuilt->null_bitmap_len = table->s->null_bytes;

	prebuilt->templ_contains_blob = FALSE;

	/* Note that in InnoDB, i is the column number. MySQL calls columns
	'fields'. */
	for (i = 0; i < n_fields; i++) {
		/* templ is the next free slot: entries of the included
		columns are stored one after another, without gaps */
		templ = prebuilt->mysql_template + n_requested_fields;
		field = table->field[i];

		if (UNIV_LIKELY(templ_type == ROW_MYSQL_REC_FIELDS)) {
			/* Decide which columns we should fetch
			and which we can skip. */
			register const ibool	index_contains_field =
				dict_index_contains_col_or_prefix(index, i);

			if (!index_contains_field && prebuilt->read_just_key) {
				/* If this is a 'key read', we do not need
				columns that are not in the key */

				goto skip_field;
			}

			if (index_contains_field && fetch_all_in_key) {
				/* This field is needed in the query */

				goto include_field;
			}

marko's avatar
marko committed
3182 3183
                        if (bitmap_is_set(table->read_set, i) ||
                            bitmap_is_set(table->write_set, i)) {
osku's avatar
osku committed
3184 3185 3186 3187 3188 3189
				/* This field is needed in the query */

				goto include_field;
			}

			if (fetch_primary_key_cols
3190 3191
				&& dict_table_col_in_clustered_key(
					index->table, i)) {
osku's avatar
osku committed
3192 3193 3194 3195 3196 3197 3198 3199 3200 3201 3202 3203 3204 3205 3206
				/* This field is needed in the query */

				goto include_field;
			}

			/* This field is not needed in the query, skip it */

			goto skip_field;
		}
		/* When the template type is ROW_MYSQL_WHOLE_ROW, control
		falls through to here for every column */
include_field:
		n_requested_fields++;

		templ->col_no = i;

		if (index == clust_index) {
3207 3208
			templ->rec_field_no = dict_col_get_clust_pos_noninline(
				&index->table->cols[i], index);
osku's avatar
osku committed
3209 3210 3211 3212 3213 3214 3215 3216 3217 3218 3219 3220 3221 3222 3223 3224 3225 3226 3227 3228 3229 3230 3231 3232 3233 3234 3235 3236
		} else {
			templ->rec_field_no = dict_index_get_nth_col_pos(
								index, i);
		}

		/* The column was not found in the index used, so the
		clustered index record has to be consulted */
		if (templ->rec_field_no == ULINT_UNDEFINED) {
			prebuilt->need_to_access_clustered = TRUE;
		}

		if (field->null_ptr) {
			templ->mysql_null_byte_offset =
				(ulint) ((char*) field->null_ptr
					- (char*) table->record[0]);

			templ->mysql_null_bit_mask = (ulint) field->null_bit;
		} else {
			/* A zero mask marks a column that has no null bit */
			templ->mysql_null_bit_mask = 0;
		}

		templ->mysql_col_offset = (ulint)
					get_field_offset(table, field);

		templ->mysql_col_len = (ulint) field->pack_length();
		/* Keep track of the largest end offset among the included
		columns */
		if (mysql_prefix_len < templ->mysql_col_offset
				+ templ->mysql_col_len) {
			mysql_prefix_len = templ->mysql_col_offset
				+ templ->mysql_col_len;
		}
3237
		templ->type = index->table->cols[i].mtype;
osku's avatar
osku committed
3238 3239 3240 3241
		templ->mysql_type = (ulint)field->type();

		/* NOTE(review): a MySQL type code is compared with an InnoDB
		DATA_ constant here; this presumably relies on
		DATA_MYSQL_TRUE_VARCHAR having the same numeric value as
		MYSQL_TYPE_VARCHAR - TODO confirm. mysql_length_bytes is
		assigned for such columns only. */
		if (templ->mysql_type == DATA_MYSQL_TRUE_VARCHAR) {
			templ->mysql_length_bytes = (ulint)
3242
				(((Field_varstring*)field)->length_bytes);
osku's avatar
osku committed
3243
		}
3244

osku's avatar
osku committed
3245
		templ->charset = dtype_get_charset_coll_noninline(
3246 3247 3248 3249
				index->table->cols[i].prtype);
		templ->mbminlen = index->table->cols[i].mbminlen;
		templ->mbmaxlen = index->table->cols[i].mbmaxlen;
		templ->is_unsigned = index->table->cols[i].prtype
osku's avatar
osku committed
3250 3251 3252 3253 3254 3255 3256 3257 3258 3259 3260 3261 3262 3263 3264 3265 3266
							& DATA_UNSIGNED;
		if (templ->type == DATA_BLOB) {
			prebuilt->templ_contains_blob = TRUE;
		}
skip_field:
		;
	}

	prebuilt->n_template = n_requested_fields;
	prebuilt->mysql_prefix_len = mysql_prefix_len;

	if (index != clust_index && prebuilt->need_to_access_clustered) {
		/* Change rec_field_no's to correspond to the clustered index
		record */
		for (i = 0; i < n_requested_fields; i++) {
			templ = prebuilt->mysql_template + i;

3267 3268 3269
			templ->rec_field_no = dict_col_get_clust_pos_noninline(
				&index->table->cols[templ->col_no],
				clust_index);
osku's avatar
osku committed
3270 3271 3272 3273
		}
	}
}

3274 3275 3276 3277 3278 3279 3280 3281 3282 3283 3284 3285 3286 3287 3288
/************************************************************************
Acquires the AUTOINC protection selected by innobase_autoinc_lock_mode.
The special handling exists to overcome a limitation of MySQL's
binlogging: the binlog stores only the min value of the autoinc interval,
which would make INSERT ... SELECT type of statements non-deterministic.
Once that is fixed the special lock handling can be removed. */

ulong
ha_innobase::innobase_autoinc_lock(void)
/*====================================*/
					/* out: DB_SUCCESS if all OK else
					error code */
{
	ulint	err			= DB_SUCCESS;
	/* TRUE when the old style AUTOINC table lock has to be taken */
	ibool	need_table_lock	= FALSE;

	switch (innobase_autoinc_lock_mode) {
	case AUTOINC_NO_LOCKING:
		/* The AUTOINC mutex alone is enough in this mode. */
		dict_table_autoinc_lock(prebuilt->table);
		break;

	case AUTOINC_NEW_STYLE_LOCKING: {
		const int	sql_cmd = thd_sql_command(user_thd);

		/* Old style locking is the default here; only a simple
		(single/multi) row INSERT or REPLACE can avoid it, and only
		if no other transaction has acquired the AUTOINC lock on
		behalf of a LOAD FILE or INSERT ... SELECT etc. type of
		statement. */
		need_table_lock = TRUE;

		if (sql_cmd == SQLCOM_INSERT || sql_cmd == SQLCOM_REPLACE) {
			dict_table_t*	ib_table = prebuilt->table;

			/* Acquire the AUTOINC mutex. */
			dict_table_autoinc_lock(ib_table);

			if (ib_table->n_waiting_or_granted_auto_inc_locks) {
				/* Some transaction holds or waits for the
				AUTOINC lock: release the mutex to avoid
				deadlocks and use old style locking. */
				dict_table_autoinc_unlock(ib_table);
			} else {
				/* The mutex is kept and it is sufficient. */
				need_table_lock = FALSE;
			}
		}
		break;
	}

	case AUTOINC_OLD_STYLE_LOCKING:
		need_table_lock = TRUE;
		break;

	default:
		ut_error;
	}

	if (need_table_lock) {
		err = row_lock_table_autoinc_for_mysql(prebuilt);

		if (err == DB_SUCCESS) {

			/* Acquire the AUTOINC mutex. */
			dict_table_autoinc_lock(prebuilt->table);
		}
	}

	return(ulong(err));
}

/************************************************************************
Unconditionally (re)initializes the AUTOINC counter of the table to the
given value. The counter is written while holding the protection taken by
innobase_autoinc_lock(); if that fails the counter is left alone. */

ulong
ha_innobase::innobase_reset_autoinc(
/*================================*/
					/* out: DB_SUCCESS if all went well
					else error code */
	ulonglong	autoinc)	/* in: value to store */
{
	ulint		lock_err = innobase_autoinc_lock();

	if (lock_err != DB_SUCCESS) {

		return(ulong(lock_err));
	}

	dict_table_autoinc_initialize(prebuilt->table, autoinc);

	dict_table_autoinc_unlock(prebuilt->table);

	return(ulong(lock_err));
}

/************************************************************************
Hands a candidate AUTOINC value to dict_table_autoinc_update() for the
table of this handle; per the contract of that call the stored value only
changes if the candidate is greater than the existing one. The update is
done while holding the protection taken by innobase_autoinc_lock(); if
taking it fails nothing is written. */

ulong
ha_innobase::innobase_set_max_autoinc(
/*==================================*/
					/* out: DB_SUCCESS if all went well
					else error code */
	ulonglong	auto_inc)	/* in: value to store */
{
	ulint		lock_err = innobase_autoinc_lock();

	if (lock_err != DB_SUCCESS) {

		return(ulong(lock_err));
	}

	dict_table_autoinc_update(prebuilt->table, auto_inc);

	dict_table_autoinc_unlock(prebuilt->table);

	return(ulong(lock_err));
}

osku's avatar
osku committed
3384 3385 3386 3387 3388 3389 3390
/************************************************************************
Stores a row in an InnoDB database, to the table specified in this
handle. In outline the function:
  1) calls ut_error if the transaction of the handle (prebuilt->trx) is
     not the transaction of the calling thread;
  2) for ALTER TABLE, OPTIMIZE TABLE, CREATE INDEX and DROP INDEX commits
     the transaction once num_write_row has reached 10000, and re-acquires
     the lock on the source table where that is needed;
  3) calls update_auto_increment() if the table has an auto-increment
     column and the row is in table->record[0];
  4) builds the ROW_MYSQL_WHOLE_ROW template if the handle does not
     currently have one;
  5) inserts the row with row_insert_for_mysql();
  6) if step 3 ran, decides from the insert result and the SQL command
     whether to raise the AUTOINC counter of the table through
     innobase_set_max_autoinc().
The InnoDB error code is converted with convert_error_code_to_mysql()
before returning, except when update_auto_increment() fails: that path
jumps straight to func_exit and returns its value unconverted. */

int
ha_innobase::write_row(
/*===================*/
3391 3392
			/* out: error code */
	uchar*	record)	/* in: a row in MySQL format */
osku's avatar
osku committed
3393
{
3394
	int		error = 0;
3395
	ibool		auto_inc_used= FALSE;
3396
	ulint		sql_command;
3397
	trx_t*		trx = thd_to_trx(user_thd);
osku's avatar
osku committed
3398

3399
	DBUG_ENTER("ha_innobase::write_row");
osku's avatar
osku committed
3400

3401
	if (prebuilt->trx != trx) {
osku's avatar
osku committed
3402 3403
	  sql_print_error("The transaction object for the table handle is at "
			  "%p, but for the current thread it is at %p",
3404
			  prebuilt->trx, trx);
osku's avatar
osku committed
3405 3406 3407 3408

		fputs("InnoDB: Dump of 200 bytes around prebuilt: ", stderr);
		ut_print_buf(stderr, ((const byte*)prebuilt) - 100, 200);
		fputs("\n"
3409
			"InnoDB: Dump of 200 bytes around ha_data: ",
osku's avatar
osku committed
3410
			stderr);
3411
		ut_print_buf(stderr, ((const byte*) trx) - 100, 200);
osku's avatar
osku committed
3412 3413 3414 3415
		putc('\n', stderr);
		ut_error;
	}

3416
	ha_statistic_increment(&SSV::ha_write_count);
osku's avatar
osku committed
3417

3418 3419
	if (table->timestamp_field_type & TIMESTAMP_AUTO_SET_ON_INSERT)
		table->timestamp_field->set_time();
osku's avatar
osku committed
3420

3421 3422 3423 3424 3425 3426 3427
	sql_command = thd_sql_command(user_thd);

	if ((sql_command == SQLCOM_ALTER_TABLE
	     || sql_command == SQLCOM_OPTIMIZE
	     || sql_command == SQLCOM_CREATE_INDEX
	     || sql_command == SQLCOM_DROP_INDEX)
	    && num_write_row >= 10000) {
osku's avatar
osku committed
3428 3429 3430 3431 3432 3433 3434 3435 3436 3437 3438 3439 3440 3441 3442 3443 3444 3445 3446 3447 3448 3449 3450 3451 3452 3453 3454
		/* ALTER TABLE is COMMITted at every 10000 copied rows.
		The IX table lock for the original table has to be re-issued.
		As this method will be called on a temporary table where the
		contents of the original table is being copied to, it is
		a bit tricky to determine the source table.  The cursor
		position in the source table need not be adjusted after the
		intermediate COMMIT, since writes by other transactions are
		being blocked by a MySQL table lock TL_WRITE_ALLOW_READ. */

		dict_table_t*	src_table;
		ulint		mode;

		num_write_row = 0;

		/* Commit the transaction.  This will release the table
		locks, so they have to be acquired again. */

		/* Altering an InnoDB table */
		/* Get the source table. */
		src_table = lock_get_src_table(
				prebuilt->trx, prebuilt->table, &mode);
		if (!src_table) {
no_commit:
			/* Unknown situation: do not commit */
			/*
			ut_print_timestamp(stderr);
			fprintf(stderr,
				"  InnoDB: ALTER TABLE is holding lock"
				" on %lu tables!\n",
				prebuilt->trx->mysql_n_tables_locked);
			*/
			;
		} else if (src_table == prebuilt->table) {
			/* Source table is not in InnoDB format:
			no need to re-acquire locks on it. */

			/* Altering to InnoDB format */
3465
			innobase_commit(ht, user_thd, 1);
osku's avatar
osku committed
3466 3467 3468
			/* Note that this transaction is still active. */
			prebuilt->trx->active_trans = 1;
			/* We will need an IX lock on the destination table. */
3469
			prebuilt->sql_stat_start = TRUE;
osku's avatar
osku committed
3470 3471 3472 3473 3474 3475 3476 3477 3478 3479 3480
		} else {
			/* Ensure that there are no other table locks than
			LOCK_IX and LOCK_AUTO_INC on the destination table. */

			if (!lock_is_table_exclusive(prebuilt->table,
							prebuilt->trx)) {
				goto no_commit;
			}

			/* Commit the transaction.  This will release the table
			locks, so they have to be acquired again. */
3481
			innobase_commit(ht, user_thd, 1);
osku's avatar
osku committed
3482 3483 3484 3485 3486
			/* Note that this transaction is still active. */
			prebuilt->trx->active_trans = 1;
			/* Re-acquire the table lock on the source table.
			NOTE(review): the return value of this call is not
			checked here. */
			row_lock_table_for_mysql(prebuilt, src_table, mode);
			/* We will need an IX lock on the destination table. */
3487
			prebuilt->sql_stat_start = TRUE;
osku's avatar
osku committed
3488 3489 3490 3491 3492
		}
	}

	num_write_row++;

3493
	/* This is the case where the table has an auto-increment column */
3494
	if (table->next_number_field && record == table->record[0]) {
osku's avatar
osku committed
3495

3496
		if ((error = update_auto_increment())) {
osku's avatar
osku committed
3497 3498 3499 3500

			/* This path skips convert_error_code_to_mysql();
			presumably update_auto_increment() already returns
			a MySQL handler error code -- TODO confirm. */
			goto func_exit;
		}

3501
		auto_inc_used = TRUE;
osku's avatar
osku committed
3502 3503 3504
	}

	if (prebuilt->mysql_template == NULL
3505 3506
	    || prebuilt->template_type != ROW_MYSQL_WHOLE_ROW) {

osku's avatar
osku committed
3507 3508 3509 3510 3511 3512 3513 3514 3515 3516
		/* Build the template used in converting quickly between
		the two database formats */

		build_template(prebuilt, NULL, table, ROW_MYSQL_WHOLE_ROW);
	}

	innodb_srv_conc_enter_innodb(prebuilt->trx);

	error = row_insert_for_mysql((byte*) record, prebuilt);

3517 3518
	/* Handle duplicate key errors */
	if (auto_inc_used) {
3519
		ulint		err;
3520
		ulonglong	auto_inc;
osku's avatar
osku committed
3521

3522 3523 3524 3525 3526 3527 3528
		/* Note the number of rows processed for this statement, used
		by get_auto_increment() to determine the number of AUTO-INC
		values to reserve. This is only useful for a multi-value
		INSERT and is a statement level counter.*/
		if (trx->n_autoinc_rows > 0) {
			--trx->n_autoinc_rows;
		}
osku's avatar
osku committed
3529

3530
		/* Get the value that MySQL attempted to store in the table.*/
3531
		auto_inc = table->next_number_field->val_int();
osku's avatar
osku committed
3532

3533 3534
		switch (error) {
		case DB_DUPLICATE_KEY:
osku's avatar
osku committed
3535

3536 3537 3538 3539
			/* A REPLACE command and LOAD DATA INFILE REPLACE
			handle a duplicate key error themselves, but we
			must update the autoinc counter if we are performing
			those statements. */
osku's avatar
osku committed
3540

3541 3542 3543 3544
			switch (sql_command) {
			case SQLCOM_LOAD:
				if ((trx->duplicates
				    & (TRX_DUP_IGNORE | TRX_DUP_REPLACE))) {
osku's avatar
osku committed
3545

3546 3547 3548
					goto set_max_autoinc;
				}
				break;
osku's avatar
osku committed
3549

3550 3551 3552 3553 3554
			case SQLCOM_REPLACE:
			case SQLCOM_INSERT_SELECT:
			case SQLCOM_REPLACE_SELECT:
				goto set_max_autoinc;
				break;
osku's avatar
osku committed
3555

3556 3557 3558 3559 3560 3561 3562 3563 3564 3565 3566 3567 3568 3569
			default:
				break;
			}

			break;

		case DB_SUCCESS:
			/* If the actual value inserted is greater than
			the upper limit of the interval, then we try and
			update the table upper limit. Note: last_value
			will be 0 if get_auto_increment() was not called.*/

			if (auto_inc > prebuilt->last_value) {
set_max_autoinc:
3570
				ut_a(prebuilt->table->autoinc_increment > 0);
3571 3572 3573 3574 3575 3576 3577 3578 3579 3580 3581 3582 3583

				ulonglong	have;
				ulonglong	need;

				/* Check for overflow conditions: never add
				more than the distance that is left to the
				largest ulonglong value. */
				need = prebuilt->table->autoinc_increment;
				have = ~0x0ULL - auto_inc;

				if (have < need) {
					need = have;
				}

				auto_inc += need;
3584

3585 3586 3587
				err = innobase_set_max_autoinc(auto_inc);

				if (err != DB_SUCCESS) {
marko's avatar
marko committed
3588
					error = (int) err;
3589
				}
3590 3591
			}
			break;
3592 3593
		}
	}
osku's avatar
osku committed
3594 3595 3596 3597 3598 3599 3600 3601

	innodb_srv_conc_exit_innodb(prebuilt->trx);

	error = convert_error_code_to_mysql(error, user_thd);

func_exit:
	innobase_active_small();

3602
	DBUG_RETURN(error);
osku's avatar
osku committed
3603 3604 3605 3606 3607 3608 3609 3610 3611 3612 3613
}

/**************************************************************************
Checks which fields have changed in a row and stores information
of them to an update vector. For every MySQL field the old and the new
value are compared: BLOB references and the length bytes of a true VARCHAR
are resolved first so that the payload is compared, and an SQL NULL is
represented by the length UNIV_SQL_NULL. Each changed field is converted
to the InnoDB format into upd_buff and appended to uvect->fields; on
return uvect->n_fields is the number of changed fields.
The function always returns 0. After the loop ut_a() checks that the
conversions did not advance past upd_buff + buff_len. The parameter thd
is not used in the function body. */
static
int
calc_row_difference(
/*================*/
					/* out: error number or 0 */
	upd_t*		uvect,		/* in/out: update vector */
3614 3615
	uchar*		old_row,	/* in: old row in MySQL format */
	uchar*		new_row,	/* in: new row in MySQL format */
osku's avatar
osku committed
3616 3617
	struct st_table* table,		/* in: table in MySQL data
					dictionary */
3618
	uchar*		upd_buff,	/* in: buffer to use */
osku's avatar
osku committed
3619 3620 3621 3622
	ulint		buff_len,	/* in: buffer length */
	row_prebuilt_t*	prebuilt,	/* in: InnoDB prebuilt struct */
	THD*		thd)		/* in: user thread */
{
3623
	uchar*		original_upd_buff = upd_buff;
osku's avatar
osku committed
3624 3625 3626 3627 3628 3629 3630
	Field*		field;
	enum_field_types field_mysql_type;
	uint		n_fields;
	ulint		o_len;
	ulint		n_len;
	ulint		col_pack_len;
	byte*		new_mysql_row_col;
3631 3632 3633
	byte*		o_ptr;
	byte*		n_ptr;
	byte*		buf;
osku's avatar
osku committed
3634 3635 3636 3637
	upd_field_t*	ufield;
	ulint		col_type;
	ulint		n_changed = 0;
	dfield_t	dfield;
marko's avatar
marko committed
3638
	dict_index_t*	clust_index;
osku's avatar
osku committed
3639 3640 3641
	uint		i;

	n_fields = table->s->fields;
marko's avatar
marko committed
3642
	clust_index = dict_table_get_first_index_noninline(prebuilt->table);
osku's avatar
osku committed
3643 3644 3645 3646 3647 3648 3649 3650 3651

	/* We use upd_buff to convert changed fields */
	buf = (byte*) upd_buff;

	for (i = 0; i < n_fields; i++) {
		field = table->field[i];

		o_ptr = (byte*) old_row + get_field_offset(table, field);
		n_ptr = (byte*) new_row + get_field_offset(table, field);
3652

osku's avatar
osku committed
3653 3654 3655 3656 3657 3658 3659 3660 3661
		/* Save the start of the new column value and its packed
		length in new_mysql_row_col and col_pack_len: n_ptr and
		n_len may be changed below, but the conversion to the InnoDB
		format needs the original MySQL column image. */

		new_mysql_row_col = n_ptr;
		col_pack_len = field->pack_length();

		o_len = col_pack_len;
		n_len = col_pack_len;

		/* We use o_ptr and n_ptr to dig up the actual data for
		comparison. */
osku's avatar
osku committed
3663 3664

		field_mysql_type = field->type();
3665

3666
		col_type = prebuilt->table->cols[i].mtype;
osku's avatar
osku committed
3667 3668 3669 3670 3671 3672 3673 3674 3675 3676 3677 3678 3679 3680 3681 3682

		switch (col_type) {

		case DATA_BLOB:
			o_ptr = row_mysql_read_blob_ref(&o_len, o_ptr, o_len);
			n_ptr = row_mysql_read_blob_ref(&n_len, n_ptr, n_len);

			break;

		case DATA_VARCHAR:
		case DATA_BINARY:
		case DATA_VARMYSQL:
			if (field_mysql_type == MYSQL_TYPE_VARCHAR) {
				/* This is a >= 5.0.3 type true VARCHAR where
				the real payload data length is stored in
				1 or 2 bytes */
3683

osku's avatar
osku committed
3684
				o_ptr = row_mysql_read_true_varchar(
3685 3686 3687 3688
					&o_len, o_ptr,
					(ulint)
					(((Field_varstring*)field)->length_bytes));

osku's avatar
osku committed
3689
				n_ptr = row_mysql_read_true_varchar(
3690 3691 3692
					&n_len, n_ptr,
					(ulint)
					(((Field_varstring*)field)->length_bytes));
osku's avatar
osku committed
3693 3694 3695 3696 3697 3698 3699 3700 3701 3702 3703 3704 3705 3706 3707 3708 3709 3710 3711 3712 3713 3714 3715 3716
			}

			break;
		default:
			;
		}

		/* For a nullable field an SQL NULL value is signalled by
		the length UNIV_SQL_NULL. */
		if (field->null_ptr) {
			if (field_in_record_is_null(table, field,
							(char*) old_row)) {
				o_len = UNIV_SQL_NULL;
			}

			if (field_in_record_is_null(table, field,
							(char*) new_row)) {
				n_len = UNIV_SQL_NULL;
			}
		}

		/* The bytes are compared only when the lengths agree and
		the values are not SQL NULL. */
		if (o_len != n_len || (o_len != UNIV_SQL_NULL &&
					0 != memcmp(o_ptr, n_ptr, o_len))) {
			/* The field has changed */

			ufield = uvect->fields + n_changed;
3717

osku's avatar
osku committed
3718 3719 3720
			/* Let us use a dummy dfield to make the conversion
			from the MySQL column format to the InnoDB format */

3721 3722
			dict_col_copy_type_noninline(prebuilt->table->cols + i,
						     &dfield.type);
osku's avatar
osku committed
3723 3724 3725

			if (n_len != UNIV_SQL_NULL) {
				buf = row_mysql_store_col_in_innobase_format(
3726 3727 3728 3729 3730
					&dfield,
					(byte*)buf,
					TRUE,
					new_mysql_row_col,
					col_pack_len,
3731 3732
					dict_table_is_comp_noninline(
							prebuilt->table));
osku's avatar
osku committed
3733 3734 3735 3736 3737 3738 3739 3740
				ufield->new_val.data = dfield.data;
				ufield->new_val.len = dfield.len;
			} else {
				ufield->new_val.data = NULL;
				ufield->new_val.len = UNIV_SQL_NULL;
			}

			ufield->exp = NULL;
3741 3742
			ufield->field_no = dict_col_get_clust_pos_noninline(
				&prebuilt->table->cols[i], clust_index);
osku's avatar
osku committed
3743 3744 3745 3746 3747 3748 3749 3750 3751 3752 3753 3754 3755 3756 3757 3758 3759 3760 3761 3762 3763 3764 3765 3766
			n_changed++;
		}
	}

	uvect->n_fields = n_changed;
	uvect->info_bits = 0;

	/* This check runs only after all the conversions have been done. */
	ut_a(buf <= (byte*)original_upd_buff + buff_len);

	return(0);
}

/**************************************************************************
Updates a row given as a parameter to a new value. Note that we are given
whole rows, not just the fields which are updated: this incurs some
overhead for CPU when we check which fields are actually updated.
TODO: currently InnoDB does not prevent the 'Halloween problem':
in a searched update a single row can get updated several times
if its index columns are updated! */

int
ha_innobase::update_row(
/*====================*/
					/* out: error number or 0 */
3767 3768
	const uchar*	old_row,	/* in: old row in MySQL format */
	uchar*		new_row)	/* in: new row in MySQL format */
osku's avatar
osku committed
3769 3770 3771
{
	upd_t*		uvect;
	int		error = 0;
3772
	trx_t*		trx = thd_to_trx(user_thd);
osku's avatar
osku committed
3773 3774 3775

	DBUG_ENTER("ha_innobase::update_row");

3776
	ut_a(prebuilt->trx == trx);
osku's avatar
osku committed
3777

3778 3779
	ha_statistic_increment(&SSV::ha_update_count);

3780 3781
	if (table->timestamp_field_type & TIMESTAMP_AUTO_SET_ON_UPDATE)
		table->timestamp_field->set_time();
osku's avatar
osku committed
3782 3783 3784 3785 3786 3787 3788 3789 3790 3791

	if (prebuilt->upd_node) {
		uvect = prebuilt->upd_node->update;
	} else {
		uvect = row_get_prebuilt_update_vector(prebuilt);
	}

	/* Build an update vector from the modified fields in the rows
	(uses upd_buff of the handle) */

3792
	calc_row_difference(uvect, (uchar*) old_row, new_row, table,
osku's avatar
osku committed
3793 3794 3795 3796 3797 3798 3799 3800
			upd_buff, (ulint)upd_and_key_val_buff_len,
			prebuilt, user_thd);

	/* This is not a delete */
	prebuilt->upd_node->is_delete = FALSE;

	assert(prebuilt->template_type == ROW_MYSQL_WHOLE_ROW);

3801
	innodb_srv_conc_enter_innodb(trx);
osku's avatar
osku committed
3802 3803 3804

	error = row_update_for_mysql((byte*) old_row, prebuilt);

3805 3806 3807 3808 3809 3810 3811 3812 3813 3814 3815 3816 3817 3818 3819 3820 3821 3822 3823 3824 3825 3826
	/* We need to do some special AUTOINC handling for the following case:

	INSERT INTO t (c1,c2) VALUES(x,y) ON DUPLICATE KEY UPDATE ...

	We need to use the AUTOINC counter that was actually used by
	MySQL in the UPDATE statement, which can be different from the
	value used in the INSERT statement.*/

	if (error == DB_SUCCESS
	    && table->next_number_field
	    && new_row == table->record[0]
	    && thd_sql_command(user_thd) == SQLCOM_INSERT
	    && (trx->duplicates & (TRX_DUP_IGNORE | TRX_DUP_REPLACE))
		== TRX_DUP_IGNORE)  {

		longlong	auto_inc;

		auto_inc = table->next_number_field->val_int();

		if (auto_inc != 0) {
			auto_inc += prebuilt->table->autoinc_increment;

3827
			error = innobase_set_max_autoinc(auto_inc);
3828 3829 3830
		}
	}

3831
	innodb_srv_conc_exit_innodb(trx);
osku's avatar
osku committed
3832 3833 3834

	error = convert_error_code_to_mysql(error, user_thd);

vasil's avatar
vasil committed
3835 3836 3837 3838 3839 3840 3841 3842 3843 3844
	if (error == 0 /* success */
	    && uvect->n_fields == 0 /* no columns were updated */) {

		/* This is the same as success, but instructs
		MySQL that the row is not really updated and it
		should not increase the count of updated rows.
		This is fix for http://bugs.mysql.com/29157 */
		error = HA_ERR_RECORD_IS_THE_SAME;
	}

osku's avatar
osku committed
3845 3846 3847 3848 3849 3850 3851 3852 3853 3854 3855 3856 3857 3858
	/* Tell InnoDB server that there might be work for
	utility threads: */

	innobase_active_small();

	DBUG_RETURN(error);
}

/**************************************************************************
Deletes a row given as the parameter. */

int
ha_innobase::delete_row(
/*====================*/
3859 3860
				/* out: error number or 0 */
	const uchar*	record)	/* in: a row in MySQL format */
osku's avatar
osku committed
3861 3862
{
	int		error = 0;
3863
	trx_t*		trx = thd_to_trx(user_thd);
osku's avatar
osku committed
3864 3865 3866

	DBUG_ENTER("ha_innobase::delete_row");

3867
	ut_a(prebuilt->trx == trx);
osku's avatar
osku committed
3868

3869 3870
	ha_statistic_increment(&SSV::ha_delete_count);

3871 3872 3873 3874
	/* Only if the table has an AUTOINC column */
	if (table->found_next_number_field && record == table->record[0]) {
		ulonglong	dummy = 0;

3875 3876 3877 3878
		/* First check whether the AUTOINC sub-system has been
		initialized using the AUTOINC mutex. If not then we
		do it the "proper" way, by acquiring the heavier locks. */
		dict_table_autoinc_lock(prebuilt->table);
3879

3880 3881 3882 3883 3884 3885 3886 3887 3888 3889 3890
		if (!prebuilt->table->autoinc_inited) {
			dict_table_autoinc_unlock(prebuilt->table);

			error = innobase_get_auto_increment(&dummy);

			if (error == DB_SUCCESS) {
				dict_table_autoinc_unlock(prebuilt->table);
			} else {
				goto error_exit;
			}
		} else  {
3891 3892 3893 3894
			dict_table_autoinc_unlock(prebuilt->table);
		}
	}

osku's avatar
osku committed
3895 3896 3897 3898 3899 3900 3901 3902
	if (!prebuilt->upd_node) {
		row_get_prebuilt_update_vector(prebuilt);
	}

	/* This is a delete */

	prebuilt->upd_node->is_delete = TRUE;

3903
	innodb_srv_conc_enter_innodb(trx);
osku's avatar
osku committed
3904 3905 3906

	error = row_update_for_mysql((byte*) record, prebuilt);

3907
	innodb_srv_conc_exit_innodb(trx);
osku's avatar
osku committed
3908

3909
error_exit:
osku's avatar
osku committed
3910 3911 3912 3913 3914 3915 3916 3917 3918 3919 3920
	error = convert_error_code_to_mysql(error, user_thd);

	/* Tell the InnoDB server that there might be work for
	utility threads: */

	innobase_active_small();

	DBUG_RETURN(error);
}

/**************************************************************************
3921
Removes a new lock set on a row, if it was not read optimistically. This can
3922 3923
be called after a row has been read in the processing of an UPDATE or a DELETE
query, if the option innodb_locks_unsafe_for_binlog is set. */
osku's avatar
osku committed
3924 3925 3926 3927 3928 3929 3930

void
ha_innobase::unlock_row(void)
/*=========================*/
{
	DBUG_ENTER("ha_innobase::unlock_row");

3931 3932 3933 3934 3935 3936 3937
	/* Consistent read does not take any locks, thus there is
	nothing to unlock. */

	if (prebuilt->select_lock_type == LOCK_NONE) {
		DBUG_VOID_RETURN;
	}

3938 3939
	switch (prebuilt->row_read_type) {
	case ROW_READ_WITH_LOCKS:
3940 3941
		if (!srv_locks_unsafe_for_binlog
		|| prebuilt->trx->isolation_level == TRX_ISO_READ_COMMITTED) {
3942 3943 3944 3945
			break;
		}
		/* fall through */
	case ROW_READ_TRY_SEMI_CONSISTENT:
osku's avatar
osku committed
3946
		row_unlock_for_mysql(prebuilt, FALSE);
3947 3948 3949 3950 3951 3952 3953 3954 3955 3956 3957 3958 3959 3960 3961 3962 3963 3964 3965 3966 3967 3968
		break;
	case ROW_READ_DID_SEMI_CONSISTENT:
		prebuilt->row_read_type = ROW_READ_TRY_SEMI_CONSISTENT;
		break;
	}

	DBUG_VOID_RETURN;
}

/* Tells whether the row read type of the handle is currently
ROW_READ_DID_SEMI_CONSISTENT. See handler.h and row0mysql.h for docs on
this function. */
bool
ha_innobase::was_semi_consistent_read(void)
/*=======================================*/
{
	if (prebuilt->row_read_type == ROW_READ_DID_SEMI_CONSISTENT) {

		return(true);
	}

	return(false);
}

/* See handler.h and row0mysql.h for docs on this function. */
void
ha_innobase::try_semi_consistent_read(bool yes)
/*===========================================*/
{
3969
	ut_a(prebuilt->trx == thd_to_trx(ha_thd()));
3970

3971 3972 3973 3974 3975
	/* Row read type is set to semi consistent read if this was
	requested by the MySQL and either innodb_locks_unsafe_for_binlog
	option is used or this session is using READ COMMITTED isolation
	level. */

3976 3977
	if (yes
	    && (srv_locks_unsafe_for_binlog
3978
		|| prebuilt->trx->isolation_level == TRX_ISO_READ_COMMITTED)) {
3979 3980 3981
		prebuilt->row_read_type = ROW_READ_TRY_SEMI_CONSISTENT;
	} else {
		prebuilt->row_read_type = ROW_READ_WITH_LOCKS;
osku's avatar
osku committed
3982 3983 3984 3985 3986 3987 3988 3989 3990 3991
	}
}

/**********************************************************************
Initializes a handle to use an index. */

int
ha_innobase::index_init(
/*====================*/
			/* out: 0 or error number */
3992 3993
	uint	keynr,	/* in: key (index) number */
	bool sorted)	/* in: 1 if result MUST be sorted according to index */
osku's avatar
osku committed
3994
{
3995 3996
	int	error	= 0;
	DBUG_ENTER("index_init");
osku's avatar
osku committed
3997 3998 3999

	error = change_active_index(keynr);

4000
	DBUG_RETURN(error);
osku's avatar
osku committed
4001 4002 4003 4004 4005 4006 4007 4008 4009
}

/**********************************************************************
Ends the use of an index: sets active_index to MAX_KEY. Always
returns 0. */

int
ha_innobase::index_end(void)
/*========================*/
{
	DBUG_ENTER("index_end");

	active_index = MAX_KEY;

	DBUG_RETURN(0);
}

/*************************************************************************
Maps a MySQL search mode flag to the InnoDB page cursor mode that
implements it. For a flag that InnoDB cannot serve a MySQL error is
raised with my_error() and PAGE_CUR_UNSUPP is returned. */
inline
ulint
convert_search_mode_to_innobase(
/*============================*/
	enum ha_rkey_function	find_flag)
{
	/* In MySQL-4.0 HA_READ_PREFIX and HA_READ_PREFIX_LAST always
	pass a complete-field prefix of a key value as the search
	tuple. I.e., it is not allowed that the last field would
	just contain n first bytes of the full field value.
	MySQL uses a 'padding' trick to convert LIKE 'abc%'
	type queries so that it can use as a search tuple
	a complete-field-prefix of a key value. Thus, the InnoDB
	search mode PAGE_CUR_LE_OR_EXTENDS is never used.
	TODO: when/if MySQL starts to use also partial-field
	prefixes, we have to deal with stripping of spaces
	and comparison of non-latin1 char type fields in
	innobase_mysql_cmp() to get PAGE_CUR_LE_OR_EXTENDS to
	work correctly. */

	switch (find_flag) {
	/* Position on the first record >= the key. HA_READ_KEY_EXACT does
	not require the index to be UNIQUE. */
	case HA_READ_KEY_EXACT:
	case HA_READ_KEY_OR_NEXT:
	case HA_READ_PREFIX:
		return(PAGE_CUR_GE);

	/* Position on the last record <= the key. */
	case HA_READ_KEY_OR_PREV:
	case HA_READ_PREFIX_LAST:
	case HA_READ_PREFIX_LAST_OR_PREV:
		return(PAGE_CUR_LE);

	case HA_READ_AFTER_KEY:
		return(PAGE_CUR_G);

	case HA_READ_BEFORE_KEY:
		return(PAGE_CUR_L);

	/* The MBR (spatial) search modes are rejected. */
	case HA_READ_MBR_CONTAIN:
	case HA_READ_MBR_INTERSECT:
	case HA_READ_MBR_WITHIN:
	case HA_READ_MBR_DISJOINT:
	case HA_READ_MBR_EQUAL:
		my_error(ER_TABLE_CANT_HANDLE_SPKEYS, MYF(0));

		return(PAGE_CUR_UNSUPP);

	/* do not use "default:" in order to produce a gcc warning:
	enumeration value '...' not handled in switch
	(if -Wswitch or -Wall is used) */
	}

	/* A flag value that is not listed above. */
	my_error(ER_CHECK_NOT_IMPLEMENTED, MYF(0), "this functionality");

	return(PAGE_CUR_UNSUPP);
}

/*
   BACKGROUND INFO: HOW A SELECT SQL QUERY IS EXECUTED
   ---------------------------------------------------
The following does not cover all the details, but explains how we determine
the start of a new SQL statement, and what is associated with it.

For each table in the database the MySQL interpreter may have several
table handle instances in use, also in a single SQL query. For each table
handle instance there is an InnoDB  'prebuilt' struct which contains most
of the InnoDB data associated with this table handle instance.

  A) if the user has not explicitly set any MySQL table level locks:

  1) MySQL calls ::external_lock to set an 'intention' table level lock on
the table of the handle instance. There we set
prebuilt->sql_stat_start = TRUE. The flag sql_stat_start should be set
true if we are taking this table handle instance to use in a new SQL
statement issued by the user. We also increment trx->n_mysql_tables_in_use.

  2) If prebuilt->sql_stat_start == TRUE we 'pre-compile' the MySQL search
instructions to prebuilt->mysql_template of the table handle instance in
::index_read. The template is used to save CPU time in large joins.

  3) In row_search_for_mysql, if prebuilt->sql_stat_start is true, we
allocate a new consistent read view for the trx if it does not yet have one,
or in the case of a locking read, set an InnoDB 'intention' table level
lock on the table.

  4) We do the SELECT. MySQL may repeatedly call ::index_read for the
same table handle instance, if it is a join.

  5) When the SELECT ends, MySQL removes its intention table level locks
in ::external_lock. When trx->n_mysql_tables_in_use drops to zero,
 (a) we execute a COMMIT there if the autocommit is on,
 (b) we also release possible 'SQL statement level resources' InnoDB may
have for this SQL statement. The MySQL interpreter does NOT execute
autocommit for pure read transactions, though it should. That is why the
table handler in that case has to execute the COMMIT in ::external_lock.

  B) If the user has explicitly set MySQL table level locks, then MySQL
does NOT call ::external_lock at the start of the statement. To determine
when we are at the start of a new SQL statement we at the start of
::index_read also compare the query id to the latest query id where the
table handle instance was used. If it has changed, we know we are at the
start of a new SQL statement. Since the query id can theoretically
wrap around, we use this test only as a secondary way of determining the
start of a new SQL statement. */


/**************************************************************************
Positions an index cursor to the index specified in the handle. Fetches the
row if any. */

int
ha_innobase::index_read(
/*====================*/
					/* out: 0, HA_ERR_KEY_NOT_FOUND,
					or error number */
4131
	uchar*		buf,		/* in/out: buffer for the returned
osku's avatar
osku committed
4132
					row */
4133
	const uchar*	key_ptr,	/* in: key value; if this is NULL
osku's avatar
osku committed
4134 4135 4136 4137 4138 4139 4140 4141 4142 4143 4144 4145 4146
					we position the cursor at the
					start or end of index; this can
					also contain an InnoDB row id, in
					which case key_len is the InnoDB
					row id length; the key value can
					also be a prefix of a full key value,
					and the last column can be a prefix
					of a full column */
	uint			key_len,/* in: key value length */
	enum ha_rkey_function find_flag)/* in: search flags from my_base.h */
{
	ulint		mode;
	dict_index_t*	index;
4147 4148
	ulint		match_mode	= 0;
	int		error;
osku's avatar
osku committed
4149 4150
	ulint		ret;

4151
	DBUG_ENTER("index_read");
osku's avatar
osku committed
4152

4153
	ut_a(prebuilt->trx == thd_to_trx(user_thd));
osku's avatar
osku committed
4154

4155
	ha_statistic_increment(&SSV::ha_read_key_count);
osku's avatar
osku committed
4156 4157 4158 4159

	index = prebuilt->index;

	/* Note that if the index for which the search template is built is not
4160
	necessarily prebuilt->index, but can also be the clustered index */
osku's avatar
osku committed
4161 4162 4163 4164 4165 4166 4167

	if (prebuilt->sql_stat_start) {
		build_template(prebuilt, user_thd, table,
							ROW_MYSQL_REC_FIELDS);
	}

	if (key_ptr) {
4168
		/* Convert the search key value to InnoDB format into
osku's avatar
osku committed
4169 4170 4171 4172 4173 4174 4175 4176 4177 4178 4179 4180
		prebuilt->search_tuple */

		row_sel_convert_mysql_key_to_innobase(prebuilt->search_tuple,
					(byte*) key_val_buff,
					(ulint)upd_and_key_val_buff_len,
					index,
					(byte*) key_ptr,
					(ulint) key_len, prebuilt->trx);
	} else {
		/* We position the cursor to the last or the first entry
		in the index */

4181
		dtuple_set_n_fields(prebuilt->search_tuple, 0);
osku's avatar
osku committed
4182 4183 4184 4185 4186 4187 4188 4189 4190 4191 4192 4193 4194 4195 4196 4197
	}

	mode = convert_search_mode_to_innobase(find_flag);

	match_mode = 0;

	if (find_flag == HA_READ_KEY_EXACT) {
		match_mode = ROW_SEL_EXACT;

	} else if (find_flag == HA_READ_PREFIX
				|| find_flag == HA_READ_PREFIX_LAST) {
		match_mode = ROW_SEL_EXACT_PREFIX;
	}

	last_match_mode = (uint) match_mode;

4198
	if (mode != PAGE_CUR_UNSUPP) {
osku's avatar
osku committed
4199

4200
		innodb_srv_conc_enter_innodb(prebuilt->trx);
osku's avatar
osku committed
4201

4202 4203 4204 4205 4206 4207 4208 4209
		ret = row_search_for_mysql((byte*) buf, mode, prebuilt,
					   match_mode, 0);

		innodb_srv_conc_exit_innodb(prebuilt->trx);
	} else {

		ret = DB_UNSUPPORTED;
	}
osku's avatar
osku committed
4210 4211 4212 4213 4214 4215 4216 4217 4218 4219 4220 4221 4222 4223 4224 4225 4226 4227 4228 4229 4230 4231 4232 4233 4234 4235 4236

	if (ret == DB_SUCCESS) {
		error = 0;
		table->status = 0;

	} else if (ret == DB_RECORD_NOT_FOUND) {
		error = HA_ERR_KEY_NOT_FOUND;
		table->status = STATUS_NOT_FOUND;

	} else if (ret == DB_END_OF_INDEX) {
		error = HA_ERR_KEY_NOT_FOUND;
		table->status = STATUS_NOT_FOUND;
	} else {
		error = convert_error_code_to_mysql((int) ret, user_thd);
		table->status = STATUS_NOT_FOUND;
	}

	DBUG_RETURN(error);
}

/***********************************************************************
The following functions works like index_read, but it find the last
row with the current key value or prefix. */

int
ha_innobase::index_read_last(
/*=========================*/
4237 4238 4239 4240 4241 4242 4243
				/* out: 0, HA_ERR_KEY_NOT_FOUND, or an
				error code */
	uchar*		buf,	/* out: fetched row */
	const uchar*	key_ptr,/* in: key value, or a prefix of a full
				key value */
	uint		key_len)/* in: length of the key val or prefix
				in bytes */
osku's avatar
osku committed
4244
{
4245
	return(index_read(buf, key_ptr, key_len, HA_READ_PREFIX_LAST));
osku's avatar
osku committed
4246 4247 4248
}

/************************************************************************
4249
Get the index for a handle. Does not change active index.*/
osku's avatar
osku committed
4250

4251 4252 4253 4254 4255 4256 4257
dict_index_t*
ha_innobase::innobase_get_index(
/*============================*/
				/* out: NULL or index instance. */
	uint		keynr)	/* in: use this index; MAX_KEY means always
				clustered index, even if it was internally
				generated by InnoDB */
osku's avatar
osku committed
4258
{
4259 4260 4261 4262
	KEY*		key = 0;
	dict_index_t*	index = 0;

	DBUG_ENTER("innobase_get_index");
4263
	ha_statistic_increment(&SSV::ha_read_key_count);
osku's avatar
osku committed
4264

4265
	ut_ad(user_thd == ha_thd());
4266
	ut_a(prebuilt->trx == thd_to_trx(user_thd));
osku's avatar
osku committed
4267 4268

	if (keynr != MAX_KEY && table->s->keys > 0) {
4269
		key = table->key_info + keynr;
osku's avatar
osku committed
4270

4271
		index = dict_table_get_index_noninline(
4272 4273
			prebuilt->table, key->name);
	} else {
4274
		index = dict_table_get_first_index_noninline(prebuilt->table);
osku's avatar
osku committed
4275 4276
	}

4277
	if (!index) {
4278 4279 4280 4281 4282
		sql_print_error(
			"Innodb could not find key n:o %u with name %s "
			"from dict cache for table %s",
			keynr, key ? key->name : "NULL",
			prebuilt->table->name);
4283 4284 4285 4286 4287 4288 4289 4290 4291 4292 4293 4294 4295 4296 4297 4298 4299 4300 4301 4302 4303 4304
	}

	DBUG_RETURN(index);
}

/************************************************************************
Changes the active index of a handle. Sets active_index and
prebuilt->index, resizes and retypes prebuilt->search_tuple to match the
new index, and rebuilds the row template. */

int
ha_innobase::change_active_index(
/*=============================*/
			/* out: 0 or error code */
	uint	keynr)	/* in: use this index; MAX_KEY means always clustered
			index, even if it was internally generated by
			InnoDB */
{
	DBUG_ENTER("change_active_index");

	ut_ad(user_thd == ha_thd());
	ut_a(prebuilt->trx == thd_to_trx(user_thd));

	active_index = keynr;

	prebuilt->index = innobase_get_index(keynr);

	if (!prebuilt->index) {
		/* Note that active_index has already been set to keynr
		and prebuilt->index is NULL when we return here. */
		DBUG_RETURN(1);
	}

	assert(prebuilt->search_tuple != 0);

	dtuple_set_n_fields(prebuilt->search_tuple, prebuilt->index->n_fields);

	dict_index_copy_types(prebuilt->search_tuple, prebuilt->index,
			prebuilt->index->n_fields);

	/* MySQL changes the active index for a handle also during some
	queries, for example SELECT MAX(a), SUM(a) first retrieves the MAX()
	and then calculates the sum. Previously we played safe and used
	the flag ROW_MYSQL_WHOLE_ROW below, but that caused unnecessary
	copying. Starting from MySQL-4.1 we use a more efficient flag here. */

	build_template(prebuilt, user_thd, table, ROW_MYSQL_REC_FIELDS);

	DBUG_RETURN(0);
}

/**************************************************************************
Positions an index cursor to the index specified in keynr. Fetches the
row if any. */
/* ??? This is only used to read whole keys ??? */

int
ha_innobase::index_read_idx(
/*========================*/
					/* out: error number or 0 */
4339
	uchar*		buf,		/* in/out: buffer for the returned
osku's avatar
osku committed
4340
					row */
4341
	uint		keynr,		/* in: use this index */
4342
	const uchar*	key,		/* in: key value; if this is NULL
osku's avatar
osku committed
4343 4344 4345 4346 4347 4348 4349 4350 4351 4352 4353 4354 4355 4356 4357 4358 4359 4360 4361 4362 4363 4364
					we position the cursor at the
					start or end of index */
	uint		key_len,	/* in: key value length */
	enum ha_rkey_function find_flag)/* in: search flags from my_base.h */
{
	if (change_active_index(keynr)) {

		return(1);
	}

	return(index_read(buf, key, key_len, find_flag));
}

/***************************************************************************
Reads the next or previous row from a cursor, which must have previously been
positioned using index_read. */

int
ha_innobase::general_fetch(
/*=======================*/
				/* out: 0, HA_ERR_END_OF_FILE, or error
				number */
4365
	uchar*	buf,		/* in/out: buffer for next row in MySQL
osku's avatar
osku committed
4366
				format */
4367
	uint	direction,	/* in: ROW_SEL_NEXT or ROW_SEL_PREV */
osku's avatar
osku committed
4368 4369 4370 4371 4372 4373 4374 4375
	uint	match_mode)	/* in: 0, ROW_SEL_EXACT, or
				ROW_SEL_EXACT_PREFIX */
{
	ulint		ret;
	int		error	= 0;

	DBUG_ENTER("general_fetch");

4376
	ut_a(prebuilt->trx == thd_to_trx(user_thd));
osku's avatar
osku committed
4377 4378 4379 4380 4381 4382 4383 4384 4385 4386 4387 4388 4389 4390 4391 4392 4393 4394 4395 4396 4397 4398 4399 4400 4401 4402 4403 4404 4405 4406 4407 4408 4409 4410 4411

	innodb_srv_conc_enter_innodb(prebuilt->trx);

	ret = row_search_for_mysql((byte*)buf, 0, prebuilt, match_mode,
								direction);
	innodb_srv_conc_exit_innodb(prebuilt->trx);

	if (ret == DB_SUCCESS) {
		error = 0;
		table->status = 0;

	} else if (ret == DB_RECORD_NOT_FOUND) {
		error = HA_ERR_END_OF_FILE;
		table->status = STATUS_NOT_FOUND;

	} else if (ret == DB_END_OF_INDEX) {
		error = HA_ERR_END_OF_FILE;
		table->status = STATUS_NOT_FOUND;
	} else {
		error = convert_error_code_to_mysql((int) ret, user_thd);
		table->status = STATUS_NOT_FOUND;
	}

	DBUG_RETURN(error);
}

/***************************************************************************
Reads the next row from a cursor, which must have previously been
positioned using index_read. */

int
ha_innobase::index_next(
/*====================*/
				/* out: 0, HA_ERR_END_OF_FILE, or error
				number */
4412
	uchar*		buf)	/* in/out: buffer for next row in MySQL
osku's avatar
osku committed
4413 4414
				format */
{
4415
	ha_statistic_increment(&SSV::ha_read_next_count);
osku's avatar
osku committed
4416 4417 4418 4419 4420 4421 4422 4423 4424 4425 4426 4427

	return(general_fetch(buf, ROW_SEL_NEXT, 0));
}

/***********************************************************************
Reads the next row matching to the key value given as the parameter. */

int
ha_innobase::index_next_same(
/*=========================*/
				/* out: 0, HA_ERR_END_OF_FILE, or error
				number */
4428 4429
	uchar*		buf,	/* in/out: buffer for the row */
	const uchar*	key,	/* in: key value */
4430
	uint		keylen)	/* in: key value length */
osku's avatar
osku committed
4431
{
4432
	ha_statistic_increment(&SSV::ha_read_next_count);
osku's avatar
osku committed
4433 4434 4435 4436 4437 4438 4439 4440 4441 4442 4443

	return(general_fetch(buf, ROW_SEL_NEXT, last_match_mode));
}

/***************************************************************************
Reads the previous row from a cursor, which must have previously been
positioned using index_read. */

int
ha_innobase::index_prev(
/*====================*/
4444 4445
			/* out: 0, HA_ERR_END_OF_FILE, or error number */
	uchar*	buf)	/* in/out: buffer for previous row in MySQL format */
osku's avatar
osku committed
4446
{
4447
	ha_statistic_increment(&SSV::ha_read_prev_count);
4448

osku's avatar
osku committed
4449 4450 4451 4452 4453 4454 4455 4456 4457 4458
	return(general_fetch(buf, ROW_SEL_PREV, 0));
}

/************************************************************************
Positions a cursor on the first record in an index and reads the
corresponding row to buf. */

int
ha_innobase::index_first(
/*=====================*/
4459 4460
			/* out: 0, HA_ERR_END_OF_FILE, or error code */
	uchar*	buf)	/* in/out: buffer for the row */
osku's avatar
osku committed
4461 4462 4463
{
	int	error;

4464
	DBUG_ENTER("index_first");
4465
	ha_statistic_increment(&SSV::ha_read_first_count);
osku's avatar
osku committed
4466

4467
	error = index_read(buf, NULL, 0, HA_READ_AFTER_KEY);
osku's avatar
osku committed
4468

4469
	/* MySQL does not seem to allow this to return HA_ERR_KEY_NOT_FOUND */
osku's avatar
osku committed
4470

4471 4472 4473
	if (error == HA_ERR_KEY_NOT_FOUND) {
		error = HA_ERR_END_OF_FILE;
	}
osku's avatar
osku committed
4474

4475
	DBUG_RETURN(error);
osku's avatar
osku committed
4476 4477 4478 4479 4480 4481 4482 4483 4484
}

/************************************************************************
Positions a cursor on the last record in an index and reads the
corresponding row to buf. */

int
ha_innobase::index_last(
/*====================*/
4485 4486
			/* out: 0, HA_ERR_END_OF_FILE, or error code */
	uchar*	buf)	/* in/out: buffer for the row */
osku's avatar
osku committed
4487 4488 4489
{
	int	error;

4490
	DBUG_ENTER("index_last");
4491
	ha_statistic_increment(&SSV::ha_read_last_count);
osku's avatar
osku committed
4492

4493
	error = index_read(buf, NULL, 0, HA_READ_BEFORE_KEY);
osku's avatar
osku committed
4494

4495
	/* MySQL does not seem to allow this to return HA_ERR_KEY_NOT_FOUND */
osku's avatar
osku committed
4496

4497 4498 4499
	if (error == HA_ERR_KEY_NOT_FOUND) {
		error = HA_ERR_END_OF_FILE;
	}
osku's avatar
osku committed
4500

4501
	DBUG_RETURN(error);
osku's avatar
osku committed
4502 4503 4504 4505 4506 4507 4508 4509 4510 4511 4512 4513 4514 4515 4516 4517 4518 4519 4520 4521 4522 4523
}

/********************************************************************
Initialize a table scan. */

int
ha_innobase::rnd_init(
/*==================*/
			/* out: 0 or error number */
	bool	scan)	/* in: ???????? */
{
	int	err;

	/* Store the active index value so that we can restore the original
	value after a scan */

	if (prebuilt->clust_index_was_generated) {
		err = change_active_index(MAX_KEY);
	} else {
		err = change_active_index(primary_key);
	}

4524 4525 4526 4527 4528 4529 4530
	/* Don't use semi-consistent read in random row reads (by position).
	This means we must disable semi_consistent_read if scan is false */

	if (!scan) {
		try_semi_consistent_read(0);
	}

4531
	start_of_scan = 1;
osku's avatar
osku committed
4532

4533
	return(err);
osku's avatar
osku committed
4534 4535 4536 4537 4538 4539 4540 4541 4542 4543 4544 4545 4546 4547 4548 4549 4550 4551 4552 4553 4554
}

/*********************************************************************
Ends a table scan by delegating to index_end(). */

int
ha_innobase::rnd_end(void)
/*======================*/
				/* out: 0 or error number, as returned
				by index_end() */
{
	int	err;

	err = index_end();

	return(err);
}

/*********************************************************************
Reads the next row in a table scan (also used to read the FIRST row
in a table scan). */

int
ha_innobase::rnd_next(
/*==================*/
			/* out: 0, HA_ERR_END_OF_FILE, or error number */
4555
	uchar*	buf)	/* in/out: returns the row in this buffer,
osku's avatar
osku committed
4556 4557 4558 4559
			in MySQL format */
{
	int	error;

4560
	DBUG_ENTER("rnd_next");
4561
	ha_statistic_increment(&SSV::ha_read_rnd_next_count);
osku's avatar
osku committed
4562

4563
	if (start_of_scan) {
osku's avatar
osku committed
4564 4565 4566 4567 4568 4569 4570 4571 4572
		error = index_first(buf);
		if (error == HA_ERR_KEY_NOT_FOUND) {
			error = HA_ERR_END_OF_FILE;
		}
		start_of_scan = 0;
	} else {
		error = general_fetch(buf, ROW_SEL_NEXT, 0);
	}

4573
	DBUG_RETURN(error);
osku's avatar
osku committed
4574 4575 4576 4577 4578 4579 4580 4581
}

/**************************************************************************
Fetches a row from the table based on a row reference. */

int
ha_innobase::rnd_pos(
/*=================*/
4582 4583 4584 4585 4586 4587
			/* out: 0, HA_ERR_KEY_NOT_FOUND, or error code */
	uchar*	buf,	/* in/out: buffer for the row */
	uchar*	pos)	/* in: primary key value of the row in the
			MySQL format, or the row id if the clustered
			index was internally generated by InnoDB; the
			length of data in pos has to be ref_length */
osku's avatar
osku committed
4588 4589 4590 4591
{
	int		error;
	uint		keynr	= active_index;
	DBUG_ENTER("rnd_pos");
marko's avatar
marko committed
4592
	DBUG_DUMP("key", pos, ref_length);
osku's avatar
osku committed
4593

4594
	ha_statistic_increment(&SSV::ha_read_rnd_count);
osku's avatar
osku committed
4595

4596
	ut_a(prebuilt->trx == thd_to_trx(ha_thd()));
osku's avatar
osku committed
4597 4598 4599 4600 4601 4602 4603 4604 4605 4606 4607 4608 4609

	if (prebuilt->clust_index_was_generated) {
		/* No primary key was defined for the table and we
		generated the clustered index from the row id: the
		row reference is the row id, not any key value
		that MySQL knows of */

		error = change_active_index(MAX_KEY);
	} else {
		error = change_active_index(primary_key);
	}

	if (error) {
marko's avatar
marko committed
4610
		DBUG_PRINT("error", ("Got error: %d", error));
osku's avatar
osku committed
4611 4612 4613 4614
		DBUG_RETURN(error);
	}

	/* Note that we assume the length of the row reference is fixed
4615
	for the table, and it is == ref_length */
osku's avatar
osku committed
4616 4617 4618 4619

	error = index_read(buf, pos, ref_length, HA_READ_KEY_EXACT);

	if (error) {
marko's avatar
marko committed
4620
		DBUG_PRINT("error", ("Got error: %d", error));
osku's avatar
osku committed
4621 4622 4623 4624
	}

	change_active_index(keynr);

4625
	DBUG_RETURN(error);
osku's avatar
osku committed
4626 4627 4628 4629 4630 4631 4632 4633 4634 4635 4636 4637 4638 4639
}

/*************************************************************************
Stores a reference to the current row to 'ref' field of the handle. Note
that in the case where we have generated the clustered index for the
table, the function parameter is illogical: we MUST ASSUME that 'record'
is the current 'position' of the handle, because if row ref is actually
the row id internally generated in InnoDB, then 'record' does not contain
it. We just guess that the row id must be for the record where the handle
was positioned the last time. */

void
ha_innobase::position(
/*==================*/
4640
	const uchar*	record)	/* in: row in MySQL format */
osku's avatar
osku committed
4641 4642 4643
{
	uint		len;

4644
	ut_a(prebuilt->trx == thd_to_trx(ha_thd()));
osku's avatar
osku committed
4645 4646 4647 4648 4649 4650 4651 4652 4653 4654 4655 4656 4657 4658 4659 4660 4661

	if (prebuilt->clust_index_was_generated) {
		/* No primary key was defined for the table and we
		generated the clustered index from row id: the
		row reference will be the row id, not any key value
		that MySQL knows of */

		len = DATA_ROW_ID_LEN;

		memcpy(ref, prebuilt->row_id, len);
	} else {
		len = store_key_val_for_row(primary_key, (char*)ref,
							 ref_length, record);
	}

	/* We assume that the 'ref' value len is always fixed for the same
	table. */
4662

osku's avatar
osku committed
4663 4664
	if (len != ref_length) {
	  sql_print_error("Stored ref len is %lu, but table ref len is %lu",
4665
			  (ulong) len, (ulong) ref_length);
osku's avatar
osku committed
4666 4667 4668
	}
}

4669 4670 4671
/*********************************************************************
If it's a DB_TOO_BIG_RECORD error then set a suitable message to
return to the client.*/
4672
inline
4673 4674
void
innodb_check_for_record_too_big_error(
4675
/*==================================*/
4676 4677
	ulint	comp,	/* in: ROW_FORMAT: nonzero=COMPACT, 0=REDUNDANT */
	int	error)	/* in: error code to check */
4678 4679
{
	if (error == (int)DB_TOO_BIG_RECORD) {
4680 4681
		ulint	max_row_size
			= page_get_free_space_of_empty_noninline(comp) / 2;
4682 4683 4684 4685 4686

		my_error(ER_TOO_BIG_ROWSIZE, MYF(0), max_row_size);
	}
}

vasil's avatar
vasil committed
4687 4688 4689 4690 4691 4692
/* Limit InnoDB monitor access to users with the PROCESS privilege.
See http://bugs.mysql.com/32710 for an explanation of why PROCESS was
chosen. The macro is nonzero when table_name is a magic monitor table
(according to row_is_magic_monitor_table) and
check_global_access(thd, PROCESS_ACL) returns nonzero.
NOTE(review): presumably a nonzero return from check_global_access
means that the privilege is missing, as the macro name suggests --
confirm against its definition. */
#define IS_MAGIC_TABLE_AND_USER_DENIED_ACCESS(table_name, thd) \
	(row_is_magic_monitor_table(table_name) \
	 && check_global_access(thd, PROCESS_ACL))

osku's avatar
osku committed
4693 4694 4695 4696 4697 4698 4699 4700 4701 4702 4703 4704 4705 4706 4707 4708 4709 4710
/*********************************************************************
Creates a table definition to an InnoDB database. */
static
int
create_table_def(
/*=============*/
	trx_t*		trx,		/* in: InnoDB transaction handle */
	TABLE*		form,		/* in: information on table
					columns and indexes */
	const char*	table_name,	/* in: table name */
	const char*	path_of_temp_table,/* in: if this is a table explicitly
					created by the user with the
					TEMPORARY keyword, then this
					parameter is the dir path where the
					table should be placed if we create
					an .ibd file for it (no .ibd extension
					in the path, though); otherwise this
					is NULL */
4711
	ulint		flags)		/* in: table flags */
osku's avatar
osku committed
4712 4713 4714 4715
{
	Field*		field;
	dict_table_t*	table;
	ulint		n_cols;
4716 4717
	int		error;
	ulint		col_type;
osku's avatar
osku committed
4718
	ulint		col_len;
4719
	ulint		nulls_allowed;
osku's avatar
osku committed
4720 4721 4722 4723
	ulint		unsigned_type;
	ulint		binary_type;
	ulint		long_true_varchar;
	ulint		charset_no;
4724
	ulint		i;
osku's avatar
osku committed
4725

4726 4727
	DBUG_ENTER("create_table_def");
	DBUG_PRINT("enter", ("table_name: %s", table_name));
osku's avatar
osku committed
4728

vasil's avatar
vasil committed
4729 4730 4731 4732 4733 4734
	ut_a(trx->mysql_thd != NULL);
	if (IS_MAGIC_TABLE_AND_USER_DENIED_ACCESS(table_name,
						  (THD*) trx->mysql_thd)) {
		DBUG_RETURN(HA_ERR_GENERIC);
	}

osku's avatar
osku committed
4735 4736 4737 4738 4739
	n_cols = form->s->fields;

	/* We pass 0 as the space id, and determine at a lower level the space
	id where to store the table */

4740
	table = dict_mem_table_create(table_name, 0, n_cols, flags);
osku's avatar
osku committed
4741 4742 4743 4744 4745 4746 4747 4748 4749 4750 4751 4752 4753 4754 4755 4756 4757 4758 4759 4760 4761 4762 4763

	if (path_of_temp_table) {
		table->dir_path_of_temp_table =
			mem_heap_strdup(table->heap, path_of_temp_table);
	}

	for (i = 0; i < n_cols; i++) {
		field = form->field[i];

		col_type = get_innobase_type_from_mysql_type(&unsigned_type,
									field);
		if (field->null_ptr) {
			nulls_allowed = 0;
		} else {
			nulls_allowed = DATA_NOT_NULL;
		}

		if (field->binary()) {
			binary_type = DATA_BINARY_TYPE;
		} else {
			binary_type = 0;
		}

4764
		charset_no = 0;
osku's avatar
osku committed
4765 4766 4767 4768 4769 4770 4771 4772 4773 4774 4775 4776 4777 4778 4779 4780 4781 4782

		if (dtype_is_string_type(col_type)) {

			charset_no = (ulint)field->charset()->number;

			ut_a(charset_no < 256); /* in data0type.h we assume
						that the number fits in one
						byte */
		}

		ut_a(field->type() < 256); /* we assume in dtype_form_prtype()
					   that this fits in one byte */
		col_len = field->pack_length();

		/* The MySQL pack length contains 1 or 2 bytes length field
		for a true VARCHAR. Let us subtract that, so that the InnoDB
		column length in the InnoDB data dictionary is the real
		maximum byte length of the actual data. */
4783

osku's avatar
osku committed
4784 4785 4786 4787 4788 4789 4790 4791 4792 4793
		long_true_varchar = 0;

		if (field->type() == MYSQL_TYPE_VARCHAR) {
			col_len -= ((Field_varstring*)field)->length_bytes;

			if (((Field_varstring*)field)->length_bytes == 2) {
				long_true_varchar = DATA_LONG_TRUE_VARCHAR;
			}
		}

4794
		dict_mem_table_add_col(table, table->heap,
4795 4796 4797 4798 4799 4800 4801
			(char*) field->field_name,
			col_type,
			dtype_form_prtype(
				(ulint)field->type()
				| nulls_allowed | unsigned_type
				| binary_type | long_true_varchar,
				charset_no),
4802
			col_len);
osku's avatar
osku committed
4803 4804 4805 4806
	}

	error = row_create_table_for_mysql(table, trx);

4807
	innodb_check_for_record_too_big_error(flags & DICT_TF_COMPACT, error);
4808

osku's avatar
osku committed
4809 4810 4811 4812 4813 4814 4815 4816 4817 4818 4819 4820 4821 4822 4823 4824 4825 4826 4827
	error = convert_error_code_to_mysql(error, NULL);

	DBUG_RETURN(error);
}

/*********************************************************************
Creates an index in an InnoDB database. Builds an in-memory index object
from the MySQL key definition number key_num, working out a column
prefix length for each key part, and passes it to
row_create_index_for_mysql. */
static
int
create_index(
/*=========*/
					/* out: 0 or a MySQL error code */
	trx_t*		trx,		/* in: InnoDB transaction handle */
	TABLE*		form,		/* in: information on table
					columns and indexes */
	const char*	table_name,	/* in: table name */
	uint		key_num)	/* in: index number */
{
	Field*		field;
	dict_index_t*	index;
	int		error;
	ulint		n_fields;
	KEY*		key;
	KEY_PART_INFO*	key_part;
	ulint		ind_type;
	ulint		col_type;
	ulint		prefix_len;
	ulint		is_unsigned;
	ulint		i;
	ulint		j;
	ulint*		field_lengths;

	DBUG_ENTER("create_index");

	key = form->key_info + key_num;

	n_fields = key->key_parts;

	ind_type = 0;

	if (key_num == form->s->primary_key) {
		ind_type = ind_type | DICT_CLUSTERED;
	}

	if (key->flags & HA_NOSAME ) {
		ind_type = ind_type | DICT_UNIQUE;
	}

	/* We pass 0 as the space id, and determine at a lower level the space
	id where to store the table */

	index = dict_mem_index_create((char*) table_name, key->name, 0,
						ind_type, n_fields);

	/* Key part lengths, handed to row_create_index_for_mysql below;
	freed before returning */
	field_lengths = (ulint*) my_malloc(sizeof(ulint) * n_fields,
		MYF(MY_FAE));

	for (i = 0; i < n_fields; i++) {
		key_part = key->key_part + i;

		/* (The flag HA_PART_KEY_SEG denotes in MySQL a column prefix
		field in an index: we only store a specified number of first
		bytes of the column to the index field.) The flag does not
		seem to be properly set by MySQL. Let us fall back on testing
		the length of the key part versus the column. */

		field = NULL;
		for (j = 0; j < form->s->fields; j++) {

			field = form->field[j];

			if (0 == innobase_strcasecmp(
					field->field_name,
					key_part->field->field_name)) {
				/* Found the corresponding column */

				break;
			}
		}

		/* The key part must refer to a column of the table */
		ut_a(j < form->s->fields);

		col_type = get_innobase_type_from_mysql_type(
					&is_unsigned, key_part->field);

		/* Treat the key part as a column prefix if the column is a
		BLOB, or if the key part is shorter than the column data
		(for a true VARCHAR, not counting the length bytes) */

		if (DATA_BLOB == col_type
			|| (key_part->length < field->pack_length()
				&& field->type() != MYSQL_TYPE_VARCHAR)
			|| (field->type() == MYSQL_TYPE_VARCHAR
				&& key_part->length < field->pack_length()
				- ((Field_varstring*)field)->length_bytes)) {

			prefix_len = key_part->length;

			if (col_type == DATA_INT
				|| col_type == DATA_FLOAT
				|| col_type == DATA_DOUBLE
				|| col_type == DATA_DECIMAL) {
				sql_print_error(
					"MySQL is trying to create a column "
					"prefix index field, on an "
					"inappropriate data type. Table "
					"name %s, column name %s.",
					table_name,
					key_part->field->field_name);

				prefix_len = 0;
			}
		} else {
			prefix_len = 0;
		}

		field_lengths[i] = key_part->length;

		dict_mem_index_add_field(index,
			(char*) key_part->field->field_name, prefix_len);
	}

	/* Even though we've defined max_supported_key_part_length, we
	still do our own checking using field_lengths to be absolutely
	sure we don't create too long indexes. */
	error = row_create_index_for_mysql(index, trx, field_lengths);

	/* Set the client error message while we still have the InnoDB
	error code, that is, before it is converted below */
	innodb_check_for_record_too_big_error(form->s->row_type
					      != ROW_TYPE_REDUNDANT, error);

	error = convert_error_code_to_mysql(error, NULL);

	my_free(field_lengths, MYF(0));

	DBUG_RETURN(error);
}

/*********************************************************************
Creates an index to an InnoDB table when the user has defined no
primary index. */
static
int
create_clustered_index_when_no_primary(
/*===================================*/
	trx_t*		trx,		/* in: InnoDB transaction handle */
4949 4950
	ulint		comp,		/* in: ROW_FORMAT:
					nonzero=COMPACT, 0=REDUNDANT */
osku's avatar
osku committed
4951 4952 4953
	const char*	table_name)	/* in: table name */
{
	dict_index_t*	index;
4954
	int		error;
osku's avatar
osku committed
4955 4956 4957 4958

	/* We pass 0 as the space id, and determine at a lower level the space
	id where to store the table */

4959 4960
	index = dict_mem_index_create(table_name, "GEN_CLUST_INDEX",
				      0, DICT_CLUSTERED, 0);
osku's avatar
osku committed
4961 4962
	error = row_create_index_for_mysql(index, trx, NULL);

4963
	innodb_check_for_record_too_big_error(comp, error);
4964

osku's avatar
osku committed
4965 4966 4967 4968 4969 4970
	error = convert_error_code_to_mysql(error, NULL);

	return(error);
}

/*********************************************************************
Update create_info.  Used in SHOW CREATE TABLE et al. Fills in the
auto-increment value from the handler statistics, unless the
HA_CREATE_USED_AUTO bit is already set in create_info->used_fields. */

void
ha_innobase::update_create_info(
/*============================*/
	HA_CREATE_INFO* create_info)	/* in/out: create info */
{
	if (!(create_info->used_fields & HA_CREATE_USED_AUTO)) {
		/* Refresh stats.auto_increment_value before copying it */
		ha_innobase::info(HA_STATUS_AUTO);
		create_info->auto_increment_value = stats.auto_increment_value;
	}
}

/*********************************************************************
osku's avatar
osku committed
4985 4986 4987 4988 4989 4990 4991 4992 4993 4994 4995 4996 4997 4998 4999 5000 5001 5002 5003 5004 5005
Creates a new table to an InnoDB database. */

int
ha_innobase::create(
/*================*/
					/* out: error number */
	const char*	name,		/* in: table name */
	TABLE*		form,		/* in: information on table
					columns and indexes */
	HA_CREATE_INFO*	create_info)	/* in: more information of the
					created table, contains also the
					create statement string */
{
	int		error;
	dict_table_t*	innobase_table;
	trx_t*		parent_trx;
	trx_t*		trx;
	int		primary_key_no;
	uint		i;
	char		name2[FN_REFLEN];
	char		norm_name[FN_REFLEN];
5006
	THD*		thd = ha_thd();
5007
	ib_longlong	auto_inc_value;
5008
	ulint		flags;
osku's avatar
osku committed
5009

5010
	DBUG_ENTER("ha_innobase::create");
osku's avatar
osku committed
5011 5012

	DBUG_ASSERT(thd != NULL);
calvin's avatar
calvin committed
5013 5014 5015 5016 5017 5018 5019 5020 5021 5022 5023 5024 5025 5026 5027 5028 5029 5030 5031 5032 5033 5034 5035
	DBUG_ASSERT(create_info != NULL);

#ifdef __WIN__
	/* Names passed in from server are in two formats:
	1. <database_name>/<table_name>: for normal table creation
	2. full path: for temp table creation, or sym link

	When srv_file_per_table is on, check for full path pattern, i.e.
	X:\dir\...,		X is a driver letter, or
	\\dir1\dir2\...,	UNC path
	returns error if it is in full path format, but not creating a temp.
	table. Currently InnoDB does not support symbolic link on Windows. */

	if (srv_file_per_table
	    && (!create_info->options & HA_LEX_CREATE_TMP_TABLE)) {

		if ((name[1] == ':')
		    || (name[0] == '\\' && name[1] == '\\')) {
			sql_print_error("Cannot create table %s\n", name);
			DBUG_RETURN(HA_ERR_GENERIC);
		}
	}
#endif
osku's avatar
osku committed
5036 5037 5038 5039 5040

	if (form->s->fields > 1000) {
		/* The limit probably should be REC_MAX_N_FIELDS - 3 = 1020,
		but we play safe here */

5041 5042
		DBUG_RETURN(HA_ERR_TO_BIG_ROW);
	}
osku's avatar
osku committed
5043 5044 5045

	/* Get the transaction associated with the current thd, or create one
	if not yet created */
5046

5047
	parent_trx = check_trx_exists(thd);
osku's avatar
osku committed
5048 5049 5050 5051

	/* In case MySQL calls this in the middle of a SELECT query, release
	possible adaptive hash latch to avoid deadlocks of threads */

5052 5053
	trx_search_latch_release_if_reserved(parent_trx);

osku's avatar
osku committed
5054
	trx = trx_allocate_for_mysql();
5055

osku's avatar
osku committed
5056
	trx->mysql_thd = thd;
5057
	trx->mysql_query_str = thd_query(thd);
osku's avatar
osku committed
5058

5059
	if (thd_test_options(thd, OPTION_NO_FOREIGN_KEY_CHECKS)) {
osku's avatar
osku committed
5060 5061 5062
		trx->check_foreigns = FALSE;
	}

5063
	if (thd_test_options(thd, OPTION_RELAXED_UNIQUE_CHECKS)) {
osku's avatar
osku committed
5064 5065 5066 5067 5068 5069 5070 5071 5072
		trx->check_unique_secondary = FALSE;
	}

	if (lower_case_table_names) {
		srv_lower_case_table_names = TRUE;
	} else {
		srv_lower_case_table_names = FALSE;
	}

5073
	strcpy(name2, name);
osku's avatar
osku committed
5074 5075 5076 5077 5078 5079 5080 5081 5082 5083 5084

	normalize_table_name(norm_name, name2);

	/* Latch the InnoDB data dictionary exclusively so that no deadlocks
	or lock waits can happen in it during a table create operation.
	Drop table etc. do this latching in row0mysql.c. */

	row_mysql_lock_data_dictionary(trx);

	/* Create the table definition in InnoDB */

5085 5086 5087 5088 5089 5090
	flags = 0;

	if (form->s->row_type != ROW_TYPE_REDUNDANT) {
		flags |= DICT_TF_COMPACT;
	}

osku's avatar
osku committed
5091 5092
	error = create_table_def(trx, form, norm_name,
		create_info->options & HA_LEX_CREATE_TMP_TABLE ? name2 : NULL,
5093
		flags);
osku's avatar
osku committed
5094

5095
	if (error) {
osku's avatar
osku committed
5096
		goto cleanup;
5097
	}
osku's avatar
osku committed
5098 5099 5100

	/* Look for a primary key */

osku's avatar
osku committed
5101
	primary_key_no= (form->s->primary_key != MAX_KEY ?
5102
			 (int) form->s->primary_key :
osku's avatar
osku committed
5103 5104 5105 5106 5107 5108 5109 5110 5111 5112 5113 5114 5115 5116
			 -1);

	/* Our function row_get_mysql_key_number_for_index assumes
	the primary key is always number 0, if it exists */

	DBUG_ASSERT(primary_key_no == -1 || primary_key_no == 0);

	/* Create the keys */

	if (form->s->keys == 0 || primary_key_no == -1) {
		/* Create an index which is used as the clustered index;
		order the rows by their row id which is internally generated
		by InnoDB */

5117 5118 5119
		error = create_clustered_index_when_no_primary(
			trx, form->s->row_type != ROW_TYPE_REDUNDANT,
			norm_name);
5120
		if (error) {
osku's avatar
osku committed
5121
			goto cleanup;
5122
		}
osku's avatar
osku committed
5123 5124 5125 5126 5127
	}

	if (primary_key_no != -1) {
		/* In InnoDB the clustered index must always be created
		first */
5128
		if ((error = create_index(trx, form, norm_name,
osku's avatar
osku committed
5129 5130
					  (uint) primary_key_no))) {
			goto cleanup;
5131 5132
		}
	}
osku's avatar
osku committed
5133 5134 5135 5136 5137

	for (i = 0; i < form->s->keys; i++) {

		if (i != (uint) primary_key_no) {

5138
			if ((error = create_index(trx, form, norm_name, i))) {
osku's avatar
osku committed
5139
				goto cleanup;
5140 5141 5142
			}
		}
	}
osku's avatar
osku committed
5143

5144
	if (*trx->mysql_query_str) {
osku's avatar
osku committed
5145
		error = row_table_add_foreign_constraints(trx,
5146
			*trx->mysql_query_str, norm_name,
osku's avatar
osku committed
5147 5148 5149 5150 5151 5152 5153 5154 5155
			create_info->options & HA_LEX_CREATE_TMP_TABLE);

		error = convert_error_code_to_mysql(error, NULL);

		if (error) {
			goto cleanup;
		}
	}

5156
	innobase_commit_low(trx);
osku's avatar
osku committed
5157 5158 5159 5160 5161 5162 5163 5164 5165

	row_mysql_unlock_data_dictionary(trx);

	/* Flush the log to reduce probability that the .frm files and
	the InnoDB data dictionary get out-of-sync if the user runs
	with innodb_flush_log_at_trx_commit = 0 */

	log_buffer_flush_to_disk();

5166
	innobase_table = dict_table_get(norm_name, FALSE);
osku's avatar
osku committed
5167 5168 5169

	DBUG_ASSERT(innobase_table != 0);

5170 5171 5172 5173 5174 5175 5176 5177 5178
	/* Note: We can't call update_thd() as prebuilt will not be
	setup at this stage and so we use thd. */

	/* We need to copy the AUTOINC value from the old table if
	this is an ALTER TABLE. */

	if (((create_info->used_fields & HA_CREATE_USED_AUTO)
	    || thd_sql_command(thd) == SQLCOM_ALTER_TABLE)
	    && create_info->auto_increment_value != 0) {
osku's avatar
osku committed
5179

5180
		/* Query was ALTER TABLE...AUTO_INCREMENT = x; or
osku's avatar
osku committed
5181 5182 5183 5184 5185 5186 5187
		CREATE TABLE ...AUTO_INCREMENT = x; Find out a table
		definition from the dictionary and get the current value
		of the auto increment field. Set a new value to the
		auto increment field if the value is greater than the
		maximum value in the column. */

		auto_inc_value = create_info->auto_increment_value;
5188 5189

		dict_table_autoinc_lock(innobase_table);
osku's avatar
osku committed
5190
		dict_table_autoinc_initialize(innobase_table, auto_inc_value);
5191
		dict_table_autoinc_unlock(innobase_table);
osku's avatar
osku committed
5192 5193 5194 5195 5196 5197 5198
	}

	/* Tell the InnoDB server that there might be work for
	utility threads: */

	srv_active_wake_master_thread();

5199
	trx_free_for_mysql(trx);
osku's avatar
osku committed
5200 5201 5202 5203 5204

	DBUG_RETURN(0);

cleanup:
	innobase_commit_low(trx);
5205

osku's avatar
osku committed
5206
	row_mysql_unlock_data_dictionary(trx);
5207

osku's avatar
osku committed
5208 5209 5210 5211 5212 5213 5214 5215 5216 5217 5218 5219 5220 5221 5222 5223 5224 5225
	trx_free_for_mysql(trx);

	DBUG_RETURN(error);
}

/*********************************************************************
Discards the tablespace of the table of this handle, or imports a
tablespace for it, depending on the value of 'discard'. The operation is
run in the transaction of the handle (prebuilt->trx). */

int
ha_innobase::discard_or_import_tablespace(
/*======================================*/
				/* out: the InnoDB result converted with
				convert_error_code_to_mysql() */
	my_bool discard)	/* in: TRUE if discard, else import */
{
	dict_table_t*	ib_table;
	trx_t*		handle_trx;
	int		result;

	DBUG_ENTER("ha_innobase::discard_or_import_tablespace");

	/* The handle must own a valid transaction and it must be the
	transaction of the current thd */

	ut_a(prebuilt->trx);
	ut_a(prebuilt->trx->magic_n == TRX_MAGIC_N);
	ut_a(prebuilt->trx == thd_to_trx(ha_thd()));

	ib_table = prebuilt->table;
	handle_trx = prebuilt->trx;

	result = discard
		? row_discard_tablespace_for_mysql(ib_table->name, handle_trx)
		: row_import_tablespace_for_mysql(ib_table->name, handle_trx);

	result = convert_error_code_to_mysql(result, NULL);

	DBUG_RETURN(result);
}

/*********************************************************************
Deletes all rows of an InnoDB table. */

int
ha_innobase::delete_all_rows(void)
/*==============================*/
				/* out: error number */
{
	int		error;

	DBUG_ENTER("ha_innobase::delete_all_rows");

5258 5259 5260 5261 5262 5263
	/* Get the transaction associated with the current thd, or create one
	if not yet created, and update prebuilt->trx */

	update_thd(ha_thd());

	if (thd_sql_command(user_thd) != SQLCOM_TRUNCATE) {
osku's avatar
osku committed
5264 5265 5266 5267 5268 5269 5270 5271
	fallback:
		/* We only handle TRUNCATE TABLE t as a special case.
		DELETE FROM t will have to use ha_innobase::delete_row(). */
		DBUG_RETURN(my_errno=HA_ERR_WRONG_COMMAND);
	}

	/* Truncate the table in InnoDB */

5272
	error = row_truncate_table_for_mysql(prebuilt->table, prebuilt->trx);
osku's avatar
osku committed
5273 5274 5275 5276 5277 5278 5279 5280 5281 5282 5283 5284 5285 5286 5287 5288 5289 5290 5291 5292 5293 5294 5295 5296 5297 5298 5299
	if (error == DB_ERROR) {
		/* Cannot truncate; resort to ha_innobase::delete_row() */
		goto fallback;
	}

	error = convert_error_code_to_mysql(error, NULL);

	DBUG_RETURN(error);
}

/*********************************************************************
Drops a table from an InnoDB database. Before calling this function,
MySQL calls innobase_commit to commit the transaction of the current user.
Then the current user cannot have locks set on the table. Drop table
operation inside InnoDB will remove all locks any user has on the table
inside InnoDB. */

int
ha_innobase::delete_table(
/*======================*/
				/* out: error number */
	const char*	name)	/* in: table name */
{
	ulint	name_len;
	int	error;
	trx_t*	parent_trx;
	trx_t*	trx;
5300
	THD	*thd = ha_thd();
osku's avatar
osku committed
5301 5302
	char	norm_name[1000];

5303
	DBUG_ENTER("ha_innobase::delete_table");
osku's avatar
osku committed
5304

vasil's avatar
vasil committed
5305 5306 5307 5308 5309 5310 5311 5312
	/* Strangely, MySQL passes the table name without the '.frm'
	extension, in contrast to ::create */
	normalize_table_name(norm_name, name);

	if (IS_MAGIC_TABLE_AND_USER_DENIED_ACCESS(norm_name, thd)) {
		DBUG_RETURN(HA_ERR_GENERIC);
	}

osku's avatar
osku committed
5313 5314
	/* Get the transaction associated with the current thd, or create one
	if not yet created */
5315

5316
	parent_trx = check_trx_exists(thd);
osku's avatar
osku committed
5317 5318 5319 5320

	/* In case MySQL calls this in the middle of a SELECT query, release
	possible adaptive hash latch to avoid deadlocks of threads */

5321
	trx_search_latch_release_if_reserved(parent_trx);
osku's avatar
osku committed
5322 5323 5324 5325 5326 5327 5328 5329 5330

	if (lower_case_table_names) {
		srv_lower_case_table_names = TRUE;
	} else {
		srv_lower_case_table_names = FALSE;
	}

	trx = trx_allocate_for_mysql();

5331 5332
	trx->mysql_thd = thd;
	trx->mysql_query_str = thd_query(thd);
osku's avatar
osku committed
5333

5334
	if (thd_test_options(thd, OPTION_NO_FOREIGN_KEY_CHECKS)) {
osku's avatar
osku committed
5335 5336 5337
		trx->check_foreigns = FALSE;
	}

5338
	if (thd_test_options(thd, OPTION_RELAXED_UNIQUE_CHECKS)) {
osku's avatar
osku committed
5339 5340 5341 5342 5343 5344 5345
		trx->check_unique_secondary = FALSE;
	}

	name_len = strlen(name);

	assert(name_len < 1000);

5346
	/* Drop the table in InnoDB */
osku's avatar
osku committed
5347 5348

	error = row_drop_table_for_mysql(norm_name, trx,
5349 5350
					 thd_sql_command(thd)
					 == SQLCOM_DROP_DB);
osku's avatar
osku committed
5351 5352 5353 5354 5355 5356 5357 5358 5359 5360 5361 5362

	/* Flush the log to reduce probability that the .frm files and
	the InnoDB data dictionary get out-of-sync if the user runs
	with innodb_flush_log_at_trx_commit = 0 */

	log_buffer_flush_to_disk();

	/* Tell the InnoDB server that there might be work for
	utility threads: */

	srv_active_wake_master_thread();

5363
	innobase_commit_low(trx);
osku's avatar
osku committed
5364

5365
	trx_free_for_mysql(trx);
osku's avatar
osku committed
5366 5367 5368 5369 5370 5371 5372 5373

	error = convert_error_code_to_mysql(error, NULL);

	DBUG_RETURN(error);
}

/*********************************************************************
Removes all tables in the named database inside InnoDB. */
5374
static
osku's avatar
osku committed
5375
void
osku's avatar
osku committed
5376 5377 5378
innobase_drop_database(
/*===================*/
			/* out: error number */
5379
        handlerton *hton, /* in: handlerton of Innodb */
osku's avatar
osku committed
5380 5381 5382 5383 5384 5385 5386 5387 5388 5389 5390
	char*	path)	/* in: database path; inside InnoDB the name
			of the last directory in the path is used as
			the database name: for example, in 'mysql/data/test'
			the database name is 'test' */
{
	ulint	len		= 0;
	trx_t*	parent_trx;
	trx_t*	trx;
	char*	ptr;
	int	error;
	char*	namebuf;
5391
	THD*	thd		= current_thd;
osku's avatar
osku committed
5392 5393 5394

	/* Get the transaction associated with the current thd, or create one
	if not yet created */
5395

5396
	parent_trx = check_trx_exists(thd);
osku's avatar
osku committed
5397 5398 5399 5400

	/* In case MySQL calls this in the middle of a SELECT query, release
	possible adaptive hash latch to avoid deadlocks of threads */

5401
	trx_search_latch_release_if_reserved(parent_trx);
osku's avatar
osku committed
5402 5403 5404 5405 5406 5407 5408 5409 5410

	ptr = strend(path) - 2;

	while (ptr >= path && *ptr != '\\' && *ptr != '/') {
		ptr--;
		len++;
	}

	ptr++;
marko's avatar
marko committed
5411
	namebuf = (char*) my_malloc((uint) len + 2, MYF(0));
osku's avatar
osku committed
5412 5413 5414 5415

	memcpy(namebuf, ptr, len);
	namebuf[len] = '/';
	namebuf[len + 1] = '\0';
5416
#ifdef	__WIN__
osku's avatar
osku committed
5417 5418 5419
	innobase_casedn_str(namebuf);
#endif
	trx = trx_allocate_for_mysql();
5420 5421
	trx->mysql_thd = thd;
	trx->mysql_query_str = thd_query(thd);
osku's avatar
osku committed
5422

5423
	if (thd_test_options(thd, OPTION_NO_FOREIGN_KEY_CHECKS)) {
osku's avatar
osku committed
5424 5425 5426
		trx->check_foreigns = FALSE;
	}

5427
	error = row_drop_database_for_mysql(namebuf, trx);
osku's avatar
osku committed
5428 5429 5430 5431 5432 5433 5434 5435 5436 5437 5438 5439 5440
	my_free(namebuf, MYF(0));

	/* Flush the log to reduce probability that the .frm files and
	the InnoDB data dictionary get out-of-sync if the user runs
	with innodb_flush_log_at_trx_commit = 0 */

	log_buffer_flush_to_disk();

	/* Tell the InnoDB server that there might be work for
	utility threads: */

	srv_active_wake_master_thread();

5441 5442 5443
	innobase_commit_low(trx);
	trx_free_for_mysql(trx);
#ifdef NO_LONGER_INTERESTED_IN_DROP_DB_ERROR
osku's avatar
osku committed
5444 5445 5446
	error = convert_error_code_to_mysql(error, NULL);

	return(error);
osku's avatar
osku committed
5447 5448 5449
#else
	return;
#endif
osku's avatar
osku committed
5450 5451 5452 5453 5454 5455 5456 5457 5458 5459 5460 5461 5462 5463 5464 5465 5466 5467 5468
}

/*************************************************************************
Renames an InnoDB table. */

int
ha_innobase::rename_table(
/*======================*/
				/* out: 0 or error code */
	const char*	from,	/* in: old name of the table */
	const char*	to)	/* in: new name of the table */
{
	ulint	name_len1;
	ulint	name_len2;
	int	error;
	trx_t*	parent_trx;
	trx_t*	trx;
	char	norm_from[1000];
	char	norm_to[1000];
5469
	THD*	thd		= ha_thd();
osku's avatar
osku committed
5470

5471
	DBUG_ENTER("ha_innobase::rename_table");
osku's avatar
osku committed
5472 5473 5474

	/* Get the transaction associated with the current thd, or create one
	if not yet created */
5475

5476
	parent_trx = check_trx_exists(thd);
osku's avatar
osku committed
5477 5478 5479 5480

	/* In case MySQL calls this in the middle of a SELECT query, release
	possible adaptive hash latch to avoid deadlocks of threads */

5481
	trx_search_latch_release_if_reserved(parent_trx);
osku's avatar
osku committed
5482 5483 5484 5485 5486 5487 5488 5489

	if (lower_case_table_names) {
		srv_lower_case_table_names = TRUE;
	} else {
		srv_lower_case_table_names = FALSE;
	}

	trx = trx_allocate_for_mysql();
5490 5491
	trx->mysql_thd = thd;
	trx->mysql_query_str = thd_query(thd);
osku's avatar
osku committed
5492

5493
	if (thd_test_options(thd, OPTION_NO_FOREIGN_KEY_CHECKS)) {
osku's avatar
osku committed
5494 5495 5496 5497 5498 5499 5500 5501 5502 5503 5504 5505
		trx->check_foreigns = FALSE;
	}

	name_len1 = strlen(from);
	name_len2 = strlen(to);

	assert(name_len1 < 1000);
	assert(name_len2 < 1000);

	normalize_table_name(norm_from, from);
	normalize_table_name(norm_to, to);

5506
	/* Rename the table in InnoDB */
osku's avatar
osku committed
5507

5508
	error = row_rename_table_for_mysql(norm_from, norm_to, trx);
osku's avatar
osku committed
5509 5510 5511 5512 5513 5514 5515 5516 5517 5518 5519 5520

	/* Flush the log to reduce probability that the .frm files and
	the InnoDB data dictionary get out-of-sync if the user runs
	with innodb_flush_log_at_trx_commit = 0 */

	log_buffer_flush_to_disk();

	/* Tell the InnoDB server that there might be work for
	utility threads: */

	srv_active_wake_master_thread();

5521 5522
	innobase_commit_low(trx);
	trx_free_for_mysql(trx);
osku's avatar
osku committed
5523 5524 5525 5526 5527 5528 5529 5530 5531 5532 5533 5534 5535 5536

	error = convert_error_code_to_mysql(error, NULL);

	DBUG_RETURN(error);
}

/*************************************************************************
Estimates the number of index records in a range. The two range ends are
converted to InnoDB tuples and handed to btr_estimate_n_rows_in_range().
An estimate of 0 is never returned: it is replaced by 1. */

ha_rows
ha_innobase::records_in_range(
/*==========================*/
						/* out: estimated number of
						rows */
	uint			keynr,		/* in: index number */
	key_range		*min_key,	/* in: start key value of the
						   range, may also be 0 */
	key_range		*max_key)	/* in: range end key val, may
						   also be 0 */
{
	/* Scratch buffer for the converted end key; the start key is
	converted into the key_val_buff member of the handle */
	const ulint	end_buff_len	= table->s->reclength
					+ table->s->max_key_length + 100;
	uchar*		end_buff	= (uchar*) my_malloc(end_buff_len,
							     MYF(MY_FAE));
	KEY*		mysql_key;
	dict_index_t*	ib_index;
	dtuple_t*	start_tuple;
	dtuple_t*	end_tuple;
	void*		start_heap;
	void*		end_heap;
	ulint		start_mode;
	ulint		end_mode;
	ib_longlong	n_rows		= 0;

	DBUG_ENTER("records_in_range");

	ut_a(prebuilt->trx == thd_to_trx(ha_thd()));

	prebuilt->trx->op_info = (char*)"estimating records in index range";

	/* In case MySQL calls this in the middle of a SELECT query, release
	possible adaptive hash latch to avoid deadlocks of threads */

	trx_search_latch_release_if_reserved(prebuilt->trx);

	active_index = keynr;

	mysql_key = table->key_info + active_index;

	ib_index = dict_table_get_index_noninline(prebuilt->table,
						  mysql_key->name);

	/* Build an empty tuple with the column types of the index for each
	end of the range */

	start_tuple = dtuple_create_for_mysql(&start_heap,
					      mysql_key->key_parts);
	dict_index_copy_types(start_tuple, ib_index, mysql_key->key_parts);

	end_tuple = dtuple_create_for_mysql(&end_heap, mysql_key->key_parts);
	dict_index_copy_types(end_tuple, ib_index, mysql_key->key_parts);

	/* Convert the MySQL keys; a missing range end is passed as a null
	key of length 0 */

	row_sel_convert_mysql_key_to_innobase(
				start_tuple, (byte*) key_val_buff,
				(ulint)upd_and_key_val_buff_len,
				ib_index,
				(byte*) (min_key ? min_key->key :
					 (const uchar*) 0),
				(ulint) (min_key ? min_key->length : 0),
				prebuilt->trx);

	row_sel_convert_mysql_key_to_innobase(
				end_tuple, (byte*) end_buff,
				end_buff_len, ib_index,
				(byte*) (max_key ? max_key->key :
					 (const uchar*) 0),
				(ulint) (max_key ? max_key->length : 0),
				prebuilt->trx);

	start_mode = convert_search_mode_to_innobase(
		min_key ? min_key->flag : HA_READ_KEY_EXACT);
	end_mode = convert_search_mode_to_innobase(
		max_key ? max_key->flag : HA_READ_KEY_EXACT);

	/* If either search mode is unsupported, the estimate stays 0 */

	if (start_mode != PAGE_CUR_UNSUPP && end_mode != PAGE_CUR_UNSUPP) {

		n_rows = btr_estimate_n_rows_in_range(ib_index, start_tuple,
						      start_mode, end_tuple,
						      end_mode);
	}

	dtuple_free_for_mysql(start_heap);
	dtuple_free_for_mysql(end_heap);

	my_free(end_buff, MYF(0));

	prebuilt->trx->op_info = (char*)"";

	/* The MySQL optimizer seems to believe an estimate of 0 rows is
	always accurate and may return the result 'Empty set' based on that.
	The accuracy is not guaranteed, and even if it were, for a locking
	read we should anyway perform the search to set the next-key lock.
	Add 1 to the value to make sure MySQL does not make the assumption! */

	DBUG_RETURN((ha_rows) (n_rows == 0 ? 1 : n_rows));
}

/*************************************************************************
Gives an UPPER BOUND to the number of rows in a table. This is used in
filesort.cc. The bound is computed from the number of leaf pages of the
first index of the table and the minimum record length of that index. */

ha_rows
ha_innobase::estimate_rows_upper_bound(void)
/*======================================*/
			/* out: upper bound of rows */
{
	dict_index_t*	first_index;
	ulonglong	leaf_bytes;
	ulonglong	upper_bound;

	DBUG_ENTER("estimate_rows_upper_bound");

	/* We do not know if MySQL can call this function before calling
	external_lock(). To be safe, update the thd of the current table
	handle. */

	update_thd(ha_thd());

	prebuilt->trx->op_info = (char*)
				 "calculating upper bound for table rows";

	/* In case MySQL calls this in the middle of a SELECT query, release
	possible adaptive hash latch to avoid deadlocks of threads */

	trx_search_latch_release_if_reserved(prebuilt->trx);

	first_index = dict_table_get_first_index_noninline(prebuilt->table);

	/* Size in bytes of the leaf pages of the index */

	leaf_bytes = (ulonglong) first_index->stat_n_leaf_pages;
	leaf_bytes = leaf_bytes * UNIV_PAGE_SIZE;

	/* Calculate a minimum length for a clustered index record and from
	that an upper bound for the number of rows. Since we only calculate
	new statistics in row0mysql.c when a table has grown by a threshold
	factor, we must add a safety factor 2 in front of the formula below. */

	upper_bound = (2 * leaf_bytes)
		/ dict_index_calc_min_rec_len(first_index);

	prebuilt->trx->op_info = (char*)"";

	DBUG_RETURN((ha_rows) upper_bound);
}

/*************************************************************************
How many seeks it will take to read through the table. This is to be
comparable to the number returned by records_in_range so that we can
decide if we should scan the table or use keys. */

double
ha_innobase::scan_time()
/*====================*/
			/* out: estimated time measured in disk seeks */
{
	/* Since MySQL seems to favor table scans too much over index
	searches, we pretend that a sequential read takes the same time
	as a random disk read, that is, we do not divide the following
	by 10, which would be physically realistic. */
5695

osku's avatar
osku committed
5696 5697 5698 5699 5700 5701 5702 5703 5704 5705 5706
	return((double) (prebuilt->table->stat_clustered_index_size));
}

/**********************************************************************
Calculate the time it takes to read a set of ranges through an index
This enables us to optimise reads for clustered indexes. */

double
ha_innobase::read_time(
/*===================*/
			/* out: estimated time measured in disk seeks */
5707
	uint	index,	/* in: key number */
osku's avatar
osku committed
5708 5709 5710 5711
	uint	ranges,	/* in: how many ranges */
	ha_rows rows)	/* in: estimated number of rows in the ranges */
{
	ha_rows total_rows;
5712 5713
	double	time_for_scan;

osku's avatar
osku committed
5714
	if (index != table->s->primary_key) {
5715 5716
		/* Not clustered */
		return(handler::read_time(index, ranges, rows));
osku's avatar
osku committed
5717 5718 5719 5720 5721 5722 5723 5724 5725 5726 5727 5728 5729 5730
	}

	if (rows <= 2) {

		return((double) rows);
	}

	/* Assume that the read time is proportional to the scan time for all
	rows + at most one seek per range. */

	time_for_scan = scan_time();

	if ((total_rows = estimate_rows_upper_bound()) < rows) {

5731
		return(time_for_scan);
osku's avatar
osku committed
5732 5733 5734 5735 5736 5737 5738 5739 5740
	}

	return(ranges + (double) rows / (double) total_rows * time_for_scan);
}

/*************************************************************************
Returns statistics information of the table to the MySQL interpreter,
in various fields of the handle object. */

5741
int
osku's avatar
osku committed
5742 5743 5744 5745 5746 5747 5748 5749 5750 5751 5752
ha_innobase::info(
/*==============*/
	uint flag)	/* in: what information MySQL requests */
{
	dict_table_t*	ib_table;
	dict_index_t*	index;
	ha_rows		rec_per_key;
	ib_longlong	n_rows;
	ulong		j;
	ulong		i;
	char		path[FN_REFLEN];
5753
	os_file_stat_t	stat_info;
osku's avatar
osku committed
5754

5755
	DBUG_ENTER("info");
osku's avatar
osku committed
5756

5757
	/* If we are forcing recovery at a high level, we will suppress
osku's avatar
osku committed
5758 5759 5760
	statistics calculation on tables, because that may crash the
	server if an index is badly corrupted. */

5761
	if (srv_force_recovery >= SRV_FORCE_NO_IBUF_MERGE) {
osku's avatar
osku committed
5762

5763 5764 5765 5766 5767 5768
		/* We return success (0) instead of HA_ERR_CRASHED,
		because we want MySQL to process this query and not
		stop, like it would do if it received the error code
		HA_ERR_CRASHED. */

		DBUG_RETURN(0);
5769
	}
osku's avatar
osku committed
5770 5771 5772 5773 5774

	/* We do not know if MySQL can call this function before calling
	external_lock(). To be safe, update the thd of the current table
	handle. */

5775
	update_thd(ha_thd());
osku's avatar
osku committed
5776 5777 5778 5779 5780 5781 5782 5783

	/* In case MySQL calls this in the middle of a SELECT query, release
	possible adaptive hash latch to avoid deadlocks of threads */

	prebuilt->trx->op_info = (char*)"returning various info to MySQL";

	trx_search_latch_release_if_reserved(prebuilt->trx);

5784
	ib_table = prebuilt->table;
osku's avatar
osku committed
5785

5786
	if (flag & HA_STATUS_TIME) {
marko's avatar
marko committed
5787
		if (srv_stats_on_metadata) {
5788 5789
			/* In sql_show we call with this flag: update
			then statistics so that they are up-to-date */
osku's avatar
osku committed
5790

5791
			prebuilt->trx->op_info = "updating table statistics";
osku's avatar
osku committed
5792

marko's avatar
marko committed
5793
			dict_update_statistics(ib_table);
osku's avatar
osku committed
5794

5795
			prebuilt->trx->op_info = "returning various info to MySQL";
marko's avatar
marko committed
5796
		}
osku's avatar
osku committed
5797

5798
		my_snprintf(path, sizeof(path), "%s/%s%s",
5799 5800
				mysql_data_home, ib_table->name, reg_ext);

5801
		unpack_filename(path,path);
osku's avatar
osku committed
5802

5803
		/* Note that we do not know the access time of the table,
osku's avatar
osku committed
5804 5805 5806
		nor the CHECK TABLE time, nor the UPDATE or INSERT time. */

		if (os_file_get_status(path,&stat_info)) {
marko's avatar
marko committed
5807
			stats.create_time = stat_info.ctime;
osku's avatar
osku committed
5808
		}
5809
	}
osku's avatar
osku committed
5810 5811 5812 5813 5814 5815 5816 5817 5818 5819 5820 5821 5822 5823 5824 5825 5826 5827 5828 5829 5830 5831 5832 5833 5834

	if (flag & HA_STATUS_VARIABLE) {
		n_rows = ib_table->stat_n_rows;

		/* Because we do not protect stat_n_rows by any mutex in a
		delete, it is theoretically possible that the value can be
		smaller than zero! TODO: fix this race.

		The MySQL optimizer seems to assume in a left join that n_rows
		is an accurate estimate if it is zero. Of course, it is not,
		since we do not have any locks on the rows yet at this phase.
		Since SHOW TABLE STATUS seems to call this function with the
		HA_STATUS_TIME flag set, while the left join optimizer does not
		set that flag, we add one to a zero value if the flag is not
		set. That way SHOW TABLE STATUS will show the best estimate,
		while the optimizer never sees the table empty. */

		if (n_rows < 0) {
			n_rows = 0;
		}

		if (n_rows == 0 && !(flag & HA_STATUS_TIME)) {
			n_rows++;
		}

5835 5836 5837 5838 5839
		/* Fix bug#29507: TRUNCATE shows too many rows affected.
		Do not show the estimates for TRUNCATE command. */
		if (thd_sql_command(user_thd) == SQLCOM_TRUNCATE) {

			n_rows = 0;
5840 5841 5842 5843 5844 5845 5846 5847

			/* We need to reset the prebuilt value too, otherwise
			checks for values greater than the last value written
			to the table will fail and the autoinc counter will
			not be updated. This will force write_row() into
			attempting an update of the table's AUTOINC counter. */

			prebuilt->last_value = 0;
5848 5849
		}

marko's avatar
marko committed
5850 5851 5852
		stats.records = (ha_rows)n_rows;
		stats.deleted = 0;
		stats.data_file_length = ((ulonglong)
osku's avatar
osku committed
5853
				ib_table->stat_clustered_index_size)
5854
					* UNIV_PAGE_SIZE;
marko's avatar
marko committed
5855
		stats.index_file_length = ((ulonglong)
osku's avatar
osku committed
5856
				ib_table->stat_sum_of_other_index_sizes)
5857
					* UNIV_PAGE_SIZE;
vasil's avatar
vasil committed
5858 5859 5860 5861 5862 5863 5864 5865 5866 5867 5868 5869 5870 5871 5872

		/* Since fsp_get_available_space_in_free_extents() is
		acquiring latches inside InnoDB, we do not call it if we
		are asked by MySQL to avoid locking. Another reason to
		avoid the call is that it uses quite a lot of CPU.
		See Bug#38185.
		We do not update delete_length if no locking is requested
		so the "old" value can remain. delete_length is initialized
		to 0 in the ha_statistics' constructor. */
		if (!(flag & HA_STATUS_NO_LOCK)) {
			stats.delete_length =
				fsp_get_available_space_in_free_extents(
					ib_table->space) * 1024;
		}

marko's avatar
marko committed
5873
		stats.check_time = 0;
osku's avatar
osku committed
5874

marko's avatar
marko committed
5875 5876
		if (stats.records == 0) {
			stats.mean_rec_length = 0;
5877
		} else {
marko's avatar
marko committed
5878
			stats.mean_rec_length = (ulong) (stats.data_file_length / stats.records);
5879 5880
		}
	}
osku's avatar
osku committed
5881 5882 5883 5884 5885 5886 5887 5888 5889 5890

	if (flag & HA_STATUS_CONST) {
		index = dict_table_get_first_index_noninline(ib_table);

		if (prebuilt->clust_index_was_generated) {
			index = dict_table_get_next_index_noninline(index);
		}

		for (i = 0; i < table->s->keys; i++) {
			if (index == NULL) {
5891
				sql_print_error("Table %s contains fewer "
osku's avatar
osku committed
5892 5893 5894 5895
						"indexes inside InnoDB than "
						"are defined in the MySQL "
						".frm file. Have you mixed up "
						".frm files from different "
5896 5897 5898
						"installations? See "
"http://dev.mysql.com/doc/refman/5.1/en/innodb-troubleshooting.html\n",

osku's avatar
osku committed
5899 5900 5901 5902 5903 5904 5905
						ib_table->name);
				break;
			}

			for (j = 0; j < table->key_info[i].key_parts; j++) {

				if (j + 1 > index->n_uniq) {
5906 5907 5908 5909 5910
					sql_print_error(
"Index %s of %s has %lu columns unique inside InnoDB, but MySQL is asking "
"statistics for %lu columns. Have you mixed up .frm files from different "
"installations? "
"See http://dev.mysql.com/doc/refman/5.1/en/innodb-troubleshooting.html\n",
osku's avatar
osku committed
5911 5912 5913 5914
							index->name,
							ib_table->name,
							(unsigned long)
							index->n_uniq, j + 1);
5915
					break;
osku's avatar
osku committed
5916 5917 5918 5919
				}

				if (index->stat_n_diff_key_vals[j + 1] == 0) {

marko's avatar
marko committed
5920
					rec_per_key = stats.records;
osku's avatar
osku committed
5921
				} else {
marko's avatar
marko committed
5922
					rec_per_key = (ha_rows)(stats.records /
5923
					 index->stat_n_diff_key_vals[j + 1]);
osku's avatar
osku committed
5924 5925 5926 5927 5928 5929 5930 5931 5932 5933 5934 5935 5936
				}

				/* Since MySQL seems to favor table scans
				too much over index searches, we pretend
				index selectivity is 2 times better than
				our estimate: */

				rec_per_key = rec_per_key / 2;

				if (rec_per_key == 0) {
					rec_per_key = 1;
				}

5937
				table->key_info[i].rec_per_key[j]=
osku's avatar
osku committed
5938
				  rec_per_key >= ~(ulong) 0 ? ~(ulong) 0 :
marko's avatar
marko committed
5939
				  (ulong) rec_per_key;
osku's avatar
osku committed
5940 5941 5942 5943 5944 5945
			}

			index = dict_table_get_next_index_noninline(index);
		}
	}

5946
	if (flag & HA_STATUS_ERRKEY) {
5947 5948
		ut_a(prebuilt->trx);
		ut_a(prebuilt->trx->magic_n == TRX_MAGIC_N);
osku's avatar
osku committed
5949 5950

		errkey = (unsigned int) row_get_mysql_key_number_for_index(
5951 5952
			(dict_index_t*) trx_get_error_info(prebuilt->trx));
	}
osku's avatar
osku committed
5953 5954

	if (flag & HA_STATUS_AUTO && table->found_next_number_field) {
5955
		ulonglong	auto_inc;
osku's avatar
osku committed
5956 5957 5958 5959 5960 5961 5962 5963
		int		ret;

		/* The following function call can the first time fail in
		a lock wait timeout error because it reserves the auto-inc
		lock on the table. If it fails, then someone is already initing
		the auto-inc counter, and the second call is guaranteed to
		succeed. */

5964
		ret = innobase_read_and_init_auto_inc(&auto_inc);
osku's avatar
osku committed
5965 5966 5967 5968 5969 5970 5971 5972 5973 5974 5975

		if (ret != 0) {
			ret = innobase_read_and_init_auto_inc(&auto_inc);

			if (ret != 0) {
				sql_print_error("Cannot get table %s auto-inc"
						"counter value in ::info\n",
						ib_table->name);
				auto_inc = 0;
			}
		}
5976

marko's avatar
marko committed
5977
		stats.auto_increment_value = auto_inc;
osku's avatar
osku committed
5978 5979 5980 5981
	}

	prebuilt->trx->op_info = (char*)"";

5982
  	DBUG_RETURN(0);
osku's avatar
osku committed
5983 5984 5985 5986 5987 5988 5989 5990
}

/**************************************************************************
Updates index cardinalities of the table, based on 8 random dives into
each index tree. This does NOT calculate exact statistics on the table. */

int
ha_innobase::analyze(
5991
/*=================*/
osku's avatar
osku committed
5992 5993 5994 5995 5996 5997 5998 5999 6000 6001 6002
					/* out: returns always 0 (success) */
	THD*		thd,		/* in: connection thread handle */
	HA_CHECK_OPT*	check_opt)	/* in: currently ignored */
{
	/* Simply call ::info() with all the flags */
	info(HA_STATUS_TIME | HA_STATUS_CONST | HA_STATUS_VARIABLE);

	return(0);
}

/**************************************************************************
Handles OPTIMIZE TABLE. Nothing is done inside InnoDB here: the request is
mapped to "ALTER TABLE tablename ENGINE=InnoDB", which rebuilds the table
in MySQL. */

int
ha_innobase::optimize(
/*==================*/
					/* out: always HA_ADMIN_TRY_ALTER */
	THD*		thd,		/* in: connection thread handle;
					not used in this function */
	HA_CHECK_OPT*	check_opt)	/* in: currently ignored */
{
	/* The only effect of this method is the returned code. */
	return(HA_ADMIN_TRY_ALTER);
}

/***********************************************************************
Tries to check that an InnoDB table is not corrupted. If corruption is
noticed, prints to stderr information about it. In case of corruption
may also assert a failure and crash the server. */

int
ha_innobase::check(
/*===============*/
					/* out: HA_ADMIN_CORRUPT or
					HA_ADMIN_OK */
6025 6026
	THD*		thd,		/* in: user thread handle */
	HA_CHECK_OPT*	check_opt)	/* in: check options, currently
osku's avatar
osku committed
6027 6028 6029 6030
					ignored */
{
	ulint		ret;

6031
	DBUG_ASSERT(thd == ha_thd());
6032 6033
	ut_a(prebuilt->trx);
	ut_a(prebuilt->trx->magic_n == TRX_MAGIC_N);
6034
	ut_a(prebuilt->trx == thd_to_trx(thd));
osku's avatar
osku committed
6035 6036 6037 6038 6039 6040 6041 6042 6043 6044 6045 6046 6047 6048

	if (prebuilt->mysql_template == NULL) {
		/* Build the template; we will use a dummy template
		in index scans done in checking */

		build_template(prebuilt, NULL, table, ROW_MYSQL_WHOLE_ROW);
	}

	ret = row_check_table_for_mysql(prebuilt);

	if (ret == DB_SUCCESS) {
		return(HA_ADMIN_OK);
	}

6049
	return(HA_ADMIN_CORRUPT);
osku's avatar
osku committed
6050 6051 6052 6053 6054 6055 6056 6057 6058 6059 6060 6061
}

/*****************************************************************
Adds information about free space in the InnoDB tablespace to a table comment
which is printed out when a user calls SHOW TABLE STATUS. Adds also info on
foreign keys. */

char*
ha_innobase::update_table_comment(
/*==============================*/
				/* out: table comment + InnoDB free space +
				info on foreign keys */
6062
	const char*	comment)/* in: table comment defined by user */
osku's avatar
osku committed
6063
{
osku's avatar
osku committed
6064 6065
	uint	length = (uint) strlen(comment);
	char*	str;
osku's avatar
osku committed
6066
	long	flen;
osku's avatar
osku committed
6067 6068 6069 6070 6071 6072 6073 6074 6075

	/* We do not know if MySQL can call this function before calling
	external_lock(). To be safe, update the thd of the current table
	handle. */

	if (length > 64000 - 3) {
		return((char*)comment); /* string too long */
	}

6076
	update_thd(ha_thd());
osku's avatar
osku committed
6077 6078 6079 6080 6081 6082 6083 6084 6085

	prebuilt->trx->op_info = (char*)"returning table comment";

	/* In case MySQL calls this in the middle of a SELECT query, release
	possible adaptive hash latch to avoid deadlocks of threads */

	trx_search_latch_release_if_reserved(prebuilt->trx);
	str = NULL;

osku's avatar
osku committed
6086
	/* output the data to a temporary file */
osku's avatar
osku committed
6087

osku's avatar
osku committed
6088 6089 6090
	mutex_enter_noninline(&srv_dict_tmpfile_mutex);
	rewind(srv_dict_tmpfile);

6091 6092 6093
	fprintf(srv_dict_tmpfile, "InnoDB free: %llu kB",
		fsp_get_available_space_in_free_extents(
			prebuilt->table->space));
osku's avatar
osku committed
6094

osku's avatar
osku committed
6095
	dict_print_info_on_foreign_keys(FALSE, srv_dict_tmpfile,
osku's avatar
osku committed
6096
				prebuilt->trx, prebuilt->table);
osku's avatar
osku committed
6097 6098 6099 6100 6101 6102
	flen = ftell(srv_dict_tmpfile);
	if (flen < 0) {
		flen = 0;
	} else if (length + flen + 3 > 64000) {
		flen = 64000 - 3 - length;
	}
osku's avatar
osku committed
6103

osku's avatar
osku committed
6104 6105
	/* allocate buffer for the full string, and
	read the contents of the temporary file */
osku's avatar
osku committed
6106

marko's avatar
marko committed
6107
	str = (char*) my_malloc(length + flen + 3, MYF(0));
osku's avatar
osku committed
6108

osku's avatar
osku committed
6109 6110 6111 6112 6113 6114
	if (str) {
		char* pos	= str + length;
		if (length) {
			memcpy(str, comment, length);
			*pos++ = ';';
			*pos++ = ' ';
osku's avatar
osku committed
6115
		}
osku's avatar
osku committed
6116 6117 6118
		rewind(srv_dict_tmpfile);
		flen = (uint) fread(pos, 1, flen, srv_dict_tmpfile);
		pos[flen] = 0;
osku's avatar
osku committed
6119 6120
	}

osku's avatar
osku committed
6121 6122
	mutex_exit_noninline(&srv_dict_tmpfile_mutex);

6123
	prebuilt->trx->op_info = (char*)"";
osku's avatar
osku committed
6124

6125
	return(str ? str : (char*) comment);
osku's avatar
osku committed
6126 6127 6128 6129 6130 6131 6132 6133 6134 6135 6136 6137 6138
}

/***********************************************************************
Gets the foreign key create info for a table stored in InnoDB. */

char*
ha_innobase::get_foreign_key_create_info(void)
/*==========================================*/
			/* out, own: character string in the form which
			can be inserted to the CREATE TABLE statement,
			MUST be freed with ::free_foreign_key_create_info */
{
	char*	str	= 0;
osku's avatar
osku committed
6139
	long	flen;
osku's avatar
osku committed
6140 6141 6142 6143 6144 6145 6146

	ut_a(prebuilt != NULL);

	/* We do not know if MySQL can call this function before calling
	external_lock(). To be safe, update the thd of the current table
	handle. */

6147
	update_thd(ha_thd());
osku's avatar
osku committed
6148

osku's avatar
osku committed
6149
	prebuilt->trx->op_info = (char*)"getting info on foreign keys";
osku's avatar
osku committed
6150

osku's avatar
osku committed
6151 6152 6153
	/* In case MySQL calls this in the middle of a SELECT query,
	release possible adaptive hash latch to avoid
	deadlocks of threads */
osku's avatar
osku committed
6154

osku's avatar
osku committed
6155
	trx_search_latch_release_if_reserved(prebuilt->trx);
osku's avatar
osku committed
6156

osku's avatar
osku committed
6157 6158
	mutex_enter_noninline(&srv_dict_tmpfile_mutex);
	rewind(srv_dict_tmpfile);
osku's avatar
osku committed
6159

osku's avatar
osku committed
6160 6161
	/* output the data to a temporary file */
	dict_print_info_on_foreign_keys(TRUE, srv_dict_tmpfile,
osku's avatar
osku committed
6162
				prebuilt->trx, prebuilt->table);
osku's avatar
osku committed
6163
	prebuilt->trx->op_info = (char*)"";
osku's avatar
osku committed
6164

osku's avatar
osku committed
6165 6166 6167 6168 6169 6170
	flen = ftell(srv_dict_tmpfile);
	if (flen < 0) {
		flen = 0;
	} else if (flen > 64000 - 1) {
		flen = 64000 - 1;
	}
osku's avatar
osku committed
6171

osku's avatar
osku committed
6172 6173
	/* allocate buffer for the string, and
	read the contents of the temporary file */
osku's avatar
osku committed
6174

marko's avatar
marko committed
6175
	str = (char*) my_malloc(flen + 1, MYF(0));
osku's avatar
osku committed
6176

osku's avatar
osku committed
6177 6178 6179 6180
	if (str) {
		rewind(srv_dict_tmpfile);
		flen = (uint) fread(str, 1, flen, srv_dict_tmpfile);
		str[flen] = 0;
osku's avatar
osku committed
6181 6182
	}

osku's avatar
osku committed
6183 6184
	mutex_exit_noninline(&srv_dict_tmpfile_mutex);

6185
	return(str);
osku's avatar
osku committed
6186 6187 6188
}


6189
int
osku's avatar
osku committed
6190 6191 6192 6193 6194 6195
ha_innobase::get_foreign_key_list(THD *thd, List<FOREIGN_KEY_INFO> *f_key_list)
{
  dict_foreign_t* foreign;

  DBUG_ENTER("get_foreign_key_list");
  ut_a(prebuilt != NULL);
6196
  update_thd(ha_thd());
osku's avatar
osku committed
6197 6198 6199 6200 6201
  prebuilt->trx->op_info = (char*)"getting list of foreign keys";
  trx_search_latch_release_if_reserved(prebuilt->trx);
  mutex_enter_noninline(&(dict_sys->mutex));
  foreign = UT_LIST_GET_FIRST(prebuilt->table->foreign_list);

6202 6203 6204 6205
  while (foreign != NULL) {
	  uint i;
	  FOREIGN_KEY_INFO f_key_info;
	  LEX_STRING *name= 0;
marko's avatar
marko committed
6206
          uint ulen;
marko's avatar
marko committed
6207 6208
          char uname[NAME_LEN+1];           /* Unencoded name */
          char db_name[NAME_LEN+1];
6209 6210 6211 6212 6213 6214 6215
	  const char *tmp_buff;

	  tmp_buff= foreign->id;
	  i= 0;
	  while (tmp_buff[i] != '/')
		  i++;
	  tmp_buff+= i + 1;
6216 6217
	  f_key_info.forein_id = thd_make_lex_string(thd, 0,
		  tmp_buff, (uint) strlen(tmp_buff), 1);
6218
	  tmp_buff= foreign->referenced_table_name;
marko's avatar
marko committed
6219 6220

          /* Database name */
6221 6222
	  i= 0;
	  while (tmp_buff[i] != '/')
marko's avatar
marko committed
6223 6224 6225 6226 6227 6228
          {
            db_name[i]= tmp_buff[i];
            i++;
          }
          db_name[i]= 0;
          ulen= filename_to_tablename(db_name, uname, sizeof(uname));
6229 6230
	  f_key_info.referenced_db = thd_make_lex_string(thd, 0,
		  uname, ulen, 1);
marko's avatar
marko committed
6231 6232

          /* Table name */
6233
	  tmp_buff+= i + 1;
marko's avatar
marko committed
6234
          ulen= filename_to_tablename(tmp_buff, uname, sizeof(uname));
6235 6236
	  f_key_info.referenced_table = thd_make_lex_string(thd, 0,
		  uname, ulen, 1);
6237 6238 6239

	  for (i= 0;;) {
		  tmp_buff= foreign->foreign_col_names[i];
6240 6241
		  name = thd_make_lex_string(thd, name,
			  tmp_buff, (uint) strlen(tmp_buff), 1);
6242 6243
		  f_key_info.foreign_fields.push_back(name);
		  tmp_buff= foreign->referenced_col_names[i];
6244 6245
		  name = thd_make_lex_string(thd, name,
			tmp_buff, (uint) strlen(tmp_buff), 1);
6246 6247 6248 6249 6250
		  f_key_info.referenced_fields.push_back(name);
		  if (++i >= foreign->n_fields)
			  break;
	  }

6251 6252 6253 6254 6255 6256 6257 6258 6259 6260 6261 6262 6263 6264 6265 6266 6267 6268 6269 6270 6271
          ulong length;
          if (foreign->type & DICT_FOREIGN_ON_DELETE_CASCADE)
          {
            length=7;
            tmp_buff= "CASCADE";
          }	
          else if (foreign->type & DICT_FOREIGN_ON_DELETE_SET_NULL)
          {
            length=8;
            tmp_buff= "SET NULL";
          }
          else if (foreign->type & DICT_FOREIGN_ON_DELETE_NO_ACTION)
          {
            length=9;
            tmp_buff= "NO ACTION";
          }
          else
          {
            length=8;
            tmp_buff= "RESTRICT";
          }
6272 6273
	  f_key_info.delete_method = thd_make_lex_string(
		  thd, f_key_info.delete_method, tmp_buff, length, 1);
6274 6275 6276 6277 6278 6279 6280 6281 6282 6283 6284 6285 6286 6287 6288 6289 6290 6291 6292 6293 6294 6295
 
 
          if (foreign->type & DICT_FOREIGN_ON_UPDATE_CASCADE)
          {
            length=7;
            tmp_buff= "CASCADE";
          }
          else if (foreign->type & DICT_FOREIGN_ON_UPDATE_SET_NULL)
          {
            length=8;
            tmp_buff= "SET NULL";
          }
          else if (foreign->type & DICT_FOREIGN_ON_UPDATE_NO_ACTION)
          {
            length=9;
            tmp_buff= "NO ACTION";
          }
          else
          {
            length=8;
            tmp_buff= "RESTRICT";
          }
6296 6297
	  f_key_info.update_method = thd_make_lex_string(
		  thd, f_key_info.update_method, tmp_buff, length, 1);
marko's avatar
marko committed
6298 6299 6300
          if (foreign->referenced_index &&
              foreign->referenced_index->name)
          {
6301 6302 6303 6304
	    f_key_info.referenced_key_name = thd_make_lex_string(
		    thd, f_key_info.referenced_key_name,
		    foreign->referenced_index->name,
		    strlen(foreign->referenced_index->name), 1);
marko's avatar
marko committed
6305
          }
vasil's avatar
vasil committed
6306 6307
          else
            f_key_info.referenced_key_name= 0;
6308

6309
	  FOREIGN_KEY_INFO *pf_key_info = (FOREIGN_KEY_INFO *)
6310
		  thd_memdup(thd, &f_key_info, sizeof(FOREIGN_KEY_INFO));
6311 6312
	  f_key_list->push_back(pf_key_info);
	  foreign = UT_LIST_GET_NEXT(foreign_list, foreign);
osku's avatar
osku committed
6313 6314 6315
  }
  mutex_exit_noninline(&(dict_sys->mutex));
  prebuilt->trx->op_info = (char*)"";
6316

osku's avatar
osku committed
6317 6318 6319 6320 6321 6322 6323 6324 6325 6326 6327 6328 6329 6330
  DBUG_RETURN(0);
}

/*********************************************************************
Checks if ALTER TABLE may change the storage engine of the table.
Changing storage engines is not allowed for tables for which there
are foreign key constraints (parent or child tables). */

bool
ha_innobase::can_switch_engines(void)
/*=================================*/
{
	bool	can_switch;

6331
	DBUG_ENTER("ha_innobase::can_switch_engines");
6332

6333
	ut_a(prebuilt->trx == thd_to_trx(ha_thd()));
6334

osku's avatar
osku committed
6335 6336 6337 6338 6339 6340 6341 6342 6343 6344 6345 6346 6347 6348 6349 6350 6351 6352 6353 6354 6355 6356 6357 6358 6359 6360 6361 6362 6363 6364 6365 6366 6367 6368 6369 6370 6371 6372 6373
	prebuilt->trx->op_info =
			"determining if there are foreign key constraints";
	row_mysql_lock_data_dictionary(prebuilt->trx);

	can_switch = !UT_LIST_GET_FIRST(prebuilt->table->referenced_list)
			&& !UT_LIST_GET_FIRST(prebuilt->table->foreign_list);

	row_mysql_unlock_data_dictionary(prebuilt->trx);
	prebuilt->trx->op_info = "";

	DBUG_RETURN(can_switch);
}

/***********************************************************************
Checks if a table is referenced by a foreign key. The MySQL manual states that
a REPLACE is either equivalent to an INSERT, or DELETE(s) + INSERT. Only a
delete is then allowed internally to resolve a duplicate key conflict in
REPLACE, not an update. */

uint
ha_innobase::referenced_by_foreign_key(void)
/*========================================*/
			/* out: 1 if referenced by a FOREIGN KEY,
			0 otherwise */
{
	/* Normalize the result of the dictionary lookup to 0 or 1. */
	return(dict_table_referenced_by_foreign_key(prebuilt->table) ? 1 : 0);
}

/***********************************************************************
Frees the foreign key create info for a table stored in InnoDB, if it is
non-NULL. */

void
ha_innobase::free_foreign_key_create_info(
/*======================================*/
6374
	char*	str)	/* in, own: create info string to free	*/
osku's avatar
osku committed
6375 6376 6377 6378 6379 6380 6381 6382 6383 6384 6385 6386 6387 6388
{
	if (str) {
		my_free(str, MYF(0));
	}
}

/***********************************************************************
Tells something additional to the handler about how to do things. */

int
ha_innobase::extra(
/*===============*/
			   /* out: 0 or error number */
	enum ha_extra_function operation)
marko's avatar
marko committed
6389
			   /* in: HA_EXTRA_FLUSH or some other flag */
osku's avatar
osku committed
6390 6391 6392 6393 6394 6395
{
	/* Warning: since it is not sure that MySQL calls external_lock
	before calling this function, the trx field in prebuilt can be
	obsolete! */

	switch (operation) {
6396 6397 6398 6399 6400 6401
		case HA_EXTRA_FLUSH:
			if (prebuilt->blob_heap) {
				row_mysql_prebuilt_free_blob_heap(prebuilt);
			}
			break;
		case HA_EXTRA_RESET_STATE:
6402
			reset_template(prebuilt);
6403
			break;
osku's avatar
osku committed
6404
		case HA_EXTRA_NO_KEYREAD:
6405 6406 6407 6408 6409
			prebuilt->read_just_key = 0;
			break;
		case HA_EXTRA_KEYREAD:
			prebuilt->read_just_key = 1;
			break;
osku's avatar
osku committed
6410 6411 6412
		case HA_EXTRA_KEYREAD_PRESERVE_FIELDS:
			prebuilt->keep_other_fields_on_keyread = 1;
			break;
6413 6414 6415 6416 6417 6418 6419

			/* IMPORTANT: prebuilt->trx can be obsolete in
			this method, because it is not sure that MySQL
			calls external_lock before this method with the
			parameters below.  We must not invoke update_thd()
			either, because the calling threads may change.
			CAREFUL HERE, OR MEMORY CORRUPTION MAY OCCUR! */
6420
		case HA_EXTRA_IGNORE_DUP_KEY:
6421
			thd_to_trx(ha_thd())->duplicates |= TRX_DUP_IGNORE;
6422 6423
			break;
		case HA_EXTRA_WRITE_CAN_REPLACE:
6424
			thd_to_trx(ha_thd())->duplicates |= TRX_DUP_REPLACE;
6425 6426
			break;
		case HA_EXTRA_WRITE_CANNOT_REPLACE:
6427
			thd_to_trx(ha_thd())->duplicates &= ~TRX_DUP_REPLACE;
6428 6429
			break;
		case HA_EXTRA_NO_IGNORE_DUP_KEY:
6430
			thd_to_trx(ha_thd())->duplicates &=
6431 6432
				~(TRX_DUP_IGNORE | TRX_DUP_REPLACE);
			break;
osku's avatar
osku committed
6433 6434 6435 6436 6437 6438 6439
		default:/* Do nothing */
			;
	}

	return(0);
}

6440 6441 6442 6443
/**********************************************************************
Reset state of file to after 'open'.
This function is called after every statement for all tables used
by that statement.  */
marko's avatar
marko committed
6444 6445
int ha_innobase::reset()
{
6446 6447 6448 6449 6450 6451 6452 6453 6454 6455 6456
	if (prebuilt->blob_heap) {
		row_mysql_prebuilt_free_blob_heap(prebuilt);
	}

	reset_template(prebuilt);

	/* TODO: This should really be reset in reset_template() but for now
	it's safer to do it explicitly here. */

	/* This is a statement level counter. */
	prebuilt->last_value = 0;
marko's avatar
marko committed
6457

6458 6459
	return(0);
}
marko's avatar
marko committed
6460

osku's avatar
osku committed
6461 6462 6463 6464 6465 6466 6467 6468 6469
/**********************************************************************
MySQL calls this function at the start of each SQL statement inside LOCK
TABLES. Inside LOCK TABLES the ::external_lock method does not work to
mark SQL statement borders. Note also a special case: if a temporary table
is created inside LOCK TABLES, MySQL has not called external_lock() at all
on that table.
MySQL-5.0 also calls this before each statement in an execution of a stored
procedure. To make the execution more deterministic for binlogging, MySQL-5.0
locks all tables involved in a stored procedure with full explicit table
6470
locks (thd_in_lock_tables(thd) holds in store_lock()) before executing the
osku's avatar
osku committed
6471 6472 6473 6474 6475
procedure. */

int
ha_innobase::start_stmt(
/*====================*/
6476 6477 6478
				/* out: 0 or error code */
	THD*		thd,	/* in: handle to the user thread */
	thr_lock_type	lock_type)
osku's avatar
osku committed
6479 6480 6481 6482 6483 6484 6485 6486 6487 6488 6489 6490 6491 6492 6493 6494
{
	trx_t*		trx;

	update_thd(thd);

	trx = prebuilt->trx;

	/* Here we release the search latch and the InnoDB thread FIFO ticket
	if they were reserved. They should have been released already at the
	end of the previous statement, but because inside LOCK TABLES the
	lock count method does not work to mark the end of a SELECT statement,
	that may not be the case. We MUST release the search latch before an
	INSERT, for example. */

	innobase_release_stat_resources(trx);

sunny's avatar
sunny committed
6495 6496 6497
	/* Reset the AUTOINC statement level counter for multi-row INSERTs. */
	trx->n_autoinc_rows = 0;

osku's avatar
osku committed
6498 6499
	prebuilt->sql_stat_start = TRUE;
	prebuilt->hint_need_to_fetch_extra_cols = 0;
6500
	reset_template(prebuilt);
osku's avatar
osku committed
6501 6502

	if (!prebuilt->mysql_has_locked) {
6503 6504 6505 6506 6507 6508
		/* This handle is for a temporary table created inside
		this same LOCK TABLES; since MySQL does NOT call external_lock
		in this case, we must use x-row locks inside InnoDB to be
		prepared for an update of a row */

		prebuilt->select_lock_type = LOCK_X;
osku's avatar
osku committed
6509 6510
	} else {
		if (trx->isolation_level != TRX_ISO_SERIALIZABLE
6511
			&& thd_sql_command(thd) == SQLCOM_SELECT
6512 6513
			&& lock_type == TL_READ) {

osku's avatar
osku committed
6514 6515 6516 6517 6518 6519 6520 6521 6522
			/* For other than temporary tables, we obtain
			no lock for consistent read (plain SELECT). */

			prebuilt->select_lock_type = LOCK_NONE;
		} else {
			/* Not a consistent read: restore the
			select_lock_type value. The value of
			stored_select_lock_type was decided in:
			1) ::store_lock(),
6523 6524
			2) ::external_lock(),
			3) ::init_table_handle_for_HANDLER(), and
6525
			4) ::transactional_table_lock(). */
osku's avatar
osku committed
6526 6527 6528 6529 6530 6531 6532 6533 6534

			prebuilt->select_lock_type =
				prebuilt->stored_select_lock_type;
		}
	}

	trx->detailed_error[0] = '\0';

	/* Set the MySQL flag to mark that there is an active transaction */
6535
	if (trx->active_trans == 0) {
osku's avatar
osku committed
6536

6537
		innobase_register_trx_and_stmt(ht, thd);
6538 6539
		trx->active_trans = 1;
	} else {
6540
		innobase_register_stmt(ht, thd);
osku's avatar
osku committed
6541 6542 6543 6544 6545 6546 6547 6548 6549 6550 6551 6552 6553 6554 6555 6556 6557 6558 6559 6560
	}

	return(0);
}

/**********************************************************************
Maps a MySQL trx isolation level code to the InnoDB isolation level code.
An unknown MySQL code triggers the assertion ut_a(0). */
inline
ulint
innobase_map_isolation_level(
/*=========================*/
					/* out: InnoDB isolation level */
	enum_tx_isolation	iso)	/* in: MySQL isolation level code */
{
	switch (iso) {
	case ISO_READ_UNCOMMITTED:
		return(TRX_ISO_READ_UNCOMMITTED);

	case ISO_READ_COMMITTED:
		return(TRX_ISO_READ_COMMITTED);

	case ISO_REPEATABLE_READ:
		return(TRX_ISO_REPEATABLE_READ);

	case ISO_SERIALIZABLE:
		return(TRX_ISO_SERIALIZABLE);

	default:
		break;
	}

	/* None of the known codes matched. */
	ut_a(0);

	return(0);
}
6563

osku's avatar
osku committed
6564 6565 6566 6567 6568 6569 6570 6571 6572 6573 6574 6575
/**********************************************************************
As MySQL will execute an external lock for every new table it uses when it
starts to process an SQL statement (an exception is when MySQL calls
start_stmt for the handle) we can use this function to store the pointer to
the THD in the handle. We will also use this function to communicate
to InnoDB that a new SQL statement has started and that we must store a
savepoint to our transaction handle, so that we are able to roll back
the SQL statement in case of an error. */

int
ha_innobase::external_lock(
/*=======================*/
6576
				/* out: 0 */
osku's avatar
osku committed
6577
	THD*	thd,		/* in: handle to the user thread */
6578
	int	lock_type)	/* in: lock type */
osku's avatar
osku committed
6579 6580 6581
{
	trx_t*		trx;

6582
	DBUG_ENTER("ha_innobase::external_lock");
osku's avatar
osku committed
6583 6584 6585 6586
	DBUG_PRINT("enter",("lock_type: %d", lock_type));

	update_thd(thd);

6587 6588 6589 6590 6591 6592 6593 6594 6595 6596 6597 6598 6599 6600 6601 6602 6603 6604 6605 6606 6607 6608 6609
	/* Statement based binlogging does not work in isolation level
	READ UNCOMMITTED and READ COMMITTED since the necessary
	locks cannot be taken. In this case, we print an
	informative error message and return with an error. */
	if (lock_type == F_WRLCK)
	{
		ulong const binlog_format= thd_binlog_format(thd);
		ulong const tx_isolation = thd_tx_isolation(current_thd);
		if (tx_isolation <= ISO_READ_COMMITTED &&
		    binlog_format == BINLOG_FORMAT_STMT)
		{
			char buf[256];
			my_snprintf(buf, sizeof(buf),
				    "Transaction level '%s' in"
				    " InnoDB is not safe for binlog mode '%s'",
				    tx_isolation_names[tx_isolation],
				    binlog_format_names[binlog_format]);
			my_error(ER_BINLOG_LOGGING_IMPOSSIBLE, MYF(0), buf);
			DBUG_RETURN(HA_ERR_LOGGING_IMPOSSIBLE);
		}
	}


osku's avatar
osku committed
6610 6611 6612 6613 6614
	trx = prebuilt->trx;

	prebuilt->sql_stat_start = TRUE;
	prebuilt->hint_need_to_fetch_extra_cols = 0;

6615
	reset_template(prebuilt);
osku's avatar
osku committed
6616 6617 6618 6619 6620 6621 6622 6623 6624 6625 6626 6627 6628

	if (lock_type == F_WRLCK) {

		/* If this is a SELECT, then it is in UPDATE TABLE ...
		or SELECT ... FOR UPDATE */
		prebuilt->select_lock_type = LOCK_X;
		prebuilt->stored_select_lock_type = LOCK_X;
	}

	if (lock_type != F_UNLCK) {
		/* MySQL is setting a new table lock */

		trx->detailed_error[0] = '\0';
6629

osku's avatar
osku committed
6630 6631
		/* Set the MySQL flag to mark that there is an active
		transaction */
6632
		if (trx->active_trans == 0) {
osku's avatar
osku committed
6633

6634
			innobase_register_trx_and_stmt(ht, thd);
6635 6636
			trx->active_trans = 1;
		} else if (trx->n_mysql_tables_in_use == 0) {
6637
			innobase_register_stmt(ht, thd);
osku's avatar
osku committed
6638 6639 6640
		}

		if (trx->isolation_level == TRX_ISO_SERIALIZABLE
6641
			&& prebuilt->select_lock_type == LOCK_NONE
6642 6643
			&& thd_test_options(thd,
				OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN)) {
osku's avatar
osku committed
6644 6645 6646 6647 6648 6649 6650 6651 6652 6653 6654 6655 6656 6657 6658 6659 6660

			/* To get serializable execution, we let InnoDB
			conceptually add 'LOCK IN SHARE MODE' to all SELECTs
			which otherwise would have been consistent reads. An
			exception is consistent reads in the AUTOCOMMIT=1 mode:
			we know that they are read-only transactions, and they
			can be serialized also if performed as consistent
			reads. */

			prebuilt->select_lock_type = LOCK_S;
			prebuilt->stored_select_lock_type = LOCK_S;
		}

		/* Starting from 4.1.9, no InnoDB table lock is taken in LOCK
		TABLES if AUTOCOMMIT=1. It does not make much sense to acquire
		an InnoDB table lock if it is released immediately at the end
		of LOCK TABLES, and InnoDB's table locks in that case cause
6661
		VERY easily deadlocks.
jan's avatar
jan committed
6662 6663

		We do not set InnoDB table locks if user has not explicitly
6664 6665
		requested a table lock. Note that thd_in_lock_tables(thd)
		can hold in some cases, e.g., at the start of a stored
jan's avatar
jan committed
6666
		procedure call (SQLCOM_CALL). */
osku's avatar
osku committed
6667 6668 6669

		if (prebuilt->select_lock_type != LOCK_NONE) {

6670 6671 6672
			if (thd_sql_command(thd) == SQLCOM_LOCK_TABLES
			    && THDVAR(thd, table_locks)
			    && thd_test_options(thd, OPTION_NOT_AUTOCOMMIT)
6673
			    && thd_in_lock_tables(thd)) {
osku's avatar
osku committed
6674

6675 6676
				ulint	error = row_lock_table_for_mysql(
					prebuilt, NULL, 0);
osku's avatar
osku committed
6677 6678 6679

				if (error != DB_SUCCESS) {
					error = convert_error_code_to_mysql(
6680
						(int) error, thd);
osku's avatar
osku committed
6681 6682 6683 6684
					DBUG_RETURN((int) error);
				}
			}

6685
			trx->mysql_n_tables_locked++;
osku's avatar
osku committed
6686 6687
		}

6688 6689 6690
		trx->n_mysql_tables_in_use++;
		prebuilt->mysql_has_locked = TRUE;

osku's avatar
osku committed
6691 6692 6693 6694 6695 6696 6697 6698
		DBUG_RETURN(0);
	}

	/* MySQL is releasing a table lock */

	trx->n_mysql_tables_in_use--;
	prebuilt->mysql_has_locked = FALSE;

vasil's avatar
vasil committed
6699 6700 6701 6702 6703 6704
	/* Release a possible FIFO ticket and search latch. Since we
	may reserve the kernel mutex, we have to release the search
	system latch first to obey the latching order. */

	innobase_release_stat_resources(trx);

osku's avatar
osku committed
6705 6706 6707 6708 6709
	/* If the MySQL lock count drops to zero we know that the current SQL
	statement has ended */

	if (trx->n_mysql_tables_in_use == 0) {

6710
		trx->mysql_n_tables_locked = 0;
osku's avatar
osku committed
6711
		prebuilt->used_in_HANDLER = FALSE;
6712

6713
		if (!thd_test_options(thd, OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN)) {
6714
			if (trx->active_trans != 0) {
6715
				innobase_commit(ht, thd, TRUE);
osku's avatar
osku committed
6716 6717 6718
			}
		} else {
			if (trx->isolation_level <= TRX_ISO_READ_COMMITTED
6719
						&& trx->global_read_view) {
osku's avatar
osku committed
6720 6721 6722 6723 6724 6725 6726 6727 6728 6729 6730 6731 6732 6733 6734 6735 6736 6737 6738

				/* At low transaction isolation levels we let
				each consistent read set its own snapshot */

				read_view_close_for_mysql(trx);
			}
		}
	}

	DBUG_RETURN(0);
}

/**********************************************************************
With this function MySQL request a transactional lock to a table when
user issued query LOCK TABLES..WHERE ENGINE = InnoDB. */

int
ha_innobase::transactional_table_lock(
/*==================================*/
6739
				/* out: error code */
osku's avatar
osku committed
6740
	THD*	thd,		/* in: handle to the user thread */
6741
	int	lock_type)	/* in: lock type */
osku's avatar
osku committed
6742 6743 6744
{
	trx_t*		trx;

6745
	DBUG_ENTER("ha_innobase::transactional_table_lock");
osku's avatar
osku committed
6746 6747 6748 6749 6750 6751 6752 6753
	DBUG_PRINT("enter",("lock_type: %d", lock_type));

	/* We do not know if MySQL can call this function before calling
	external_lock(). To be safe, update the thd of the current table
	handle. */

	update_thd(thd);

6754
	if (prebuilt->table->ibd_file_missing && !thd_tablespace_op(thd)) {
6755
		ut_print_timestamp(stderr);
6756 6757 6758 6759 6760 6761 6762 6763 6764 6765 6766
		fprintf(stderr,
			"  InnoDB: MySQL is trying to use a table handle"
			" but the .ibd file for\n"
			"InnoDB: table %s does not exist.\n"
			"InnoDB: Have you deleted the .ibd file"
			" from the database directory under\n"
			"InnoDB: the MySQL datadir?"
			"InnoDB: See"
			" http://dev.mysql.com/doc/refman/5.1/en/innodb-troubleshooting.html\n"
			"InnoDB: how you can resolve the problem.\n",
			prebuilt->table->name);
osku's avatar
osku committed
6767 6768 6769 6770 6771 6772 6773 6774
		DBUG_RETURN(HA_ERR_CRASHED);
	}

	trx = prebuilt->trx;

	prebuilt->sql_stat_start = TRUE;
	prebuilt->hint_need_to_fetch_extra_cols = 0;

6775
	reset_template(prebuilt);
osku's avatar
osku committed
6776 6777 6778 6779 6780 6781 6782 6783

	if (lock_type == F_WRLCK) {
		prebuilt->select_lock_type = LOCK_X;
		prebuilt->stored_select_lock_type = LOCK_X;
	} else if (lock_type == F_RDLCK) {
		prebuilt->select_lock_type = LOCK_S;
		prebuilt->stored_select_lock_type = LOCK_S;
	} else {
6784 6785
		ut_print_timestamp(stderr);
		fprintf(stderr, "  InnoDB error:\n"
osku's avatar
osku committed
6786 6787 6788 6789 6790 6791 6792 6793 6794
"MySQL is trying to set transactional table lock with corrupted lock type\n"
"to table %s, lock type %d does not exist.\n",
				prebuilt->table->name, lock_type);
		DBUG_RETURN(HA_ERR_CRASHED);
	}

	/* MySQL is setting a new transactional table lock */

	/* Set the MySQL flag to mark that there is an active transaction */
6795
	if (trx->active_trans == 0) {
osku's avatar
osku committed
6796

6797
		innobase_register_trx_and_stmt(ht, thd);
6798 6799
		trx->active_trans = 1;
	}
osku's avatar
osku committed
6800

6801
	if (THDVAR(thd, table_locks) && thd_in_lock_tables(thd)) {
osku's avatar
osku committed
6802 6803 6804 6805 6806
		ulint	error = DB_SUCCESS;

		error = row_lock_table_for_mysql(prebuilt, NULL, 0);

		if (error != DB_SUCCESS) {
6807
			error = convert_error_code_to_mysql((int) error, thd);
osku's avatar
osku committed
6808 6809 6810
			DBUG_RETURN((int) error);
		}

6811
		if (thd_test_options(thd, OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN)) {
osku's avatar
osku committed
6812

6813 6814
			/* Store the current undo_no of the transaction
			so that we know where to roll back if we have
osku's avatar
osku committed
6815 6816 6817 6818 6819 6820 6821 6822 6823 6824 6825
			to roll back the next SQL statement */

			trx_mark_sql_stat_end(trx);
		}
	}

	DBUG_RETURN(0);
}

/****************************************************************************
Here we export InnoDB status variables to MySQL.  */
6826
static
osku's avatar
osku committed
6827
int
6828 6829
innodb_export_status()
/*==================*/
osku's avatar
osku committed
6830
{
6831 6832 6833 6834 6835
	if (innodb_inited) {
		srv_export_innodb_status();
	}

	return 0;
osku's avatar
osku committed
6836 6837 6838 6839 6840
}

/****************************************************************************
Implements the SHOW INNODB STATUS command. Sends the output of the InnoDB
Monitor to the client. */
6841
static
osku's avatar
osku committed
6842 6843 6844
bool
innodb_show_status(
/*===============*/
6845
	handlerton*	hton,	/* in: the innodb handlerton */
osku's avatar
osku committed
6846 6847
	THD*	thd,	/* in: the MySQL query thread of the caller */
	stat_print_fn *stat_print)
osku's avatar
osku committed
6848 6849 6850 6851 6852 6853 6854
{
	trx_t*			trx;
	static const char	truncated_msg[] = "... truncated...\n";
	const long		MAX_STATUS_SIZE = 64000;
	ulint			trx_list_start = ULINT_UNDEFINED;
	ulint			trx_list_end = ULINT_UNDEFINED;

6855
	DBUG_ENTER("innodb_show_status");
osku's avatar
osku committed
6856

6857
	trx = check_trx_exists(thd);
osku's avatar
osku committed
6858 6859 6860 6861 6862 6863 6864 6865 6866 6867 6868 6869 6870 6871 6872 6873 6874 6875 6876 6877 6878 6879 6880 6881 6882 6883 6884 6885 6886

	innobase_release_stat_resources(trx);

	/* We let the InnoDB Monitor to output at most MAX_STATUS_SIZE
	bytes of text. */

	long	flen, usable_len;
	char*	str;

	mutex_enter_noninline(&srv_monitor_file_mutex);
	rewind(srv_monitor_file);
	srv_printf_innodb_monitor(srv_monitor_file,
				&trx_list_start, &trx_list_end);
	flen = ftell(srv_monitor_file);
	os_file_set_eof(srv_monitor_file);

	if (flen < 0) {
		flen = 0;
	}

	if (flen > MAX_STATUS_SIZE) {
		usable_len = MAX_STATUS_SIZE;
	} else {
		usable_len = flen;
	}

	/* allocate buffer for the string, and
	read the contents of the temporary file */

marko's avatar
marko committed
6887
	if (!(str = (char*) my_malloc(usable_len + 1, MYF(0)))) {
6888 6889 6890
	  mutex_exit_noninline(&srv_monitor_file_mutex);
	  DBUG_RETURN(TRUE);
	}
osku's avatar
osku committed
6891 6892 6893 6894 6895 6896 6897 6898 6899 6900 6901 6902 6903 6904 6905 6906 6907 6908 6909 6910 6911 6912 6913 6914

	rewind(srv_monitor_file);
	if (flen < MAX_STATUS_SIZE) {
		/* Display the entire output. */
		flen = (long) fread(str, 1, flen, srv_monitor_file);
	} else if (trx_list_end < (ulint) flen
			&& trx_list_start < trx_list_end
			&& trx_list_start + (flen - trx_list_end)
			< MAX_STATUS_SIZE - sizeof truncated_msg - 1) {
		/* Omit the beginning of the list of active transactions. */
		long len = (long) fread(str, 1, trx_list_start, srv_monitor_file);
		memcpy(str + len, truncated_msg, sizeof truncated_msg - 1);
		len += sizeof truncated_msg - 1;
		usable_len = (MAX_STATUS_SIZE - 1) - len;
		fseek(srv_monitor_file, flen - usable_len, SEEK_SET);
		len += (long) fread(str + len, 1, usable_len, srv_monitor_file);
		flen = len;
	} else {
		/* Omit the end of the output. */
		flen = (long) fread(str, 1, MAX_STATUS_SIZE - 1, srv_monitor_file);
	}

	mutex_exit_noninline(&srv_monitor_file_mutex);

osku's avatar
osku committed
6915
	bool result = FALSE;
osku's avatar
osku committed
6916

marko's avatar
marko committed
6917
	if (stat_print(thd, innobase_hton_name, strlen(innobase_hton_name),
6918
			STRING_WITH_LEN(""), str, flen)) {
osku's avatar
osku committed
6919
		result= TRUE;
osku's avatar
osku committed
6920
	}
osku's avatar
osku committed
6921
	my_free(str, MYF(0));
osku's avatar
osku committed
6922

osku's avatar
osku committed
6923
	DBUG_RETURN(FALSE);
osku's avatar
osku committed
6924 6925 6926 6927
}

/****************************************************************************
Implements the SHOW MUTEX STATUS command. . */
6928
static
osku's avatar
osku committed
6929 6930
bool
innodb_mutex_show_status(
6931
/*=====================*/
6932
	handlerton*	hton,	/* in: the innodb handlerton */
6933 6934 6935 6936 6937 6938
	THD*		thd,		/* in: the MySQL query thread of the
					caller */
	stat_print_fn*	stat_print)
{
	char buf1[IO_SIZE], buf2[IO_SIZE];
	mutex_t*  mutex;
6939
#ifdef UNIV_DEBUG
6940 6941 6942 6943 6944 6945
	ulint	  rw_lock_count= 0;
	ulint	  rw_lock_count_spin_loop= 0;
	ulint	  rw_lock_count_spin_rounds= 0;
	ulint	  rw_lock_count_os_wait= 0;
	ulint	  rw_lock_count_os_yield= 0;
	ulonglong rw_lock_wait_time= 0;
6946
#endif /* UNIV_DEBUG */
marko's avatar
marko committed
6947
	uint	  hton_name_len= strlen(innobase_hton_name), buf1len, buf2len;
6948
	DBUG_ENTER("innodb_mutex_show_status");
osku's avatar
osku committed
6949

6950
	mutex_enter_noninline(&mutex_list_mutex);
osku's avatar
osku committed
6951

6952 6953 6954
	mutex = UT_LIST_GET_FIRST(mutex_list);

	while (mutex != NULL) {
6955
#ifdef UNIV_DEBUG
6956 6957 6958 6959 6960 6961 6962 6963 6964 6965 6966 6967 6968 6969 6970
		if (mutex->mutex_type != 1) {
			if (mutex->count_using > 0) {
				buf1len= my_snprintf(buf1, sizeof(buf1),
					"%s:%s",
					mutex->cmutex_name, mutex->cfile_name);
				buf2len= my_snprintf(buf2, sizeof(buf2),
					"count=%lu, spin_waits=%lu,"
					" spin_rounds=%lu, "
					"os_waits=%lu, os_yields=%lu,"
					" os_wait_times=%lu",
					mutex->count_using,
					mutex->count_spin_loop,
					mutex->count_spin_rounds,
					mutex->count_os_wait,
					mutex->count_os_yield,
marko's avatar
marko committed
6971
					(ulong) (mutex->lspent_time/1000));
6972

marko's avatar
marko committed
6973
				if (stat_print(thd, innobase_hton_name,
6974 6975
						hton_name_len, buf1, buf1len,
						buf2, buf2len)) {
6976 6977
					mutex_exit_noninline(
						&mutex_list_mutex);
6978 6979 6980 6981 6982 6983 6984 6985 6986 6987 6988 6989
					DBUG_RETURN(1);
				}
			}
		}
		else {
			rw_lock_count += mutex->count_using;
			rw_lock_count_spin_loop += mutex->count_spin_loop;
			rw_lock_count_spin_rounds += mutex->count_spin_rounds;
			rw_lock_count_os_wait += mutex->count_os_wait;
			rw_lock_count_os_yield += mutex->count_os_yield;
			rw_lock_wait_time += mutex->lspent_time;
		}
6990 6991 6992 6993 6994 6995 6996 6997 6998 6999 7000 7001 7002
#else /* UNIV_DEBUG */
		buf1len= my_snprintf(buf1, sizeof(buf1), "%s:%lu",
				     mutex->cfile_name, (ulong) mutex->cline);
		buf2len= my_snprintf(buf2, sizeof(buf2), "os_waits=%lu",
				     mutex->count_os_wait);

		if (stat_print(thd, innobase_hton_name,
			       hton_name_len, buf1, buf1len,
			       buf2, buf2len)) {
			mutex_exit_noninline(&mutex_list_mutex);
			DBUG_RETURN(1);
		}
#endif /* UNIV_DEBUG */
osku's avatar
osku committed
7003

7004 7005 7006
		mutex = UT_LIST_GET_NEXT(list, mutex);
	}

7007 7008 7009
	mutex_exit_noninline(&mutex_list_mutex);

#ifdef UNIV_DEBUG
7010 7011 7012 7013 7014 7015
	buf2len= my_snprintf(buf2, sizeof(buf2),
		"count=%lu, spin_waits=%lu, spin_rounds=%lu, "
		"os_waits=%lu, os_yields=%lu, os_wait_times=%lu",
		rw_lock_count, rw_lock_count_spin_loop,
		rw_lock_count_spin_rounds,
		rw_lock_count_os_wait, rw_lock_count_os_yield,
marko's avatar
marko committed
7016
		(ulong) (rw_lock_wait_time/1000));
7017

marko's avatar
marko committed
7018
	if (stat_print(thd, innobase_hton_name, hton_name_len,
7019 7020 7021
			STRING_WITH_LEN("rw_lock_mutexes"), buf2, buf2len)) {
		DBUG_RETURN(1);
	}
7022
#endif /* UNIV_DEBUG */
7023 7024

	DBUG_RETURN(FALSE);
osku's avatar
osku committed
7025 7026
}

7027
static
7028 7029 7030
bool innobase_show_status(handlerton *hton, THD* thd, 
                          stat_print_fn* stat_print,
                          enum ha_stat_type stat_type)
7031 7032 7033
{
	switch (stat_type) {
	case HA_ENGINE_STATUS:
7034
		return innodb_show_status(hton, thd, stat_print);
7035
	case HA_ENGINE_MUTEX:
7036
		return innodb_mutex_show_status(hton, thd, stat_print);
7037 7038 7039
	default:
		return FALSE;
	}
osku's avatar
osku committed
7040 7041 7042
}


osku's avatar
osku committed
7043 7044 7045 7046 7047
/****************************************************************************
 Handling the shared INNOBASE_SHARE structure that is needed to provide table
 locking.
****************************************************************************/

7048
static uchar* innobase_get_key(INNOBASE_SHARE* share, size_t *length,
7049 7050 7051 7052
	my_bool not_used __attribute__((unused)))
{
	*length=share->table_name_length;

7053
	return (uchar*) share->table_name;
osku's avatar
osku committed
7054 7055
}

7056
static INNOBASE_SHARE* get_share(const char* table_name)
osku's avatar
osku committed
7057
{
7058 7059 7060 7061 7062
	INNOBASE_SHARE *share;
	pthread_mutex_lock(&innobase_share_mutex);
	uint length=(uint) strlen(table_name);

	if (!(share=(INNOBASE_SHARE*) hash_search(&innobase_open_tables,
7063
				(uchar*) table_name,
7064 7065
				length))) {

osku's avatar
osku committed
7066 7067
		share = (INNOBASE_SHARE *) my_malloc(sizeof(*share)+length+1,
			MYF(MY_FAE | MY_ZEROFILL));
7068

osku's avatar
osku committed
7069 7070 7071 7072 7073
		share->table_name_length=length;
		share->table_name=(char*) (share+1);
		strmov(share->table_name,table_name);

		if (my_hash_insert(&innobase_open_tables,
7074
				(uchar*) share)) {
osku's avatar
osku committed
7075
			pthread_mutex_unlock(&innobase_share_mutex);
marko's avatar
marko committed
7076
			my_free(share,0);
osku's avatar
osku committed
7077 7078

			return 0;
7079
		}
osku's avatar
osku committed
7080 7081 7082

		thr_lock_init(&share->lock);
		pthread_mutex_init(&share->mutex,MY_MUTEX_INIT_FAST);
7083 7084 7085 7086 7087 7088 7089 7090 7091 7092 7093 7094 7095
	}

	share->use_count++;
	pthread_mutex_unlock(&innobase_share_mutex);

	return share;
}

/* Drops one reference to share. When use_count reaches zero the share is
removed from innobase_open_tables, its lock and mutex are destroyed and its
memory is freed. Everything is done while holding innobase_share_mutex. */
static void free_share(INNOBASE_SHARE* share)
{
	pthread_mutex_lock(&innobase_share_mutex);

	if (!--share->use_count) {
		hash_delete(&innobase_open_tables, (uchar*) share);
		thr_lock_delete(&share->lock);
		pthread_mutex_destroy(&share->mutex);
		my_free(share, MYF(0));
	}

	pthread_mutex_unlock(&innobase_share_mutex);
}

/*********************************************************************
Converts a MySQL table lock stored in the 'lock' field of the handle to
a proper type before storing pointer to the lock into an array of pointers.
MySQL also calls this if it wants to reset some table locks to a not-locked
state during the processing of an SQL query. An example is that during a
SELECT the read lock is released early on the 'const' tables where we only
fetch one row. MySQL does not call this when it releases all locks at the
end of an SQL statement. */

THR_LOCK_DATA**
ha_innobase::store_lock(
/*====================*/
						/* out: pointer to the next
						element in the 'to' array */
	THD*			thd,		/* in: user thread handle */
	THR_LOCK_DATA**		to,		/* in: pointer to an array
						of pointers to lock structs;
						pointer to the 'lock' field
						of current handle is stored
						next to this array */
	enum thr_lock_type	lock_type)	/* in: lock type to store in
						'lock'; this may also be
						TL_IGNORE */
{
	trx_t*		trx;

	/* Note that trx in this function is NOT necessarily prebuilt->trx
	because we call update_thd() later, in ::external_lock()! Failure to
	understand this caused a serious memory corruption bug in 5.1.11. */

	trx = check_trx_exists(thd);

	/* NOTE: MySQL can call this function with lock 'type' TL_IGNORE!
	Be careful to ignore TL_IGNORE if we are going to do something with
	only 'real' locks! */

	/* If no MySQL table is in use, we need to set the isolation level
	of the transaction. */

	if (lock_type != TL_IGNORE
	    && trx->n_mysql_tables_in_use == 0) {
		trx->isolation_level = innobase_map_isolation_level(
			(enum_tx_isolation) thd_tx_isolation(thd));

		if (trx->isolation_level <= TRX_ISO_READ_COMMITTED
		    && trx->global_read_view) {

			/* At low transaction isolation levels we let
			each consistent read set its own snapshot */

			read_view_close_for_mysql(trx);
		}
	}

	DBUG_ASSERT(thd == current_thd);
	const bool in_lock_tables = thd_in_lock_tables(thd);
	const uint sql_command = thd_sql_command(thd);

	if (sql_command == SQLCOM_DROP_TABLE) {

		/* MySQL calls this function in DROP TABLE though this table
		handle may belong to another thd that is running a query. Let
		us in that case skip any changes to the prebuilt struct. */

	} else if ((lock_type == TL_READ && in_lock_tables)
		   || (lock_type == TL_READ_HIGH_PRIORITY && in_lock_tables)
		   || lock_type == TL_READ_WITH_SHARED_LOCKS
		   || lock_type == TL_READ_NO_INSERT
		   || (lock_type != TL_IGNORE
		       && sql_command != SQLCOM_SELECT)) {

		/* The OR cases above are in this order:
		1) MySQL is doing LOCK TABLES ... READ LOCAL, or we
		are processing a stored procedure or function, or
		2) (we do not know when TL_READ_HIGH_PRIORITY is used), or
		3) this is a SELECT ... IN SHARE MODE, or
		4) we are doing a complex SQL statement like
		INSERT INTO ... SELECT ... and the logical logging (MySQL
		binlog) requires the use of a locking read, or
		MySQL is doing LOCK TABLES ... READ.
		5) we let InnoDB do locking reads for all SQL statements that
		are not simple SELECTs; note that select_lock_type in this
		case may get strengthened in ::external_lock() to LOCK_X.
		Note that we MUST use a locking read in all data modifying
		SQL statements, because otherwise the execution would not be
		serializable, and also the results from the update could be
		unexpected if an obsolete consistent read view would be
		used. */

		ulint	isolation_level;

		isolation_level = trx->isolation_level;

		if ((srv_locks_unsafe_for_binlog
		     || isolation_level == TRX_ISO_READ_COMMITTED)
		    && isolation_level != TRX_ISO_SERIALIZABLE
		    && (lock_type == TL_READ || lock_type == TL_READ_NO_INSERT)
		    && (sql_command == SQLCOM_INSERT_SELECT
			|| sql_command == SQLCOM_UPDATE
			|| sql_command == SQLCOM_CREATE_TABLE)) {

			/* If we either have innobase_locks_unsafe_for_binlog
			option set or this session is using READ COMMITTED
			isolation level and isolation level of the transaction
			is not set to serializable and MySQL is doing
			INSERT INTO...SELECT or UPDATE ... = (SELECT ...) or
			CREATE  ... SELECT... without FOR UPDATE or
			IN SHARE MODE in select, then we use consistent
			read for select. */

			prebuilt->select_lock_type = LOCK_NONE;
			prebuilt->stored_select_lock_type = LOCK_NONE;
		} else if (sql_command == SQLCOM_CHECKSUM) {
			/* Use consistent read for checksum table */

			prebuilt->select_lock_type = LOCK_NONE;
			prebuilt->stored_select_lock_type = LOCK_NONE;
		} else {
			prebuilt->select_lock_type = LOCK_S;
			prebuilt->stored_select_lock_type = LOCK_S;
		}

	} else if (lock_type != TL_IGNORE) {

		/* We set possible LOCK_X value in external_lock, not yet
		here even if this would be SELECT ... FOR UPDATE */

		prebuilt->select_lock_type = LOCK_NONE;
		prebuilt->stored_select_lock_type = LOCK_NONE;
	}

	if (lock_type != TL_IGNORE && lock.type == TL_UNLOCK) {

		/* Starting from 5.0.7, we weaken also the table locks
		set at the start of a MySQL stored procedure call, just like
		we weaken the locks set at the start of an SQL statement.
		MySQL does set in_lock_tables TRUE there, but in reality
		we do not need table locks to make the execution of a
		single transaction stored procedure call deterministic
		(if it does not use a consistent read). */

		if (lock_type == TL_READ
		    && sql_command == SQLCOM_LOCK_TABLES) {
			/* We come here if MySQL is processing LOCK TABLES
			... READ LOCAL. MyISAM under that table lock type
			reads the table as it was at the time the lock was
			granted (new inserts are allowed, but not seen by the
			reader). To get a similar effect on an InnoDB table,
			we must use LOCK TABLES ... READ. We convert the lock
			type here, so that for InnoDB, READ LOCAL is
			equivalent to READ. This will change the InnoDB
			behavior in mysqldump, so that dumps of InnoDB tables
			are consistent with dumps of MyISAM tables. */

			lock_type = TL_READ_NO_INSERT;
		}

		/* If we are not doing a LOCK TABLE, DISCARD/IMPORT
		TABLESPACE or TRUNCATE TABLE then allow multiple
		writers. Note that ALTER TABLE uses a TL_WRITE_ALLOW_READ
		< TL_WRITE_CONCURRENT_INSERT.

		We especially allow multiple writers if MySQL is at the
		start of a stored procedure call (SQLCOM_CALL) or a
		stored function call (MySQL does have in_lock_tables
		TRUE there). */

		if ((lock_type >= TL_WRITE_CONCURRENT_INSERT
		     && lock_type <= TL_WRITE)
		    && !(in_lock_tables
			 && sql_command == SQLCOM_LOCK_TABLES)
		    && !thd_tablespace_op(thd)
		    && sql_command != SQLCOM_TRUNCATE
		    && sql_command != SQLCOM_OPTIMIZE
		    && sql_command != SQLCOM_CREATE_TABLE) {

			lock_type = TL_WRITE_ALLOW_WRITE;
		}

		/* In queries of type INSERT INTO t1 SELECT ... FROM t2 ...
		MySQL would use the lock TL_READ_NO_INSERT on t2, and that
		would conflict with TL_WRITE_ALLOW_WRITE, blocking all inserts
		to t2. Convert the lock to a normal read lock to allow
		concurrent inserts to t2.

		We especially allow concurrent inserts if MySQL is at the
		start of a stored procedure call (SQLCOM_CALL)
		(MySQL does have thd_in_lock_tables() TRUE there). */

		if (lock_type == TL_READ_NO_INSERT
		    && sql_command != SQLCOM_LOCK_TABLES) {

			lock_type = TL_READ;
		}

		lock.type = lock_type;
	}

	/* Hand the (possibly converted) lock to MySQL and advance the
	output cursor past it. */
	*to++= &lock;

	return(to);
}

/***********************************************************************
This function initializes the auto-inc counter if it has not been
initialized yet. This function does not change the value of the auto-inc
counter if it already has been initialized. In parameter ret returns
the value of the auto-inc counter. */

int
ha_innobase::innobase_read_and_init_auto_inc(
/*=========================================*/
7317 7318
						/* out: 0 or generic MySQL
						error code */
7319
        ulonglong*	value)			/* out: the autoinc value */
osku's avatar
osku committed
7320
{
7321
	ulonglong	auto_inc;
7322
	ibool		stmt_start;
7323 7324 7325
	int		mysql_error = 0;
	dict_table_t*	innodb_table = prebuilt->table;
	ibool		trx_was_not_started	= FALSE;
osku's avatar
osku committed
7326

7327
	ut_a(prebuilt);
osku's avatar
osku committed
7328
	ut_a(prebuilt->table);
7329

7330 7331 7332 7333
	/* Remember if we are in the beginning of an SQL statement.
	This function must not change that flag. */
	stmt_start = prebuilt->sql_stat_start;

7334
	/* Prepare prebuilt->trx in the table handle */
7335
	update_thd(ha_thd());
7336

osku's avatar
osku committed
7337 7338 7339 7340 7341 7342 7343 7344 7345
	if (prebuilt->trx->conc_state == TRX_NOT_STARTED) {
		trx_was_not_started = TRUE;
	}

	/* In case MySQL calls this in the middle of a SELECT query, release
	possible adaptive hash latch to avoid deadlocks of threads */

	trx_search_latch_release_if_reserved(prebuilt->trx);

marko's avatar
marko committed
7346
	dict_table_autoinc_lock(prebuilt->table);
osku's avatar
osku committed
7347 7348 7349

	auto_inc = dict_table_autoinc_read(prebuilt->table);

7350 7351 7352 7353 7354
	/* Was the AUTOINC counter reset during normal processing, if
	so then we simply start count from 1. No need to go to the index.*/
	if (auto_inc == 0 && innodb_table->autoinc_inited) {
		++auto_inc;
		dict_table_autoinc_initialize(innodb_table, auto_inc);
osku's avatar
osku committed
7355 7356
	}

7357 7358
	if (auto_inc == 0) {
		dict_index_t* index;
marko's avatar
marko committed
7359
		ulint error;
7360
		const char* autoinc_col_name;
7361

7362
		ut_a(!innodb_table->autoinc_inited);
osku's avatar
osku committed
7363

7364
		index = innobase_get_index(table->s->next_number_index);
osku's avatar
osku committed
7365

7366
		autoinc_col_name = table->found_next_number_field->field_name;
osku's avatar
osku committed
7367

7368 7369
		error = row_search_max_autoinc(
			index, autoinc_col_name, &auto_inc);
osku's avatar
osku committed
7370

7371
		if (error == DB_SUCCESS) {
7372 7373 7374
			if (auto_inc < ~0x0ULL) {
				++auto_inc;
			}
7375
			dict_table_autoinc_initialize(innodb_table, auto_inc);
osku's avatar
osku committed
7376
		} else {
7377 7378
			ut_print_timestamp(stderr);
			fprintf(stderr, "  InnoDB: Error: (%lu) Couldn't read "
7379 7380
				"the max AUTOINC value from the index (%s).\n",
				error, index->name);
osku's avatar
osku committed
7381

7382
			mysql_error = 1;
7383
		}
7384 7385
	}

7386
	*value = auto_inc;
osku's avatar
osku committed
7387

7388
	dict_table_autoinc_unlock(prebuilt->table);
osku's avatar
osku committed
7389 7390 7391 7392 7393 7394 7395 7396 7397 7398 7399 7400 7401

	/* Since MySQL does not seem to call autocommit after SHOW TABLE
	STATUS (even if we would register the trx here), we commit our
	transaction here if it was started here. This is to eliminate a
	dangling transaction. If the user had AUTOCOMMIT=0, then SHOW
	TABLE STATUS does leave a dangling transaction if the user does not
	himself call COMMIT. */

	if (trx_was_not_started) {

		innobase_commit_low(prebuilt->trx);
	}

7402 7403
	prebuilt->sql_stat_start = stmt_start;

7404 7405 7406 7407 7408 7409 7410 7411 7412
	return(mysql_error);
}

/*******************************************************************************
Read the next autoinc value, initialize the table if it's not initialized.
On return if there is no error then the table's AUTOINC lock is locked.*/

ulong
ha_innobase::innobase_get_auto_increment(
/*=====================================*/
					/* out: DB_SUCCESS or error code */
	ulonglong*	value)		/* out: autoinc value */
{
	ulong		error;

	*value = 0;

	/* Note: If the table is not initialized when we attempt the
	read below, we initialize the table's auto-inc counter and
	always do a reread of the AUTOINC value. */
	do {
		error = innobase_autoinc_lock();

		if (error == DB_SUCCESS) {
			ulonglong	autoinc;

			/* Determine the first value of the interval */
			autoinc = dict_table_autoinc_read(prebuilt->table);

			/* We need to initialize the AUTO-INC value, for
			that we release all locks.*/
			if (autoinc == 0) {
				trx_t*		trx;

				trx = prebuilt->trx;
				dict_table_autoinc_unlock(prebuilt->table);

				/* If we had reserved the AUTO-INC
				lock in this SQL statement we release
				it before retrying.*/
				row_unlock_table_autoinc_for_mysql(trx);

				/* Just to make sure */
				ut_a(!trx->auto_inc_lock);

				int	mysql_error;

				mysql_error = innobase_read_and_init_auto_inc(
					&autoinc);

				if (mysql_error) {
					error = DB_ERROR;
				}

				/* *value is still 0 here, so on success
				the loop goes round again and rereads the
				counter under the lock. */
			} else {
				*value = autoinc;
			}
		/* A deadlock error during normal processing is OK
		and can be ignored. */
		} else if (error != DB_DEADLOCK) {

			sql_print_error("InnoDB: Error: %lu in "
					"::innobase_get_auto_increment()",
					error);
		}

	} while (*value == 0 && error == DB_SUCCESS);

	return(error);
}

marko's avatar
marko committed
7473
/*******************************************************************************
osku's avatar
osku committed
7474 7475 7476
This function initializes the auto-inc counter if it has not been
initialized yet. This function does not change the value of the auto-inc
counter if it already has been initialized. Returns the value of the
marko's avatar
marko committed
7477 7478 7479
auto-inc counter in *first_value, and ULONGLONG_MAX in *nb_reserved_values (as
we have a table-level lock). offset, increment, nb_desired_values are ignored.
*first_value is set to -1 if error (deadlock or lock wait timeout)            */
osku's avatar
osku committed
7480

7481 7482
void
ha_innobase::get_auto_increment(
7483
/*============================*/
7484 7485 7486 7487 7488
        ulonglong	offset,              /* in: */
        ulonglong	increment,           /* in: table autoinc increment */
        ulonglong	nb_desired_values,   /* in: number of values reqd */
        ulonglong	*first_value,        /* out: the autoinc value */
        ulonglong	*nb_reserved_values) /* out: count of reserved values */
osku's avatar
osku committed
7489
{
sunny's avatar
sunny committed
7490
	trx_t*		trx;
7491 7492
	ulint		error;
	ulonglong	autoinc = 0;
7493

7494
	/* Prepare prebuilt->trx in the table handle */
7495
	update_thd(ha_thd());
7496

7497
	error = innobase_get_auto_increment(&autoinc);
osku's avatar
osku committed
7498

7499 7500
	if (error != DB_SUCCESS) {
		*first_value = (~(ulonglong) 0);
marko's avatar
marko committed
7501
		return;
osku's avatar
osku committed
7502 7503
	}

7504 7505 7506 7507 7508 7509
	/* This is a hack, since nb_desired_values seems to be accurate only
	for the first call to get_auto_increment() for multi-row INSERT and
	meaningless for other statements e.g, LOAD etc. Subsequent calls to
	this method for the same statement results in different values which
	don't make sense. Therefore we store the value the first time we are
	called and count down from that as rows are written (see write_row()).
sunny's avatar
sunny committed
7510
	*/
7511

sunny's avatar
sunny committed
7512
	trx = prebuilt->trx;
7513

7514 7515 7516 7517 7518
	/* Note: We can't rely on *first_value since some MySQL engines,
	in particular the partition engine, don't initialize it to 0 when
	invoking this method. So we are not sure if it's guaranteed to
	be 0 or not. */

sunny's avatar
sunny committed
7519 7520
	/* Called for the first time ? */
	if (trx->n_autoinc_rows == 0) {
7521

marko's avatar
marko committed
7522
		trx->n_autoinc_rows = (ulint) nb_desired_values;
7523

sunny's avatar
sunny committed
7524 7525 7526 7527 7528
		/* It's possible for nb_desired_values to be 0:
		e.g., INSERT INTO T1(C) SELECT C FROM T2; */
		if (nb_desired_values == 0) {

			trx->n_autoinc_rows = 1;
7529 7530
		}

marko's avatar
marko committed
7531
		set_if_bigger(*first_value, autoinc);
sunny's avatar
sunny committed
7532 7533
	/* Not in the middle of a mult-row INSERT. */
	} else if (prebuilt->last_value == 0) {
marko's avatar
marko committed
7534
		set_if_bigger(*first_value, autoinc);
7535 7536
	}

sunny's avatar
sunny committed
7537
	*nb_reserved_values = trx->n_autoinc_rows;
7538

7539 7540 7541
	/* With old style AUTOINC locking we only update the table's
	AUTOINC counter after attempting to insert the row. */
	if (innobase_autoinc_lock_mode != AUTOINC_OLD_STYLE_LOCKING) {
7542 7543 7544 7545 7546 7547 7548 7549 7550 7551
		ulonglong	have;
		ulonglong	need;

		/* Check for overflow conditions. */
		need = *nb_reserved_values * increment;
		have = ~0x0ULL - *first_value;

		if (have < need) {
			need = have;
		}
7552

7553
		/* Compute the last value in the interval */
7554
		prebuilt->last_value = *first_value + need;
7555

7556 7557 7558 7559 7560 7561 7562 7563 7564 7565
		ut_a(prebuilt->last_value >= *first_value);

		/* Update the table autoinc variable */
		dict_table_autoinc_update(
			prebuilt->table, prebuilt->last_value);
	} else {
		/* This will force write_row() into attempting an update
		of the table's AUTOINC counter. */
		prebuilt->last_value = 0;
	}
7566 7567 7568 7569 7570 7571 7572

	/* The increment to be used to increase the AUTOINC value, we use
	this in write_row() and update_row() to increase the autoinc counter
	for columns that are filled by the user.*/
	prebuilt->table->autoinc_increment = increment;

	dict_table_autoinc_unlock(prebuilt->table);
osku's avatar
osku committed
7573 7574 7575 7576
}

/* See comment in handler.h */
int
7577 7578 7579
ha_innobase::reset_auto_increment(
/*==============================*/
	ulonglong	value)		/* in: new value for table autoinc */
osku's avatar
osku committed
7580 7581 7582
{
	DBUG_ENTER("ha_innobase::reset_auto_increment");

osku's avatar
osku committed
7583
	int	error;
osku's avatar
osku committed
7584

7585
	update_thd(ha_thd());
7586

osku's avatar
osku committed
7587 7588 7589 7590 7591 7592
	error = row_lock_table_autoinc_for_mysql(prebuilt);

	if (error != DB_SUCCESS) {
		error = convert_error_code_to_mysql(error, user_thd);

		DBUG_RETURN(error);
7593
	}
osku's avatar
osku committed
7594

7595
	innobase_reset_autoinc(value);
osku's avatar
osku committed
7596 7597 7598 7599 7600 7601 7602 7603

	DBUG_RETURN(0);
}

/* See comment in handler.cc */
bool
ha_innobase::get_error_message(int error, String *buf)
{
7604
	trx_t*	trx = check_trx_exists(ha_thd());
osku's avatar
osku committed
7605 7606 7607 7608 7609 7610 7611 7612 7613 7614 7615 7616 7617 7618 7619 7620 7621

	buf->copy(trx->detailed_error, strlen(trx->detailed_error),
		system_charset_info);

	return FALSE;
}

/***********************************************************************
Compares two 'refs'. A 'ref' is the (internal) primary key value of the row.
If there is no explicitly declared non-null unique key or a primary key, then
InnoDB internally uses the row id as the primary key. */

int
ha_innobase::cmp_ref(
/*=================*/
				/* out: < 0 if ref1 < ref2, 0 if equal, else
				> 0 */
7622
	const uchar*	ref1,	/* in: an (internal) primary key value in the
osku's avatar
osku committed
7623
				MySQL key value format */
7624
	const uchar*	ref2)	/* in: an (internal) primary key value in the
osku's avatar
osku committed
7625 7626 7627 7628 7629 7630 7631 7632
				MySQL key value format */
{
	enum_field_types mysql_type;
	Field*		field;
	KEY_PART_INFO*	key_part;
	KEY_PART_INFO*	key_part_end;
	uint		len1;
	uint		len2;
7633
	int		result;
osku's avatar
osku committed
7634 7635 7636 7637 7638 7639 7640 7641 7642 7643 7644 7645 7646 7647 7648 7649 7650 7651 7652

	if (prebuilt->clust_index_was_generated) {
		/* The 'ref' is an InnoDB row id */

		return(memcmp(ref1, ref2, DATA_ROW_ID_LEN));
	}

	/* Do a type-aware comparison of primary key fields. PK fields
	are always NOT NULL, so no checks for NULL are performed. */

	key_part = table->key_info[table->s->primary_key].key_part;

	key_part_end = key_part
			+ table->key_info[table->s->primary_key].key_parts;

	for (; key_part != key_part_end; ++key_part) {
		field = key_part->field;
		mysql_type = field->type();

marko's avatar
marko committed
7653 7654 7655 7656
		if (mysql_type == MYSQL_TYPE_TINY_BLOB
			|| mysql_type == MYSQL_TYPE_MEDIUM_BLOB
			|| mysql_type == MYSQL_TYPE_BLOB
			|| mysql_type == MYSQL_TYPE_LONG_BLOB) {
7657

osku's avatar
osku committed
7658 7659 7660 7661 7662 7663 7664 7665
			/* In the MySQL key value format, a column prefix of
			a BLOB is preceded by a 2-byte length field */

			len1 = innobase_read_from_2_little_endian(ref1);
			len2 = innobase_read_from_2_little_endian(ref2);

			ref1 += 2;
			ref2 += 2;
marko's avatar
marko committed
7666 7667
			result = ((Field_blob*)field)->cmp( ref1, len1,
                                                            ref2, len2);
osku's avatar
osku committed
7668 7669 7670 7671 7672 7673 7674 7675 7676 7677 7678 7679 7680 7681 7682 7683
		} else {
			result = field->key_cmp(ref1, ref2);
		}

		if (result) {

			return(result);
		}

		ref1 += key_part->store_length;
		ref2 += key_part->store_length;
	}

	return(0);
}

marko's avatar
marko committed
7684 7685 7686 7687 7688 7689 7690 7691 7692 7693 7694 7695 7696 7697 7698 7699 7700 7701 7702 7703 7704 7705 7706 7707 7708 7709 7710
/***********************************************************************
Ask InnoDB if a query to a table can be cached. */

my_bool
ha_innobase::register_query_cache_table(
/*====================================*/
					/* out: TRUE if query caching
					of the table is permitted */
	THD*		thd,		/* in: user thread handle */
	char*		table_key,	/* in: concatenation of database name,
					the null character '\0',
					and the table name */
	uint		key_length,	/* in: length of the full name, i.e.
					len(dbname) + len(tablename) + 1 */
	qc_engine_callback*
			call_back,	/* out: pointer to function for
					checking if query caching
					is permitted */
	ulonglong	*engine_data)	/* in/out: data to call_back */
{
	my_bool	permitted;

	/* Publish the callback and a zeroed engine data word to the caller,
	then answer the question right away by invoking that same callback. */
	*engine_data = 0;
	*call_back = innobase_query_caching_of_table_permitted;

	permitted = innobase_query_caching_of_table_permitted(
		thd, table_key, key_length, engine_data);

	return(permitted);
}

osku's avatar
osku committed
7711 7712 7713 7714 7715 7716 7717 7718 7719
/* Returns the binlog file name held in trx_sys_mysql_bin_log_name. */
char*
ha_innobase::get_mysql_bin_log_name()
{
	char*	log_name = trx_sys_mysql_bin_log_name;

	return(log_name);
}

/* Returns the binlog position held in trx_sys_mysql_bin_log_pos. */
ulonglong
ha_innobase::get_mysql_bin_log_pos()
{
	/* The global is an ib_longlong, i.e. a typedef for a 64-bit integer
	(__int64 or longlong), so converting it to ulonglong is fine. */

	return((ulonglong) trx_sys_mysql_bin_log_pos);
}

/**********************************************************************
This function is used to find the storage length in bytes of the first n
characters for prefix indexes using a multibyte character set. The function
finds charset information and returns length of prefix_len characters in the
index field in bytes.

NOTE: the prototype of this function is copied to data0type.c! If you change
this function, you MUST change also data0type.c! */
7734
extern "C"
osku's avatar
osku committed
7735 7736 7737 7738 7739 7740 7741 7742 7743
ulint
innobase_get_at_most_n_mbchars(
/*===========================*/
				/* out: number of bytes occupied by the first
				n characters */
	ulint charset_id,	/* in: character set id */
	ulint prefix_len,	/* in: prefix length in bytes of the index
				(this has to be divided by mbmaxlen to get the
				number of CHARACTERS n in the prefix) */
7744
	ulint data_len,		/* in: length of the string in bytes */
osku's avatar
osku committed
7745 7746 7747 7748 7749 7750 7751 7752 7753 7754 7755 7756 7757 7758 7759 7760 7761 7762 7763 7764 7765 7766 7767 7768 7769 7770 7771 7772 7773 7774 7775 7776 7777 7778 7779 7780 7781 7782 7783 7784 7785 7786 7787
	const char* str)	/* in: character string */
{
	ulint char_length;	/* character length in bytes */
	ulint n_chars;		/* number of characters in prefix */
	CHARSET_INFO* charset;	/* charset used in the field */

	charset = get_charset((uint) charset_id, MYF(MY_WME));

	ut_ad(charset);
	ut_ad(charset->mbmaxlen);

	/* Calculate how many characters at most the prefix index contains */

	n_chars = prefix_len / charset->mbmaxlen;

	/* If the charset is multi-byte, then we must find the length of the
	first at most n chars in the string. If the string contains less
	characters than n, then we return the length to the end of the last
	character. */

	if (charset->mbmaxlen > 1) {
		/* my_charpos() returns the byte length of the first n_chars
		characters, or a value bigger than the length of str, if
		there were not enough full characters in str.

		Why does the code below work:
		Suppose that we are looking for n UTF-8 characters.

		1) If the string is long enough, then the prefix contains at
		least n complete UTF-8 characters + maybe some extra
		characters + an incomplete UTF-8 character. No problem in
		this case. The function returns the pointer to the
		end of the nth character.

		2) If the string is not long enough, then the string contains
		the complete value of a column, that is, only complete UTF-8
		characters, and we can store in the column prefix index the
		whole string. */

		char_length = my_charpos(charset, str,
						str + data_len, (int) n_chars);
		if (char_length > data_len) {
			char_length = data_len;
7788
		}
osku's avatar
osku committed
7789 7790 7791 7792 7793 7794 7795 7796 7797 7798 7799 7800 7801
	} else {
		if (data_len < prefix_len) {
			char_length = data_len;
		} else {
			char_length = prefix_len;
		}
	}

	return(char_length);
}

/***********************************************************************
This function is used to prepare X/Open XA distributed transaction   */
7802
static
7803
int
osku's avatar
osku committed
7804 7805 7806
innobase_xa_prepare(
/*================*/
			/* out: 0 or error number */
7807
        handlerton *hton,
osku's avatar
osku committed
7808 7809 7810 7811 7812 7813
	THD*	thd,	/* in: handle to the MySQL thread of the user
			whose XA transaction should be prepared */
	bool	all)	/* in: TRUE - commit transaction
			FALSE - the current SQL statement ended */
{
	int error = 0;
7814
	trx_t* trx = check_trx_exists(thd);
osku's avatar
osku committed
7815

7816 7817
	if (thd_sql_command(thd) != SQLCOM_XA_PREPARE &&
	    (all || !thd_test_options(thd, OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN)))
7818
	{
osku's avatar
osku committed
7819

7820 7821
		/* For ibbackup to work the order of transactions in binlog
		and InnoDB must be the same. Consider the situation
osku's avatar
osku committed
7822

7823 7824 7825 7826
		  thread1> prepare; write to binlog; ...
			  <context switch>
		  thread2> prepare; write to binlog; commit
		  thread1>			     ... commit
osku's avatar
osku committed
7827

7828 7829
		To ensure this will not happen we're taking the mutex on
		prepare, and releasing it on commit.
osku's avatar
osku committed
7830

7831 7832 7833 7834 7835 7836 7837 7838 7839 7840 7841
		Note: only do it for normal commits, done via ha_commit_trans.
		If 2pc protocol is executed by external transaction
		coordinator, it will be just a regular MySQL client
		executing XA PREPARE and XA COMMIT commands.
		In this case we cannot know how many minutes or hours
		will be between XA PREPARE and XA COMMIT, and we don't want
		to block for undefined period of time.
		*/
		pthread_mutex_lock(&prepare_commit_mutex);
		trx->active_trans = 2;
	}
osku's avatar
osku committed
7842

7843
	if (!THDVAR(thd, support_xa)) {
osku's avatar
osku committed
7844 7845 7846 7847

		return(0);
	}

7848
	thd_get_xid(thd, (MYSQL_XID*) &trx->xid);
osku's avatar
osku committed
7849 7850 7851 7852 7853 7854 7855 7856 7857 7858 7859 7860 7861 7862

	/* Release a possible FIFO ticket and search latch. Since we will
	reserve the kernel mutex, we have to release the search system latch
	first to obey the latching order. */

	innobase_release_stat_resources(trx);

	if (trx->active_trans == 0 && trx->conc_state != TRX_NOT_STARTED) {

	  sql_print_error("trx->active_trans == 0, but trx->conc_state != "
			  "TRX_NOT_STARTED");
	}

	if (all
7863
		|| (!thd_test_options(thd, OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN))) {
osku's avatar
osku committed
7864

7865 7866
		/* We were instructed to prepare the whole transaction, or
		this is an SQL statement end and autocommit is on */
osku's avatar
osku committed
7867

7868
		ut_ad(trx->active_trans);
osku's avatar
osku committed
7869 7870 7871

		error = (int) trx_prepare_for_mysql(trx);
	} else {
7872
		/* We just mark the SQL statement ended and do not do a
osku's avatar
osku committed
7873 7874
		transaction prepare */

marko's avatar
marko committed
7875 7876
		/* If we had reserved the auto-inc lock for some
		table in this SQL statement we release it now */
osku's avatar
osku committed
7877

marko's avatar
marko committed
7878
		row_unlock_table_autoinc_for_mysql(trx);
7879

osku's avatar
osku committed
7880 7881 7882 7883 7884 7885 7886 7887 7888 7889 7890 7891
		/* Store the current undo_no of the transaction so that we
		know where to roll back if we have to roll back the next
		SQL statement */

		trx_mark_sql_stat_end(trx);
	}

	/* Tell the InnoDB server that there might be work for utility
	threads: */

	srv_active_wake_master_thread();

7892
	return error;
osku's avatar
osku committed
7893 7894 7895 7896
}

/***********************************************************************
This function is used to recover X/Open XA distributed transactions   */
7897
static
7898
int
osku's avatar
osku committed
7899 7900
innobase_xa_recover(
/*================*/
7901
				/* out: number of prepared transactions
osku's avatar
osku committed
7902
				stored in xid_list */
7903
        handlerton *hton,
7904
	XID*	xid_list,	/* in/out: prepared transactions */
osku's avatar
osku committed
7905 7906 7907 7908 7909 7910 7911 7912 7913 7914 7915 7916 7917
	uint	len)		/* in: number of slots in xid_list */
{
	if (len == 0 || xid_list == NULL) {

		return(0);
	}

	return(trx_recover_for_mysql(xid_list, len));
}

/***********************************************************************
This function is used to commit one X/Open XA distributed transaction
which is in the prepared state */
7918
static
7919
int
osku's avatar
osku committed
7920 7921 7922
innobase_commit_by_xid(
/*===================*/
			/* out: 0 or error number */
7923
        handlerton *hton,
osku's avatar
osku committed
7924 7925 7926 7927 7928 7929 7930 7931
	XID*	xid)	/* in: X/Open XA transaction identification */
{
	trx_t*	trx;

	trx = trx_get_trx_by_xid(xid);

	if (trx) {
		innobase_commit_low(trx);
7932

osku's avatar
osku committed
7933 7934 7935 7936 7937 7938 7939 7940 7941
		return(XA_OK);
	} else {
		return(XAER_NOTA);
	}
}

/***********************************************************************
This function is used to rollback one X/Open XA distributed transaction
which is in the prepared state */
7942
static
7943
int
osku's avatar
osku committed
7944 7945 7946
innobase_rollback_by_xid(
/*=====================*/
			/* out: 0 or error number */
7947
        handlerton *hton,
osku's avatar
osku committed
7948 7949 7950 7951 7952 7953 7954 7955 7956 7957 7958 7959 7960 7961 7962 7963
	XID	*xid)	/* in: X/Open XA transaction identification */
{
	trx_t*	trx;

	trx = trx_get_trx_by_xid(xid);

	if (trx) {
		return(innobase_rollback_trx(trx));
	} else {
		return(XAER_NOTA);
	}
}

/***********************************************************************
Create a consistent view for a cursor based on current transaction
which is created if the corresponding MySQL thread still lacks one.
7964
This consistent view is then used inside of MySQL when accessing records
osku's avatar
osku committed
7965
using a cursor. */
7966
static
osku's avatar
osku committed
7967
void*
7968
innobase_create_cursor_view(
7969
/*========================*/
7970 7971 7972
                          /* out: pointer to cursor view or NULL */
        handlerton *hton, /* in: innobase hton */
	THD* thd)	  /* in: user thread handle */
osku's avatar
osku committed
7973
{
7974
	return(read_cursor_view_create_for_mysql(check_trx_exists(thd)));
osku's avatar
osku committed
7975 7976 7977 7978
}

/***********************************************************************
Close the given consistent cursor view of a transaction and restore
7979
global read view to a transaction read view. Transaction is created if the
osku's avatar
osku committed
7980
corresponding MySQL thread still lacks one. */
7981
static
osku's avatar
osku committed
7982 7983
void
innobase_close_cursor_view(
7984
/*=======================*/
7985 7986
        handlerton *hton,
	THD*	thd,	/* in: user thread handle */
osku's avatar
osku committed
7987 7988
	void*	curview)/* in: Consistent read view to be closed */
{
7989
	read_cursor_view_close_for_mysql(check_trx_exists(thd),
7990
					 (cursor_view_t*) curview);
osku's avatar
osku committed
7991 7992 7993
}

/***********************************************************************
7994 7995
Set the given consistent cursor view to a transaction which is created
if the corresponding MySQL thread still lacks one. If the given
osku's avatar
osku committed
7996 7997
consistent cursor view is NULL global read view of a transaction is
restored to a transaction read view. */
7998
static
osku's avatar
osku committed
7999 8000 8001
void
innobase_set_cursor_view(
/*=====================*/
8002 8003
        handlerton *hton,
	THD*	thd,	/* in: user thread handle */
osku's avatar
osku committed
8004 8005
	void*	curview)/* in: Consistent cursor view to be set */
{
8006
	read_cursor_set_for_mysql(check_trx_exists(thd),
8007
				  (cursor_view_t*) curview);
osku's avatar
osku committed
8008 8009
}

osku's avatar
osku committed
8010

8011 8012 8013
/* Reports whether the requested table definition is incompatible with the
existing one. Returns COMPATIBLE_DATA_NO when table_changes is not
IS_EQUAL_YES, when a non-zero AUTO_INCREMENT value was given, or when an
explicitly given ROW_FORMAT differs from get_row_type(); otherwise
COMPATIBLE_DATA_YES. */
bool ha_innobase::check_if_incompatible_data(
	HA_CREATE_INFO*	info,
	uint		table_changes)
{
	if (table_changes != IS_EQUAL_YES) {

		return COMPATIBLE_DATA_NO;
	}

	/* Check that auto_increment value was not changed */
	const bool	autoinc_given =
		(info->used_fields & HA_CREATE_USED_AUTO)
		&& info->auto_increment_value != 0;

	if (autoinc_given) {

		return COMPATIBLE_DATA_NO;
	}

	/* Check that row format didn't change */
	const bool	row_format_differs =
		(info->used_fields & HA_CREATE_USED_ROW_FORMAT)
		&& get_row_type() != info->row_type;

	if (row_format_differs) {

		return COMPATIBLE_DATA_NO;
	}

	return COMPATIBLE_DATA_YES;
}
8036

marko's avatar
marko committed
8037 8038 8039 8040 8041 8042 8043 8044
/* SHOW_FUNC callback: calls innodb_export_status() and then points 'var' at
the innodb_status_variables array. thd and buff are not used. Always
returns 0. */
static int show_innodb_vars(THD *thd, SHOW_VAR *var, char *buff)
{
  innodb_export_status();

  var->value= (char *) &innodb_status_variables;
  var->type= SHOW_ARRAY;

  return 0;
}

8045
/* Status variable list handed to the plugin declaration: a single
function-backed "Innodb" entry served by show_innodb_vars(), followed by the
terminating entry. */
static SHOW_VAR innodb_status_variables_export[]= {
  {"Innodb", (char*) &show_innodb_vars, SHOW_FUNC},
  {NullS, NullS, SHOW_LONG}
};

8050
static struct st_mysql_storage_engine innobase_storage_engine=
8051
{ MYSQL_HANDLERTON_INTERFACE_VERSION };
8052

8053 8054 8055 8056 8057 8058 8059 8060 8061 8062 8063 8064 8065 8066 8067 8068 8069 8070 8071 8072 8073 8074 8075 8076 8077 8078 8079 8080 8081 8082 8083 8084 8085 8086 8087 8088 8089 8090 8091 8092 8093 8094 8095 8096 8097 8098 8099 8100 8101 8102 8103 8104 8105 8106 8107 8108 8109 8110 8111 8112 8113 8114 8115 8116 8117 8118 8119 8120 8121 8122 8123 8124 8125 8126 8127 8128 8129 8130 8131 8132 8133 8134 8135 8136 8137 8138 8139 8140 8141 8142
/* plugin options */

/* Each declaration below names the option, the variable that stores its
value, the PLUGIN_VAR_* flags, the help text, two callback slots (all NULL
here) and the default value. The numeric (ULONG) declarations additionally
list minimum, maximum and block size after the default. */

static MYSQL_SYSVAR_BOOL(checksums, innobase_use_checksums,
  PLUGIN_VAR_NOCMDARG | PLUGIN_VAR_READONLY,
  "Enable InnoDB checksums validation (enabled by default). "
  "Disable with --skip-innodb-checksums.",
  NULL, NULL, TRUE);

static MYSQL_SYSVAR_STR(data_home_dir, innobase_data_home_dir,
  PLUGIN_VAR_READONLY,
  "The common part for InnoDB table spaces.",
  NULL, NULL, NULL);

static MYSQL_SYSVAR_BOOL(doublewrite, innobase_use_doublewrite,
  PLUGIN_VAR_NOCMDARG | PLUGIN_VAR_READONLY,
  "Enable InnoDB doublewrite buffer (enabled by default). "
  "Disable with --skip-innodb-doublewrite.",
  NULL, NULL, TRUE);

/* On NetWare both the help text and the maximum value exclude mode 2. */
static MYSQL_SYSVAR_ULONG(fast_shutdown, innobase_fast_shutdown,
  PLUGIN_VAR_OPCMDARG,
  "Speeds up the shutdown process of the InnoDB storage engine. Possible "
  "values are 0, 1 (faster)"
  /*
    NetWare can't close unclosed files, can't automatically kill remaining
    threads, etc, so on this OS we disable the crash-like InnoDB shutdown.
  */
  IF_NETWARE("", " or 2 (fastest - crash-like)")
  ".",
  NULL, NULL, 1, 0, IF_NETWARE(1,2), 0);

static MYSQL_SYSVAR_BOOL(file_per_table, innobase_file_per_table,
  PLUGIN_VAR_NOCMDARG | PLUGIN_VAR_READONLY,
  "Stores each InnoDB table to an .ibd file in the database dir.",
  NULL, NULL, FALSE);

static MYSQL_SYSVAR_ULONG(flush_log_at_trx_commit, srv_flush_log_at_trx_commit,
  PLUGIN_VAR_OPCMDARG,
  "Set to 0 (write and flush once per second),"
  " 1 (write and flush at each commit)"
  " or 2 (write at commit, flush once per second).",
  NULL, NULL, 1, 0, 2, 0);

static MYSQL_SYSVAR_STR(flush_method, innobase_unix_file_flush_method,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "With which method to flush data.", NULL, NULL, NULL);

static MYSQL_SYSVAR_BOOL(locks_unsafe_for_binlog, innobase_locks_unsafe_for_binlog,
  PLUGIN_VAR_NOCMDARG | PLUGIN_VAR_READONLY,
  "Force InnoDB to not use next-key locking, to use only row-level locking.",
  NULL, NULL, FALSE);

/* The two log archiving options exist only when UNIV_LOG_ARCHIVE is
defined. */
#ifdef UNIV_LOG_ARCHIVE
static MYSQL_SYSVAR_STR(log_arch_dir, innobase_log_arch_dir,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "Where full logs should be archived.", NULL, NULL, NULL);

static MYSQL_SYSVAR_BOOL(log_archive, innobase_log_archive,
  PLUGIN_VAR_OPCMDARG | PLUGIN_VAR_READONLY,
  "Set to 1 if you want to have logs archived.", NULL, NULL, FALSE);
#endif /* UNIV_LOG_ARCHIVE */

static MYSQL_SYSVAR_STR(log_group_home_dir, innobase_log_group_home_dir,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "Path to InnoDB log files.", NULL, NULL, NULL);

static MYSQL_SYSVAR_ULONG(max_dirty_pages_pct, srv_max_buf_pool_modified_pct,
  PLUGIN_VAR_RQCMDARG,
  "Percentage of dirty pages allowed in bufferpool.",
  NULL, NULL, 90, 0, 100, 0);

static MYSQL_SYSVAR_ULONG(max_purge_lag, srv_max_purge_lag,
  PLUGIN_VAR_RQCMDARG,
  "Desired maximum length of the purge queue (0 = no limit)",
  NULL, NULL, 0, 0, ~0L, 0);

static MYSQL_SYSVAR_BOOL(rollback_on_timeout, innobase_rollback_on_timeout,
  PLUGIN_VAR_OPCMDARG | PLUGIN_VAR_READONLY,
  "Roll back the complete transaction on lock wait timeout, for 4.x compatibility (disabled by default)",
  NULL, NULL, FALSE);

static MYSQL_SYSVAR_BOOL(status_file, innobase_create_status_file,
  PLUGIN_VAR_OPCMDARG | PLUGIN_VAR_NOSYSVAR,
  "Enable SHOW INNODB STATUS output in the innodb_status.<pid> file",
  NULL, NULL, FALSE);

static MYSQL_SYSVAR_BOOL(stats_on_metadata, innobase_stats_on_metadata,
  PLUGIN_VAR_OPCMDARG | PLUGIN_VAR_NOSYSVAR,
  "Enable statistics gathering for metadata commands such as SHOW TABLE STATUS (on by default)",
  NULL, NULL, TRUE);

vasil's avatar
vasil committed
8143
static MYSQL_SYSVAR_BOOL(adaptive_hash_index, innobase_adaptive_hash_index,
8144
  PLUGIN_VAR_OPCMDARG | PLUGIN_VAR_READONLY,
vasil's avatar
vasil committed
8145 8146
  "Enable InnoDB adaptive hash index (enabled by default).  "
  "Disable with --skip-innodb-adaptive-hash-index.",
8147 8148
  NULL, NULL, TRUE);

8149 8150 8151 8152 8153 8154 8155 8156 8157 8158 8159 8160 8161 8162 8163 8164 8165 8166 8167 8168 8169 8170 8171 8172 8173 8174 8175 8176 8177 8178 8179 8180 8181 8182 8183 8184 8185 8186 8187 8188 8189 8190 8191 8192 8193 8194 8195 8196 8197 8198 8199 8200 8201 8202 8203 8204 8205 8206 8207 8208 8209 8210 8211 8212 8213 8214 8215 8216 8217 8218 8219 8220 8221 8222 8223 8224 8225 8226 8227 8228 8229 8230 8231 8232 8233
/* Numeric tuning options. After the two callback slots (NULL here) each
numeric declaration lists default, minimum, maximum and block size, in that
order. */

static MYSQL_SYSVAR_LONG(additional_mem_pool_size, innobase_additional_mem_pool_size,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "Size of a memory pool InnoDB uses to store data dictionary information and other internal data structures.",
  NULL, NULL, 1*1024*1024L, 512*1024L, ~0L, 1024);

static MYSQL_SYSVAR_ULONG(autoextend_increment, srv_auto_extend_increment,
  PLUGIN_VAR_RQCMDARG,
  "Data file autoextend increment in megabytes",
  NULL, NULL, 8L, 1L, 1000L, 0);

static MYSQL_SYSVAR_LONGLONG(buffer_pool_size, innobase_buffer_pool_size,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "The size of the memory buffer InnoDB uses to cache data and indexes of its tables.",
  NULL, NULL, 8*1024*1024L, 1024*1024L, LONGLONG_MAX, 1024*1024L);

static MYSQL_SYSVAR_ULONG(commit_concurrency, srv_commit_concurrency,
  PLUGIN_VAR_RQCMDARG,
  "Helps in performance tuning in heavily concurrent environments.",
  NULL, NULL, 0, 0, 1000, 0);

static MYSQL_SYSVAR_ULONG(concurrency_tickets, srv_n_free_tickets_to_enter,
  PLUGIN_VAR_RQCMDARG,
  "Number of times a thread is allowed to enter InnoDB within the same SQL query after it has once got the ticket",
  NULL, NULL, 500L, 1L, ~0L, 0);

static MYSQL_SYSVAR_LONG(file_io_threads, innobase_file_io_threads,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "Number of file I/O threads in InnoDB.",
  NULL, NULL, 4, 4, 64, 0);

static MYSQL_SYSVAR_LONG(force_recovery, innobase_force_recovery,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "Helps to save your data in case the disk image of the database becomes corrupt.",
  NULL, NULL, 0, 0, 6, 0);

static MYSQL_SYSVAR_LONG(lock_wait_timeout, innobase_lock_wait_timeout,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "Timeout in seconds an InnoDB transaction may wait for a lock before being rolled back.",
  NULL, NULL, 50, 1, 1024 * 1024 * 1024, 0);

static MYSQL_SYSVAR_LONG(log_buffer_size, innobase_log_buffer_size,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "The size of the buffer which InnoDB uses to write log to the log files on disk.",
  NULL, NULL, 1024*1024L, 256*1024L, ~0L, 1024);

static MYSQL_SYSVAR_LONGLONG(log_file_size, innobase_log_file_size,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "Size of each log file in a log group.",
  NULL, NULL, 5*1024*1024L, 1*1024*1024L, LONGLONG_MAX, 1024*1024L);

/* NOTE(review): the help text recommends 3, while the declared default and
minimum are both 2. */
static MYSQL_SYSVAR_LONG(log_files_in_group, innobase_log_files_in_group,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "Number of log files in the log group. InnoDB writes to the files in a circular fashion. Value 3 is recommended here.",
  NULL, NULL, 2, 2, 100, 0);

static MYSQL_SYSVAR_LONG(mirrored_log_groups, innobase_mirrored_log_groups,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "Number of identical copies of log groups we keep for the database. Currently this should be set to 1.",
  NULL, NULL, 1, 1, 10, 0);

static MYSQL_SYSVAR_LONG(open_files, innobase_open_files,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "How many files at the maximum InnoDB keeps open at the same time.",
  NULL, NULL, 300L, 10L, ~0L, 0);

static MYSQL_SYSVAR_ULONG(sync_spin_loops, srv_n_spin_wait_rounds,
  PLUGIN_VAR_RQCMDARG,
  "Count of spin-loop rounds in InnoDB mutexes",
  NULL, NULL, 20L, 0L, ~0L, 0);

static MYSQL_SYSVAR_ULONG(thread_concurrency, srv_thread_concurrency,
  PLUGIN_VAR_RQCMDARG,
  "Helps in performance tuning in heavily concurrent environments. Sets the maximum number of threads allowed inside InnoDB. Value 0 will disable the thread throttling.",
  NULL, NULL, 8, 0, 1000, 0);

static MYSQL_SYSVAR_ULONG(thread_sleep_delay, srv_thread_sleep_delay,
  PLUGIN_VAR_RQCMDARG,
  "Time of innodb thread sleeping before joining InnoDB queue (usec). Value 0 disable a sleep",
  NULL, NULL, 10000L, 0L, ~0L, 0);

static MYSQL_SYSVAR_STR(data_file_path, innobase_data_file_path,
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
  "Path to individual files and their sizes.",
  NULL, NULL, NULL);

8234
static MYSQL_SYSVAR_LONG(autoinc_lock_mode, innobase_autoinc_lock_mode,
marko's avatar
marko committed
8235
  PLUGIN_VAR_RQCMDARG | PLUGIN_VAR_READONLY,
vasil's avatar
vasil committed
8236 8237 8238 8239 8240
  "The AUTOINC lock modes supported by InnoDB:               "
  "0 => Old style AUTOINC locking (for backward"
  " compatibility)                                           "
  "1 => New style AUTOINC locking                            "
  "2 => No AUTOINC locking (unsafe for SBR)",
8241 8242 8243 8244 8245
  NULL, NULL,
  AUTOINC_NEW_STYLE_LOCKING,	/* Default setting */
  AUTOINC_OLD_STYLE_LOCKING,	/* Minimum value */
  AUTOINC_NO_LOCKING, 0);	/* Maximum value */

8246 8247 8248 8249 8250 8251 8252 8253 8254 8255 8256 8257 8258 8259 8260 8261 8262 8263 8264 8265 8266 8267 8268 8269 8270 8271 8272 8273 8274 8275 8276 8277
static struct st_mysql_sys_var* innobase_system_variables[]= {
  MYSQL_SYSVAR(additional_mem_pool_size),
  MYSQL_SYSVAR(autoextend_increment),
  MYSQL_SYSVAR(buffer_pool_size),
  MYSQL_SYSVAR(checksums),
  MYSQL_SYSVAR(commit_concurrency),
  MYSQL_SYSVAR(concurrency_tickets),
  MYSQL_SYSVAR(data_file_path),
  MYSQL_SYSVAR(data_home_dir),
  MYSQL_SYSVAR(doublewrite),
  MYSQL_SYSVAR(fast_shutdown),
  MYSQL_SYSVAR(file_io_threads),
  MYSQL_SYSVAR(file_per_table),
  MYSQL_SYSVAR(flush_log_at_trx_commit),
  MYSQL_SYSVAR(flush_method),
  MYSQL_SYSVAR(force_recovery),
  MYSQL_SYSVAR(locks_unsafe_for_binlog),
  MYSQL_SYSVAR(lock_wait_timeout),
#ifdef UNIV_LOG_ARCHIVE
  MYSQL_SYSVAR(log_arch_dir),
  MYSQL_SYSVAR(log_archive),
#endif /* UNIV_LOG_ARCHIVE */
  MYSQL_SYSVAR(log_buffer_size),
  MYSQL_SYSVAR(log_file_size),
  MYSQL_SYSVAR(log_files_in_group),
  MYSQL_SYSVAR(log_group_home_dir),
  MYSQL_SYSVAR(max_dirty_pages_pct),
  MYSQL_SYSVAR(max_purge_lag),
  MYSQL_SYSVAR(mirrored_log_groups),
  MYSQL_SYSVAR(open_files),
  MYSQL_SYSVAR(rollback_on_timeout),
  MYSQL_SYSVAR(stats_on_metadata),
vasil's avatar
vasil committed
8278
  MYSQL_SYSVAR(adaptive_hash_index),
8279 8280 8281 8282 8283 8284
  MYSQL_SYSVAR(status_file),
  MYSQL_SYSVAR(support_xa),
  MYSQL_SYSVAR(sync_spin_loops),
  MYSQL_SYSVAR(table_locks),
  MYSQL_SYSVAR(thread_concurrency),
  MYSQL_SYSVAR(thread_sleep_delay),
8285
  MYSQL_SYSVAR(autoinc_lock_mode),
8286 8287 8288
  NULL
};

8289 8290 8291
/* Plugin descriptor for the InnoDB storage engine. */
mysql_declare_plugin(innobase)
{
  MYSQL_STORAGE_ENGINE_PLUGIN,
  &innobase_storage_engine,
  innobase_hton_name,
  "Innobase OY",
  "Supports transactions, row-level locking, and foreign keys",
  PLUGIN_LICENSE_GPL,
  innobase_init,			/* Plugin Init */
  NULL,					/* Plugin Deinit */
  0x0100,				/* 1.0 */
  innodb_status_variables_export,	/* status variables */
  innobase_system_variables,		/* system variables */
  NULL					/* reserved */
}
mysql_declare_plugin_end;