btr0cur.h 33.7 KB
Newer Older
1 2
/*****************************************************************************

3
Copyright (c) 1994, 2010, Innobase Oy. All Rights Reserved.
4 5 6 7 8 9 10 11 12 13 14 15 16 17 18

This program is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free Software
Foundation; version 2 of the License.

This program is distributed in the hope that it will be useful, but WITHOUT
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.

You should have received a copy of the GNU General Public License along with
this program; if not, write to the Free Software Foundation, Inc., 59 Temple
Place, Suite 330, Boston, MA 02111-1307 USA

*****************************************************************************/

19 20
/**************************************************//**
@file include/btr0cur.h
osku's avatar
osku committed
21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39
The index tree cursor

Created 10/16/1994 Heikki Tuuri
*******************************************************/

#ifndef btr0cur_h
#define btr0cur_h

#include "univ.i"
#include "dict0dict.h"
#include "page0cur.h"
#include "btr0types.h"

/* Mode flags for btr_cur operations; these can be ORed */
#define BTR_NO_UNDO_LOG_FLAG	1	/* do no undo logging */
#define BTR_NO_LOCKING_FLAG	2	/* do no record lock checking */
#define BTR_KEEP_SYS_FLAG	4	/* sys fields will be found from the
					update vector or inserted entry */

40 41 42 43 44
#ifndef UNIV_HOTBACKUP
#include "que0types.h"
#include "row0types.h"
#include "ha0ha.h"

osku's avatar
osku committed
45 46 47
#define BTR_CUR_ADAPT
#define BTR_CUR_HASH_ADAPT

48
#ifdef UNIV_DEBUG
49
/*********************************************************//**
50 51
Returns the page cursor component of a tree cursor.
@return	pointer to page cursor component */
osku's avatar
osku committed
52 53 54 55
UNIV_INLINE
page_cur_t*
btr_cur_get_page_cur(
/*=================*/
56
	const btr_cur_t*	cursor);/*!< in: tree cursor */
57 58 59
#else /* UNIV_DEBUG */
# define btr_cur_get_page_cur(cursor) (&(cursor)->page_cur)
#endif /* UNIV_DEBUG */
60
/*********************************************************//**
61 62
Returns the buffer block on which the tree cursor is positioned.
@return	pointer to buffer block */
63 64 65 66
UNIV_INLINE
buf_block_t*
btr_cur_get_block(
/*==============*/
67
	btr_cur_t*	cursor);/*!< in: tree cursor */
68
/*********************************************************//**
69 70
Returns the record pointer of a tree cursor.
@return	pointer to record */
osku's avatar
osku committed
71 72 73 74
UNIV_INLINE
rec_t*
btr_cur_get_rec(
/*============*/
75
	btr_cur_t*	cursor);/*!< in: tree cursor */
76
/*********************************************************//**
77 78
Returns the compressed page on which the tree cursor is positioned.
@return	pointer to compressed page, or NULL if the page is not compressed */
79 80 81 82
UNIV_INLINE
page_zip_des_t*
btr_cur_get_page_zip(
/*=================*/
83
	btr_cur_t*	cursor);/*!< in: tree cursor */
84
/*********************************************************//**
osku's avatar
osku committed
85 86 87 88 89
Invalidates a tree cursor by setting record pointer to NULL. */
UNIV_INLINE
void
btr_cur_invalidate(
/*===============*/
90
	btr_cur_t*	cursor);/*!< in: tree cursor */
91
/*********************************************************//**
92 93
Returns the page of a tree cursor.
@return	pointer to page */
osku's avatar
osku committed
94 95 96 97
UNIV_INLINE
page_t*
btr_cur_get_page(
/*=============*/
98
	btr_cur_t*	cursor);/*!< in: tree cursor */
99
/*********************************************************//**
100 101
Returns the index of a cursor.
@return	index */
osku's avatar
osku committed
102
UNIV_INLINE
103 104 105
dict_index_t*
btr_cur_get_index(
/*==============*/
106
	btr_cur_t*	cursor);/*!< in: B-tree cursor */
107
/*********************************************************//**
osku's avatar
osku committed
108 109 110 111 112
Positions a tree cursor at a given record. */
UNIV_INLINE
void
btr_cur_position(
/*=============*/
113 114 115 116
	dict_index_t*	index,	/*!< in: index */
	rec_t*		rec,	/*!< in: record in tree */
	buf_block_t*	block,	/*!< in: buffer block of rec */
	btr_cur_t*	cursor);/*!< in: cursor */
117
/********************************************************************//**
osku's avatar
osku committed
118 119 120 121 122 123
Searches an index tree and positions a tree cursor on a given level.
NOTE: n_fields_cmp in tuple must be set so that it cannot be compared
to node pointer page number fields on the upper levels of the tree!
Note that if mode is PAGE_CUR_LE, which is used in inserts, then
cursor->up_match and cursor->low_match both will have sensible values.
If mode is PAGE_CUR_GE, then up_match will a have a sensible value. */
124
UNIV_INTERN
osku's avatar
osku committed
125 126 127
void
btr_cur_search_to_nth_level(
/*========================*/
128 129 130
	dict_index_t*	index,	/*!< in: index */
	ulint		level,	/*!< in: the tree level of search */
	const dtuple_t*	tuple,	/*!< in: data tuple; NOTE: n_fields_cmp in
osku's avatar
osku committed
131 132
				tuple must be set so that it cannot get
				compared to the node ptr page number field! */
133
	ulint		mode,	/*!< in: PAGE_CUR_L, ...;
osku's avatar
osku committed
134 135 136 137 138 139
				NOTE that if the search is made using a unique
				prefix of a record, mode should be PAGE_CUR_LE,
				not PAGE_CUR_GE, as the latter may end up on
				the previous page of the record! Inserts
				should always be made using PAGE_CUR_LE to
				search the position! */
140
	ulint		latch_mode, /*!< in: BTR_SEARCH_LEAF, ..., ORed with
141 142
				at most one of BTR_INSERT, BTR_DELETE_MARK,
				BTR_DELETE, or BTR_ESTIMATE;
143
				cursor->left_block is used to store a pointer
osku's avatar
osku committed
144 145 146 147 148 149 150
				to the left neighbor page, in the cases
				BTR_SEARCH_PREV and BTR_MODIFY_PREV;
				NOTE that if has_search_latch
				is != 0, we maybe do not have a latch set
				on the cursor page, we assume
				the caller uses his search latch
				to protect the record! */
151
	btr_cur_t*	cursor, /*!< in/out: tree cursor; the cursor page is
osku's avatar
osku committed
152
				s- or x-latched, but see also above! */
153
	ulint		has_search_latch,/*!< in: latch mode the caller
osku's avatar
osku committed
154 155
				currently has on btr_search_latch:
				RW_S_LATCH, or 0 */
156 157
	const char*	file,	/*!< in: file name */
	ulint		line,	/*!< in: line where called */
158
	mtr_t*		mtr);	/*!< in: mtr */
159
/*****************************************************************//**
osku's avatar
osku committed
160
Opens a cursor at either end of an index. */
161
UNIV_INTERN
osku's avatar
osku committed
162
void
163 164
btr_cur_open_at_index_side_func(
/*============================*/
165
	ibool		from_left,	/*!< in: TRUE if open to the low end,
osku's avatar
osku committed
166
					FALSE if to the high end */
167 168 169
	dict_index_t*	index,		/*!< in: index */
	ulint		latch_mode,	/*!< in: latch mode */
	btr_cur_t*	cursor,		/*!< in: cursor */
170 171
	const char*	file,		/*!< in: file name */
	ulint		line,		/*!< in: line where called */
172
	mtr_t*		mtr);		/*!< in: mtr */
173 174
#define btr_cur_open_at_index_side(f,i,l,c,m)				\
	btr_cur_open_at_index_side_func(f,i,l,c,__FILE__,__LINE__,m)
175
/**********************************************************************//**
osku's avatar
osku committed
176
Positions a cursor at a randomly chosen position within a B-tree. */
177
UNIV_INTERN
osku's avatar
osku committed
178
void
179 180
btr_cur_open_at_rnd_pos_func(
/*=========================*/
181 182 183
	dict_index_t*	index,		/*!< in: index */
	ulint		latch_mode,	/*!< in: BTR_SEARCH_LEAF, ... */
	btr_cur_t*	cursor,		/*!< in/out: B-tree cursor */
184 185
	const char*	file,		/*!< in: file name */
	ulint		line,		/*!< in: line where called */
186
	mtr_t*		mtr);		/*!< in: mtr */
187 188
#define btr_cur_open_at_rnd_pos(i,l,c,m)				\
	btr_cur_open_at_rnd_pos_func(i,l,c,__FILE__,__LINE__,m)
189
/*************************************************************//**
osku's avatar
osku committed
190 191 192 193
Tries to perform an insert to a page in an index tree, next to cursor.
It is assumed that mtr holds an x-latch on the page. The operation does
not succeed if there is too little space on the page. If there is just
one record on the page, the insert will always succeed; this is to
194 195
prevent trying to split a page with just one record.
@return	DB_SUCCESS, DB_WAIT_LOCK, DB_FAIL, or error number */
196
UNIV_INTERN
osku's avatar
osku committed
197 198 199
ulint
btr_cur_optimistic_insert(
/*======================*/
200
	ulint		flags,	/*!< in: undo logging and locking flags: if not
osku's avatar
osku committed
201 202
				zero, the parameters index and thr should be
				specified */
203
	btr_cur_t*	cursor,	/*!< in: cursor on page after which to insert;
osku's avatar
osku committed
204
				cursor stays valid */
205 206
	dtuple_t*	entry,	/*!< in/out: entry to insert */
	rec_t**		rec,	/*!< out: pointer to inserted record if
osku's avatar
osku committed
207
				succeed */
208
	big_rec_t**	big_rec,/*!< out: big rec vector whose fields have to
osku's avatar
osku committed
209 210
				be stored externally by the caller, or
				NULL */
211 212 213
	ulint		n_ext,	/*!< in: number of externally stored columns */
	que_thr_t*	thr,	/*!< in: query thread or NULL */
	mtr_t*		mtr);	/*!< in: mtr; if this function returns
214 215 216 217
				DB_SUCCESS on a leaf page of a secondary
				index in a compressed tablespace, the
				mtr must be committed before latching
				any further pages */
218
/*************************************************************//**
osku's avatar
osku committed
219 220 221
Performs an insert on a page of an index tree. It is assumed that mtr
holds an x-latch on the tree and on the cursor page. If the insert is
made on the leaf level, to avoid deadlocks, mtr must also own x-latches
222 223
to brothers of page, if those brothers exist.
@return	DB_SUCCESS or error number */
224
UNIV_INTERN
osku's avatar
osku committed
225 226 227
ulint
btr_cur_pessimistic_insert(
/*=======================*/
228
	ulint		flags,	/*!< in: undo logging and locking flags: if not
osku's avatar
osku committed
229 230 231 232 233
				zero, the parameter thr should be
				specified; if no undo logging is specified,
				then the caller must have reserved enough
				free extents in the file space so that the
				insertion will certainly succeed */
234
	btr_cur_t*	cursor,	/*!< in: cursor after which to insert;
osku's avatar
osku committed
235
				cursor stays valid */
236 237
	dtuple_t*	entry,	/*!< in/out: entry to insert */
	rec_t**		rec,	/*!< out: pointer to inserted record if
osku's avatar
osku committed
238
				succeed */
239
	big_rec_t**	big_rec,/*!< out: big rec vector whose fields have to
osku's avatar
osku committed
240 241
				be stored externally by the caller, or
				NULL */
242 243 244
	ulint		n_ext,	/*!< in: number of externally stored columns */
	que_thr_t*	thr,	/*!< in: query thread or NULL */
	mtr_t*		mtr);	/*!< in: mtr */
245
/*************************************************************//**
246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261
See if there is enough place in the page modification log to log
an update-in-place.
@return	TRUE if enough place */
UNIV_INTERN
ibool
btr_cur_update_alloc_zip(
/*=====================*/
	page_zip_des_t*	page_zip,/*!< in/out: compressed page */
	buf_block_t*	block,	/*!< in/out: buffer page */
	dict_index_t*	index,	/*!< in: the index corresponding to the block */
	ulint		length,	/*!< in: size needed */
	ibool		create,	/*!< in: TRUE=delete-and-insert,
				FALSE=update-in-place */
	mtr_t*		mtr)	/*!< in: mini-transaction */
	__attribute__((nonnull, warn_unused_result));
/*************************************************************//**
262 263
Updates a record when the update causes no size changes in its fields.
@return	DB_SUCCESS or error number */
264
UNIV_INTERN
osku's avatar
osku committed
265 266 267
ulint
btr_cur_update_in_place(
/*====================*/
268 269
	ulint		flags,	/*!< in: undo logging and locking flags */
	btr_cur_t*	cursor,	/*!< in: cursor on the record to update;
osku's avatar
osku committed
270 271
				cursor stays valid and positioned on the
				same record */
272 273
	const upd_t*	update,	/*!< in: update vector */
	ulint		cmpl_info,/*!< in: compiler info on secondary index
osku's avatar
osku committed
274
				updates */
275 276
	que_thr_t*	thr,	/*!< in: query thread */
	mtr_t*		mtr);	/*!< in: mtr; must be committed before
277
				latching any further pages */
278
/*************************************************************//**
osku's avatar
osku committed
279 280 281
Tries to update a record on a page in an index tree. It is assumed that mtr
holds an x-latch on the page. The operation does not succeed if there is too
little space on the page or if the update would result in too empty a page,
282
so that tree compression is recommended.
283 284 285
@return DB_SUCCESS, or DB_OVERFLOW if the updated record does not fit,
DB_UNDERFLOW if the page would become too empty, or DB_ZIP_OVERFLOW if
there is not enough space left on the compressed page */
286
UNIV_INTERN
osku's avatar
osku committed
287 288 289
ulint
btr_cur_optimistic_update(
/*======================*/
290 291
	ulint		flags,	/*!< in: undo logging and locking flags */
	btr_cur_t*	cursor,	/*!< in: cursor on the record to update;
osku's avatar
osku committed
292 293
				cursor stays valid and positioned on the
				same record */
294
	const upd_t*	update,	/*!< in: update vector; this must also
osku's avatar
osku committed
295
				contain trx id and roll ptr fields */
296
	ulint		cmpl_info,/*!< in: compiler info on secondary index
osku's avatar
osku committed
297
				updates */
298 299
	que_thr_t*	thr,	/*!< in: query thread */
	mtr_t*		mtr);	/*!< in: mtr; must be committed before
300
				latching any further pages */
301
/*************************************************************//**
osku's avatar
osku committed
302 303 304
Performs an update of a record on a page of a tree. It is assumed
that mtr holds an x-latch on the tree and on the cursor page. If the
update is made on the leaf level, to avoid deadlocks, mtr must also
305 306
own x-latches to brothers of page, if those brothers exist.
@return	DB_SUCCESS or error code */
307
UNIV_INTERN
osku's avatar
osku committed
308 309 310
ulint
btr_cur_pessimistic_update(
/*=======================*/
311
	ulint		flags,	/*!< in: undo logging, locking, and rollback
osku's avatar
osku committed
312
				flags */
313
	btr_cur_t*	cursor,	/*!< in: cursor on the record to update */
314 315
	mem_heap_t**	heap,	/*!< in/out: pointer to memory heap, or NULL */
	big_rec_t**	big_rec,/*!< out: big rec vector whose fields have to
osku's avatar
osku committed
316
				be stored externally by the caller, or NULL */
317
	const upd_t*	update,	/*!< in: update vector; this is allowed also
osku's avatar
osku committed
318 319
				contain trx id and roll ptr fields, but
				the values in update vector have no effect */
320
	ulint		cmpl_info,/*!< in: compiler info on secondary index
osku's avatar
osku committed
321
				updates */
322 323
	que_thr_t*	thr,	/*!< in: query thread */
	mtr_t*		mtr);	/*!< in: mtr; must be committed before
324
				latching any further pages */
325
/***********************************************************//**
osku's avatar
osku committed
326 327 328
Marks a clustered index record deleted. Writes an undo log record to
undo log on this delete marking. Writes in the trx id field the id
of the deleting transaction, and in the roll ptr field pointer to the
329 330
undo log record created.
@return	DB_SUCCESS, DB_LOCK_WAIT, or error number */
331
UNIV_INTERN
osku's avatar
osku committed
332 333 334
ulint
btr_cur_del_mark_set_clust_rec(
/*===========================*/
335
	ulint		flags,	/*!< in: undo logging and locking flags */
336 337 338 339
	buf_block_t*	block,	/*!< in/out: buffer block of the record */
	rec_t*		rec,	/*!< in/out: record */
	dict_index_t*	index,	/*!< in: clustered index of the record */
	const ulint*	offsets,/*!< in: rec_get_offsets(rec) */
340 341
	ibool		val,	/*!< in: value to set */
	que_thr_t*	thr,	/*!< in: query thread */
342 343
	mtr_t*		mtr)	/*!< in: mtr */
	__attribute__((nonnull));
344
/***********************************************************//**
345 346
Sets a secondary index record delete mark to TRUE or FALSE.
@return	DB_SUCCESS, DB_LOCK_WAIT, or error number */
347
UNIV_INTERN
osku's avatar
osku committed
348 349 350
ulint
btr_cur_del_mark_set_sec_rec(
/*=========================*/
351 352 353 354 355
	ulint		flags,	/*!< in: locking flag */
	btr_cur_t*	cursor,	/*!< in: cursor */
	ibool		val,	/*!< in: value to set */
	que_thr_t*	thr,	/*!< in: query thread */
	mtr_t*		mtr);	/*!< in: mtr */
356
/*************************************************************//**
osku's avatar
osku committed
357 358 359 360
Tries to compress a page of the tree if it seems useful. It is assumed
that mtr holds an x-latch on the tree and on the cursor page. To avoid
deadlocks, mtr must also own x-latches to brothers of page, if those
brothers exist. NOTE: it is assumed that the caller has reserved enough
361 362
free extents so that the compression will always succeed if done!
@return	TRUE if compression occurred */
363
UNIV_INTERN
osku's avatar
osku committed
364 365 366
ibool
btr_cur_compress_if_useful(
/*=======================*/
367
	btr_cur_t*	cursor,	/*!< in: cursor on the page to compress;
osku's avatar
osku committed
368 369
				cursor does not stay valid if compression
				occurs */
370
	mtr_t*		mtr);	/*!< in: mtr */
371
/*******************************************************//**
osku's avatar
osku committed
372 373
Removes the record on which the tree cursor is positioned. It is assumed
that the mtr has an x-latch on the page where the cursor is positioned,
374 375
but no latch on the whole tree.
@return	TRUE if success, i.e., the page did not become too empty */
376
UNIV_INTERN
osku's avatar
osku committed
377 378 379
ibool
btr_cur_optimistic_delete(
/*======================*/
380
	btr_cur_t*	cursor,	/*!< in: cursor on the record to delete;
osku's avatar
osku committed
381 382 383
				cursor stays valid: if deletion succeeds,
				on function exit it points to the successor
				of the deleted record */
384
	mtr_t*		mtr);	/*!< in: mtr; if this function returns
385 386 387
				TRUE on a leaf page of a secondary
				index, the mtr must be committed
				before latching any further pages */
388
/*************************************************************//**
osku's avatar
osku committed
389 390 391 392 393
Removes the record on which the tree cursor is positioned. Tries
to compress the page if its fillfactor drops below a threshold
or if it is the only page on the level. It is assumed that mtr holds
an x-latch on the tree and on the cursor page. To avoid deadlocks,
mtr must also own x-latches to brothers of page, if those brothers
394 395
exist.
@return	TRUE if compression occurred */
396
UNIV_INTERN
osku's avatar
osku committed
397 398 399
ibool
btr_cur_pessimistic_delete(
/*=======================*/
400
	ulint*		err,	/*!< out: DB_SUCCESS or DB_OUT_OF_FILE_SPACE;
osku's avatar
osku committed
401 402 403 404
				the latter may occur because we may have
				to update node pointers on upper levels,
				and in the case of variable length keys
				these may actually grow in size */
405
	ibool		has_reserved_extents, /*!< in: TRUE if the
osku's avatar
osku committed
406 407 408
				caller has already reserved enough free
				extents so that he knows that the operation
				will succeed */
409
	btr_cur_t*	cursor,	/*!< in: cursor on the record to delete;
osku's avatar
osku committed
410 411 412
				if compression does not occur, the cursor
				stays valid: it points to successor of
				deleted record on function exit */
413 414
	enum trx_rb_ctx	rb_ctx,	/*!< in: rollback context */
	mtr_t*		mtr);	/*!< in: mtr */
415
#endif /* !UNIV_HOTBACKUP */
416
/***********************************************************//**
417 418
Parses a redo log record of updating a record in-place.
@return	end of log record or NULL */
419
UNIV_INTERN
osku's avatar
osku committed
420 421 422
byte*
btr_cur_parse_update_in_place(
/*==========================*/
423 424 425 426 427
	byte*		ptr,	/*!< in: buffer */
	byte*		end_ptr,/*!< in: buffer end */
	page_t*		page,	/*!< in/out: page or NULL */
	page_zip_des_t*	page_zip,/*!< in/out: compressed page, or NULL */
	dict_index_t*	index);	/*!< in: index corresponding to page */
428
/****************************************************************//**
osku's avatar
osku committed
429
Parses the redo log record for delete marking or unmarking of a clustered
430 431
index record.
@return	end of log record or NULL */
432
UNIV_INTERN
osku's avatar
osku committed
433 434 435
byte*
btr_cur_parse_del_mark_set_clust_rec(
/*=================================*/
436 437 438 439 440
	byte*		ptr,	/*!< in: buffer */
	byte*		end_ptr,/*!< in: buffer end */
	page_t*		page,	/*!< in/out: page or NULL */
	page_zip_des_t*	page_zip,/*!< in/out: compressed page, or NULL */
	dict_index_t*	index);	/*!< in: index corresponding to page */
441
/****************************************************************//**
osku's avatar
osku committed
442
Parses the redo log record for delete marking or unmarking of a secondary
443 444
index record.
@return	end of log record or NULL */
445
UNIV_INTERN
osku's avatar
osku committed
446 447 448
byte*
btr_cur_parse_del_mark_set_sec_rec(
/*===============================*/
449 450 451 452
	byte*		ptr,	/*!< in: buffer */
	byte*		end_ptr,/*!< in: buffer end */
	page_t*		page,	/*!< in/out: page or NULL */
	page_zip_des_t*	page_zip);/*!< in/out: compressed page, or NULL */
453
#ifndef UNIV_HOTBACKUP
454
/*******************************************************************//**
455 456
Estimates the number of rows in a given index range.
@return	estimated number of rows */
457
UNIV_INTERN
458
ib_int64_t
osku's avatar
osku committed
459 460
btr_estimate_n_rows_in_range(
/*=========================*/
461 462 463 464 465
	dict_index_t*	index,	/*!< in: index */
	const dtuple_t*	tuple1,	/*!< in: range start, may also be empty tuple */
	ulint		mode1,	/*!< in: search mode for range start */
	const dtuple_t*	tuple2,	/*!< in: range end, may also be empty tuple */
	ulint		mode2);	/*!< in: search mode for range end */
466
/*******************************************************************//**
osku's avatar
osku committed
467 468
Estimates the number of different key values in a given index, for
each n-column prefix of the index where n <= dict_index_get_n_unique(index).
469 470 471 472
The estimates are stored in the array index->stat_n_diff_key_vals.
If innodb_stats_method is nulls_ignored, we also record the number of
non-null values for each prefix and stored the estimates in
array index->stat_n_non_null_key_vals. */
473
UNIV_INTERN
osku's avatar
osku committed
474 475 476
void
btr_estimate_number_of_different_key_vals(
/*======================================*/
477
	dict_index_t*	index);	/*!< in: index */
478
/*******************************************************************//**
479 480
Marks non-updated off-page fields as disowned by this record. The ownership
must be transferred to the updated record which is inserted elsewhere in the
osku's avatar
osku committed
481
index tree. In purge only the owner of externally stored field is allowed
482
to free the field. */
483
UNIV_INTERN
484
void
485 486
btr_cur_disown_inherited_fields(
/*============================*/
487
	page_zip_des_t*	page_zip,/*!< in/out: compressed page whose uncompressed
488
				part will be updated, or NULL */
489 490 491 492
	rec_t*		rec,	/*!< in/out: record in a clustered index */
	dict_index_t*	index,	/*!< in: index of the page */
	const ulint*	offsets,/*!< in: array returned by rec_get_offsets() */
	const upd_t*	update,	/*!< in: update vector */
493 494
	mtr_t*		mtr)	/*!< in/out: mini-transaction */
	__attribute__((nonnull(2,3,4,5,6)));
495
/*******************************************************************//**
osku's avatar
osku committed
496
Stores the fields in big_rec_vec to the tablespace and puts pointers to
497 498
them in rec.  The extern flags in rec will have to be set beforehand.
The fields are stored on pages allocated from leaf node
499
file segment of the index tree.
500
@return	DB_SUCCESS or DB_OUT_OF_FILE_SPACE */
501
UNIV_INTERN
osku's avatar
osku committed
502
ulint
503 504
btr_store_big_rec_extern_fields_func(
/*=================================*/
505
	dict_index_t*	index,		/*!< in: index of rec; the index tree
osku's avatar
osku committed
506
					MUST be X-latched */
507 508 509
	buf_block_t*	rec_block,	/*!< in/out: block containing rec */
	rec_t*		rec,		/*!< in: record */
	const ulint*	offsets,	/*!< in: rec_get_offsets(rec, index);
510 511 512
					the "external storage" flags in offsets
					will not correspond to rec when
					this function returns */
513 514 515 516 517 518 519 520
#ifdef UNIV_DEBUG
	mtr_t*		local_mtr,	/*!< in: mtr containing the
					latch to rec and to the tree */
#endif /* UNIV_DEBUG */
#if defined UNIV_DEBUG || defined UNIV_BLOB_LIGHT_DEBUG
	ibool		update_in_place,/*! in: TRUE if the record is updated
					in place (not delete+insert) */
#endif /* UNIV_DEBUG || UNIV_BLOB_LIGHT_DEBUG */
521 522 523
	const big_rec_t*big_rec_vec)	/*!< in: vector containing fields
					to be stored externally */
	__attribute__((nonnull));
524 525 526 527 528 529 530 531

/** Stores the fields in big_rec_vec to the tablespace and puts pointers to
them in rec.  The extern flags in rec will have to be set beforehand.
The fields are stored on pages allocated from leaf node
file segment of the index tree.
@param index	in: clustered index; MUST be X-latched by mtr
@param b	in/out: block containing rec; MUST be X-latched by mtr
@param rec	in/out: clustered index record
532
@param offsets	in: rec_get_offsets(rec, index);
533 534 535
		the "external storage" flags in offsets will not be adjusted
@param mtr	in: mini-transaction that holds x-latch on index and b
@param upd	in: TRUE if the record is updated in place (not delete+insert)
536
@param big	in: vector containing fields to be stored externally
537 538
@return	DB_SUCCESS or DB_OUT_OF_FILE_SPACE */
#ifdef UNIV_DEBUG
539 540
# define btr_store_big_rec_extern_fields(index,b,rec,offsets,mtr,upd,big) \
	btr_store_big_rec_extern_fields_func(index,b,rec,offsets,mtr,upd,big)
541
#elif defined UNIV_BLOB_LIGHT_DEBUG
542 543
# define btr_store_big_rec_extern_fields(index,b,rec,offsets,mtr,upd,big) \
	btr_store_big_rec_extern_fields_func(index,b,rec,offsets,upd,big)
544
#else
545 546
# define btr_store_big_rec_extern_fields(index,b,rec,offsets,mtr,upd,big) \
	btr_store_big_rec_extern_fields_func(index,b,rec,offsets,big)
547 548
#endif

549
/*******************************************************************//**
osku's avatar
osku committed
550 551 552 553
Frees the space in an externally stored field to the file space
management if the field in data is owned the externally stored field,
in a rollback we may have the additional condition that the field must
not be inherited. */
554
UNIV_INTERN
osku's avatar
osku committed
555 556 557
void
btr_free_externally_stored_field(
/*=============================*/
558
	dict_index_t*	index,		/*!< in: index of the data, the index
osku's avatar
osku committed
559 560 561 562 563 564 565
					tree MUST be X-latched; if the tree
					height is 1, then also the root page
					must be X-latched! (this is relevant
					in the case this function is called
					from purge where 'data' is located on
					an undo log page, not an index
					page) */
566 567
	byte*		field_ref,	/*!< in/out: field reference */
	const rec_t*	rec,		/*!< in: record containing field_ref, for
marko's avatar
marko committed
568
					page_zip_write_blob_ptr(), or NULL */
569
	const ulint*	offsets,	/*!< in: rec_get_offsets(rec, index),
570
					or NULL */
571
	page_zip_des_t*	page_zip,	/*!< in: compressed page corresponding
marko's avatar
marko committed
572
					to rec, or NULL if rec == NULL */
573
	ulint		i,		/*!< in: field number of field_ref;
marko's avatar
marko committed
574
					ignored if rec == NULL */
575 576
	enum trx_rb_ctx	rb_ctx,		/*!< in: rollback context */
	mtr_t*		local_mtr);	/*!< in: mtr containing the latch to
osku's avatar
osku committed
577 578
					data an an X-latch to the index
					tree */
579
/*******************************************************************//**
580
Copies the prefix of an externally stored field of a record.  The
581
clustered index record must be protected by a lock or a page latch.
582 583
@return the length of the copied field, or 0 if the column was being
or has been deleted */
584
UNIV_INTERN
585 586 587
ulint
btr_copy_externally_stored_field_prefix(
/*====================================*/
588 589 590
	byte*		buf,	/*!< out: the field, or a prefix of it */
	ulint		len,	/*!< in: length of buf, in bytes */
	ulint		zip_size,/*!< in: nonzero=compressed BLOB page size,
591
				zero for uncompressed BLOBs */
592
	const byte*	data,	/*!< in: 'internally' stored part of the
593
				field containing also the reference to
594 595
				the external part; must be protected by
				a lock or a page latch */
596
	ulint		local_len);/*!< in: length of data, in bytes */
597
/*******************************************************************//**
598
Copies an externally stored field of a record to mem heap.
599
@return	the field copied to heap, or NULL if the field is incomplete */
600
UNIV_INTERN
osku's avatar
osku committed
601 602 603
byte*
btr_rec_copy_externally_stored_field(
/*=================================*/
604
	const rec_t*	rec,	/*!< in: record in a clustered index;
605
				must be protected by a lock or a page latch */
606 607
	const ulint*	offsets,/*!< in: array returned by rec_get_offsets() */
	ulint		zip_size,/*!< in: nonzero=compressed BLOB page size,
608
				zero for uncompressed BLOBs */
609 610 611
	ulint		no,	/*!< in: field number */
	ulint*		len,	/*!< out: length of the field */
	mem_heap_t*	heap);	/*!< in: mem heap */
612
/*******************************************************************//**
613 614
Flags the data tuple fields that are marked as extern storage in the
update vector.  We use this function to remember which fields we must
615 616
mark as extern storage in a record inserted for an update.
@return	number of flagged external columns */
617
UNIV_INTERN
osku's avatar
osku committed
618 619 620
ulint
btr_push_update_extern_fields(
/*==========================*/
621 622 623
	dtuple_t*	tuple,	/*!< in/out: data tuple */
	const upd_t*	update,	/*!< in: update vector */
	mem_heap_t*	heap)	/*!< in: memory heap */
624
	__attribute__((nonnull));
625
/***********************************************************//**
626 627
Sets a secondary index record's delete mark to the given value. This
function is only used by the insert buffer merge mechanism. */
marko's avatar
marko committed
628
UNIV_INTERN
629 630 631
void
btr_cur_set_deleted_flag_for_ibuf(
/*==============================*/
632 633
	rec_t*		rec,		/*!< in/out: record */
	page_zip_des_t*	page_zip,	/*!< in/out: compressed page
634 635 636
					corresponding to rec, or NULL
					when the tablespace is
					uncompressed */
637 638
	ibool		val,		/*!< in: value to set */
	mtr_t*		mtr);		/*!< in: mtr */
osku's avatar
osku committed
639 640
/*######################################################################*/

641
/** In the pessimistic delete, if the page data size drops below this
osku's avatar
osku committed
642 643 644
limit, merging it to a neighbor is tried */
#define BTR_CUR_PAGE_COMPRESS_LIMIT	(UNIV_PAGE_SIZE / 2)

645
/** A slot in the path array. We store here info on a search path down the
osku's avatar
osku committed
646 647 648 649
tree. Each slot contains data on a single level of the tree. */

typedef struct btr_path_struct	btr_path_t;
struct btr_path_struct{
650
	ulint	nth_rec;	/*!< index of the record
osku's avatar
osku committed
651 652 653 654
				where the page cursor stopped on
				this level (index in alphabetical
				order); value ULINT_UNDEFINED
				denotes array end */
655
	ulint	n_recs;		/*!< number of records on the page */
656 657 658 659 660
	ulint	page_no;	/*!< no of the page containing the record */
	ulint	page_level;	/*!< level of the page, if later we fetch
				the page under page_no and it is no different
				level then we know that the tree has been
				reorganized */
osku's avatar
osku committed
661 662
};

663
#define BTR_PATH_ARRAY_N_SLOTS	250	/*!< size of path array (in slots) */
osku's avatar
osku committed
664

665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680
/** Values for the flag documenting the used search method */
enum btr_cur_method {
	BTR_CUR_HASH = 1,	/*!< successful shortcut using
				the hash index */
	BTR_CUR_HASH_FAIL,	/*!< failure using hash, success using
				binary search: the misleading hash
				reference is stored in the field
				hash_node, and might be necessary to
				update */
	BTR_CUR_BINARY,		/*!< success using the binary search */
	BTR_CUR_INSERT_TO_IBUF,	/*!< performed the intended insert to
				the insert buffer */
	BTR_CUR_DEL_MARK_IBUF,	/*!< performed the intended delete
				mark in the insert/delete buffer */
	BTR_CUR_DELETE_IBUF,	/*!< performed the intended delete in
				the insert/delete buffer */
681
	BTR_CUR_DELETE_REF	/*!< row_purge_poss_sec() failed */
682
};
osku's avatar
osku committed
683

684 685
/** The tree cursor: the definition appears here only for the compiler
to know struct size! */
osku's avatar
osku committed
686
struct btr_cur_struct {
687 688 689 690
	dict_index_t*	index;		/*!< index where positioned */
	page_cur_t	page_cur;	/*!< page cursor */
	purge_node_t*	purge_node;	/*!< purge node, for BTR_DELETE */
	buf_block_t*	left_block;	/*!< this field is used to store
691 692 693 694
					a pointer to the left neighbor
					page, in the cases
					BTR_SEARCH_PREV and
					BTR_MODIFY_PREV */
osku's avatar
osku committed
695
	/*------------------------------*/
696 697 698 699 700
	que_thr_t*	thr;		/*!< this field is only used
					when btr_cur_search_to_nth_level
					is called for an index entry
					insertion: the calling query
					thread is passed here to be
osku's avatar
osku committed
701 702
					used in the insert buffer */
	/*------------------------------*/
703 704 705 706 707
	/** The following fields are used in
	btr_cur_search_to_nth_level to pass information: */
	/* @{ */
	enum btr_cur_method	flag;	/*!< Search method used */
	ulint		tree_height;	/*!< Tree height if the search is done
osku's avatar
osku committed
708 709
					for a pessimistic insert or update
					operation */
710
	ulint		up_match;	/*!< If the search mode was PAGE_CUR_LE,
osku's avatar
osku committed
711 712 713
					the number of matched fields to the
					the first user record to the right of
					the cursor record after
714
					btr_cur_search_to_nth_level;
osku's avatar
osku committed
715 716 717 718 719 720 721 722 723
					for the mode PAGE_CUR_GE, the matched
					fields to the first user record AT THE
					CURSOR or to the right of it;
					NOTE that the up_match and low_match
					values may exceed the correct values
					for comparison to the adjacent user
					record if that record is on a
					different leaf page! (See the note in
					row_ins_duplicate_key.) */
724
	ulint		up_bytes;	/*!< number of matched bytes to the
osku's avatar
osku committed
725 726 727
					right at the time cursor positioned;
					only used internally in searches: not
					defined after the search */
728
	ulint		low_match;	/*!< if search mode was PAGE_CUR_LE,
osku's avatar
osku committed
729 730 731
					the number of matched fields to the
					first user record AT THE CURSOR or
					to the left of it after
732
					btr_cur_search_to_nth_level;
osku's avatar
osku committed
733 734 735
					NOT defined for PAGE_CUR_GE or any
					other search modes; see also the NOTE
					in up_match! */
736
	ulint		low_bytes;	/*!< number of matched bytes to the
osku's avatar
osku committed
737 738 739
					right at the time cursor positioned;
					only used internally in searches: not
					defined after the search */
740
	ulint		n_fields;	/*!< prefix length used in a hash
osku's avatar
osku committed
741
					search if hash_node != NULL */
742
	ulint		n_bytes;	/*!< hash prefix bytes if hash_node !=
osku's avatar
osku committed
743
					NULL */
744
	ulint		fold;		/*!< fold value used in the search if
osku's avatar
osku committed
745
					flag is BTR_CUR_HASH */
746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762
	/*----- Delete buffering -------*/
	ulint		ibuf_cnt;	/* in searches done on insert buffer
					trees, this contains the "counter"
					value (the first two bytes of the
					fourth field) extracted from the
					page above the leaf page, from the
					father node pointer that pointed to
					the leaf page. in other words, it
					contains the minimum counter value
					for records to be inserted on the
					chosen leaf page. If for some reason
					this can't be read, or if the search
					ended on the leftmost leaf page in
					the tree (in which case the father
					node pointer had the 'minimum
					record' flag set), this is
					ULINT_UNDEFINED. */
osku's avatar
osku committed
763
	/*------------------------------*/
764 765
	/* @} */
	btr_path_t*	path_arr;	/*!< in estimating the number of
osku's avatar
osku committed
766 767 768 769 770
					rows in range, we store in this array
					information of the path through
					the tree */
};

771 772 773
/** If pessimistic delete fails because of lack of file space, there
is still a good change of success a little later.  Try this many
times. */
osku's avatar
osku committed
774
#define BTR_CUR_RETRY_DELETE_N_TIMES	100
775 776 777
/** If pessimistic delete fails because of lack of file space, there
is still a good change of success a little later.  Sleep this many
microseconds between retries. */
osku's avatar
osku committed
778 779
#define BTR_CUR_RETRY_SLEEP_TIME	50000

780
/** The reference in a field for which data is stored on a different page.
osku's avatar
osku committed
781 782 783 784 785
The reference is at the end of the 'locally' stored part of the field.
'Locally' means storage in the index record.
We store locally a long enough prefix of each column so that we can determine
the ordering parts of each index record without looking into the externally
stored part. */
786 787 788 789
/*-------------------------------------- @{ */
#define BTR_EXTERN_SPACE_ID		0	/*!< space id where stored */
#define BTR_EXTERN_PAGE_NO		4	/*!< page no where stored */
#define BTR_EXTERN_OFFSET		8	/*!< offset of BLOB header
osku's avatar
osku committed
790
						on that page */
791
#define BTR_EXTERN_LEN			12	/*!< 8 bytes containing the
osku's avatar
osku committed
792 793 794 795
						length of the externally
						stored part of the BLOB.
						The 2 highest bits are
						reserved to the flags below. */
796
/*-------------------------------------- @} */
797
/* #define BTR_EXTERN_FIELD_REF_SIZE	20 // moved to btr0types.h */
osku's avatar
osku committed
798

799 800 801 802
/** The most significant bit of BTR_EXTERN_LEN (i.e., the most
significant bit of the byte at smallest address) is set to 1 if this
field does not 'own' the externally stored field; only the owner field
is allowed to free the field in purge! */
osku's avatar
osku committed
803
#define BTR_EXTERN_OWNER_FLAG		128
804 805 806 807 808
/** If the second most significant bit of BTR_EXTERN_LEN (i.e., the
second most significant bit of the byte at smallest address) is 1 then
it means that the externally stored field was inherited from an
earlier version of the row.  In rollback we are not allowed to free an
inherited external field. */
osku's avatar
osku committed
809 810
#define BTR_EXTERN_INHERITED_FLAG	64

811
/** Number of searches down the B-tree in btr_cur_search_to_nth_level(). */
osku's avatar
osku committed
812
extern ulint	btr_cur_n_non_sea;
813 814
/** Number of successful adaptive hash index lookups in
btr_cur_search_to_nth_level(). */
osku's avatar
osku committed
815
extern ulint	btr_cur_n_sea;
816 817 818
/** Old value of btr_cur_n_non_sea.  Copied by
srv_refresh_innodb_monitor_stats().  Referenced by
srv_printf_innodb_monitor(). */
osku's avatar
osku committed
819
extern ulint	btr_cur_n_non_sea_old;
820 821 822
/** Old value of btr_cur_n_sea.  Copied by
srv_refresh_innodb_monitor_stats().  Referenced by
srv_printf_innodb_monitor(). */
osku's avatar
osku committed
823
extern ulint	btr_cur_n_sea_old;
824
#endif /* !UNIV_HOTBACKUP */
osku's avatar
osku committed
825 826 827 828

#ifndef UNIV_NONINL
#include "btr0cur.ic"
#endif
829

osku's avatar
osku committed
830
#endif