Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
M
mariadb
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
Analytics
Analytics
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Commits
Issue Boards
Open sidebar
Kirill Smelkov
mariadb
Commits
79a03447
Commit
79a03447
authored
Aug 29, 2011
by
Marko Mäkelä
Browse files
Options
Browse Files
Download
Plain Diff
Merge mysql-5.1 to mysql-5.5.
parents
10637a25
41bb3537
Changes
15
Expand all
Show whitespace changes
Inline
Side-by-side
Showing
15 changed files
with
531 additions
and
290 deletions
+531
-290
storage/innobase/btr/btr0btr.c
storage/innobase/btr/btr0btr.c
+199
-21
storage/innobase/btr/btr0cur.c
storage/innobase/btr/btr0cur.c
+59
-55
storage/innobase/buf/buf0buf.c
storage/innobase/buf/buf0buf.c
+0
-25
storage/innobase/fsp/fsp0fsp.c
storage/innobase/fsp/fsp0fsp.c
+138
-96
storage/innobase/include/btr0btr.h
storage/innobase/include/btr0btr.h
+33
-1
storage/innobase/include/btr0cur.h
storage/innobase/include/btr0cur.h
+17
-21
storage/innobase/include/buf0buf.h
storage/innobase/include/buf0buf.h
+0
-9
storage/innobase/include/fsp0fsp.h
storage/innobase/include/fsp0fsp.h
+17
-13
storage/innobase/include/mtr0mtr.h
storage/innobase/include/mtr0mtr.h
+10
-5
storage/innobase/include/mtr0mtr.ic
storage/innobase/include/mtr0mtr.ic
+5
-3
storage/innobase/mtr/mtr0mtr.c
storage/innobase/mtr/mtr0mtr.c
+3
-4
storage/innobase/row/row0ins.c
storage/innobase/row/row0ins.c
+21
-12
storage/innobase/row/row0row.c
storage/innobase/row/row0row.c
+14
-13
storage/innobase/row/row0upd.c
storage/innobase/row/row0upd.c
+13
-10
storage/innobase/trx/trx0undo.c
storage/innobase/trx/trx0undo.c
+2
-2
No files found.
storage/innobase/btr/btr0btr.c
View file @
79a03447
...
...
@@ -906,28 +906,29 @@ btr_page_alloc_for_ibuf(
/**************************************************************//**
Allocates a new file page to be used in an index tree. NOTE: we assume
that the caller has made the reservation for free extents!
@return
new allocated block, x-latched;
NULL if out of space */
UNIV_INTERN
buf_block_t
*
btr_page_alloc
(
/*===========*/
@return allocated page number, FIL_NULL if out of space */
static
__attribute__
((
nonnull
(
1
,
5
),
warn_unused_result
))
ulint
btr_page_alloc
_low
(
/*===========
====
*/
dict_index_t
*
index
,
/*!< in: index */
ulint
hint_page_no
,
/*!< in: hint of a good page */
byte
file_direction
,
/*!< in: direction where a possible
page split is made */
ulint
level
,
/*!< in: level where the page is placed
in the tree */
mtr_t
*
mtr
)
/*!< in: mtr */
mtr_t
*
mtr
,
/*!< in/out: mini-transaction
for the allocation */
mtr_t
*
init_mtr
)
/*!< in/out: mini-transaction
in which the page should be
initialized (may be the same
as mtr), or NULL if it should
not be initialized (the page
at hint was previously freed
in mtr) */
{
fseg_header_t
*
seg_header
;
page_t
*
root
;
buf_block_t
*
new_block
;
ulint
new_page_no
;
if
(
dict_index_is_ibuf
(
index
))
{
return
(
btr_page_alloc_for_ibuf
(
index
,
mtr
));
}
root
=
btr_root_get
(
index
,
mtr
);
...
...
@@ -941,8 +942,42 @@ btr_page_alloc(
reservation for free extents, and thus we know that a page can
be allocated: */
new_page_no
=
fseg_alloc_free_page_general
(
seg_header
,
hint_page_no
,
file_direction
,
TRUE
,
mtr
);
return
(
fseg_alloc_free_page_general
(
seg_header
,
hint_page_no
,
file_direction
,
TRUE
,
mtr
,
init_mtr
));
}
/**************************************************************//**
Allocates a new file page to be used in an index tree. NOTE: we assume
that the caller has made the reservation for free extents!
@return new allocated block, x-latched; NULL if out of space */
UNIV_INTERN
buf_block_t
*
btr_page_alloc
(
/*===========*/
dict_index_t
*
index
,
/*!< in: index */
ulint
hint_page_no
,
/*!< in: hint of a good page */
byte
file_direction
,
/*!< in: direction where a possible
page split is made */
ulint
level
,
/*!< in: level where the page is placed
in the tree */
mtr_t
*
mtr
,
/*!< in/out: mini-transaction
for the allocation */
mtr_t
*
init_mtr
)
/*!< in/out: mini-transaction
for x-latching and initializing
the page */
{
buf_block_t
*
new_block
;
ulint
new_page_no
;
if
(
dict_index_is_ibuf
(
index
))
{
return
(
btr_page_alloc_for_ibuf
(
index
,
mtr
));
}
new_page_no
=
btr_page_alloc_low
(
index
,
hint_page_no
,
file_direction
,
level
,
mtr
,
init_mtr
);
if
(
new_page_no
==
FIL_NULL
)
{
return
(
NULL
);
...
...
@@ -950,9 +985,16 @@ btr_page_alloc(
new_block
=
buf_page_get
(
dict_index_get_space
(
index
),
dict_table_zip_size
(
index
->
table
),
new_page_no
,
RW_X_LATCH
,
mtr
);
new_page_no
,
RW_X_LATCH
,
init_
mtr
);
buf_block_dbg_add_level
(
new_block
,
SYNC_TREE_NODE_NEW
);
if
(
mtr
->
freed_clust_leaf
)
{
mtr_memo_release
(
mtr
,
new_block
,
MTR_MEMO_FREE_CLUST_LEAF
);
ut_ad
(
!
mtr_memo_contains
(
mtr
,
new_block
,
MTR_MEMO_FREE_CLUST_LEAF
));
}
ut_ad
(
btr_freed_leaves_validate
(
mtr
));
return
(
new_block
);
}
...
...
@@ -1065,6 +1107,15 @@ btr_page_free_low(
fseg_free_page
(
seg_header
,
buf_block_get_space
(
block
),
buf_block_get_page_no
(
block
),
mtr
);
/* The page was marked free in the allocation bitmap, but it
should remain buffer-fixed until mtr_commit(mtr) or until it
is explicitly freed from the mini-transaction. */
ut_ad
(
mtr_memo_contains
(
mtr
,
block
,
MTR_MEMO_PAGE_X_FIX
));
/* TODO: Discard any operations on the page from the redo log
and remove the block from the flush list and the buffer pool.
This would free up buffer pool earlier and reduce writes to
both the tablespace and the redo log. */
}
/**************************************************************//**
...
...
@@ -1078,12 +1129,139 @@ btr_page_free(
buf_block_t
*
block
,
/*!< in: block to be freed, x-latched */
mtr_t
*
mtr
)
/*!< in: mtr */
{
ulint
level
;
level
=
btr_page_get_level
(
buf_block_get_frame
(
block
),
mtr
);
const
page_t
*
page
=
buf_block_get_frame
(
block
);
ulint
level
=
btr_page_get_level
(
page
,
mtr
);
ut_ad
(
fil_page_get_type
(
block
->
frame
)
==
FIL_PAGE_INDEX
);
btr_page_free_low
(
index
,
block
,
level
,
mtr
);
/* The handling of MTR_MEMO_FREE_CLUST_LEAF assumes this. */
ut_ad
(
mtr_memo_contains
(
mtr
,
block
,
MTR_MEMO_PAGE_X_FIX
));
if
(
level
==
0
&&
dict_index_is_clust
(
index
))
{
/* We may have to call btr_mark_freed_leaves() to
temporarily mark the block nonfree for invoking
btr_store_big_rec_extern_fields_func() after an
update. Remember that the block was freed. */
mtr
->
freed_clust_leaf
=
TRUE
;
mtr_memo_push
(
mtr
,
block
,
MTR_MEMO_FREE_CLUST_LEAF
);
}
ut_ad
(
btr_freed_leaves_validate
(
mtr
));
}
/**************************************************************//**
Flips the allocation state of every page that the mini-transaction has
tagged MTR_MEMO_FREE_CLUST_LEAF.
Before btr_store_big_rec_extern_fields() is invoked after an update,
the freed clustered index pages must temporarily be marked allocated
(nonfree=TRUE), so that off-page columns will not be allocated from them.
Between btr_store_big_rec_extern_fields() and mtr_commit() the pages
have to be marked free again (nonfree=FALSE), so that no pages will
be leaked. */
UNIV_INTERN
void
btr_mark_freed_leaves(
/*==================*/
	dict_index_t*	index,	/*!< in/out: clustered index */
	mtr_t*		mtr,	/*!< in/out: mini-transaction */
	ibool		nonfree)/*!< in: TRUE=mark nonfree, FALSE=mark freed */
{
	ulint	memo_pos;

	ut_ad(dict_index_is_clust(index));
	ut_ad(mtr->magic_n == MTR_MAGIC_N);
	ut_ad(mtr->state == MTR_ACTIVE);

	if (!mtr->freed_clust_leaf) {
		/* No clustered index leaf page was freed in mtr:
		there is nothing to mark. */
		return;
	}

	/* Visit the memo slots from the last one to the first one.
	This traversal is loosely based on mtr_memo_release(). */
	for (memo_pos = dyn_array_get_data_size(&mtr->memo);
	     memo_pos > 0; ) {
		mtr_memo_slot_t*	memo_slot;
		buf_block_t*		leaf;

		memo_pos -= sizeof(mtr_memo_slot_t);
		memo_slot = dyn_array_get_element(&mtr->memo, memo_pos);

		if (memo_slot->type != MTR_MEMO_FREE_CLUST_LEAF) {
			/* Not a freed clustered index leaf page. */
			continue;
		}

		/* Because btr_page_alloc() does invoke
		mtr_memo_release on MTR_MEMO_FREE_CLUST_LEAF, all
		blocks tagged with MTR_MEMO_FREE_CLUST_LEAF in the
		memo must still be clustered index leaf tree pages. */
		leaf = memo_slot->object;

		ut_a(buf_block_get_space(leaf)
		     == dict_index_get_space(index));
		ut_a(fil_page_get_type(buf_block_get_frame(leaf))
		     == FIL_PAGE_INDEX);
		ut_a(page_is_leaf(buf_block_get_frame(leaf)));

		if (!nonfree) {
			/* Assert that the page is allocated and free it. */
			btr_page_free_low(index, leaf, 0, mtr);
		} else {
			/* Allocate the same page again, using its own
			page number as the hint and no init_mtr. */
			ulint	realloc_no = btr_page_alloc_low(
				index, buf_block_get_page_no(leaf),
				FSP_NO_DIR, 0, mtr, NULL);

			ut_a(realloc_no == buf_block_get_page_no(leaf));
		}
	}

	ut_ad(btr_freed_leaves_validate(mtr));
}
#ifdef UNIV_DEBUG
/**************************************************************//**
Checks every memo slot of the mini-transaction that is tagged
MTR_MEMO_FREE_CLUST_LEAF: the freed_clust_leaf flag of the
mini-transaction must be set, and the tagged block must hold a leaf
page of type FIL_PAGE_INDEX. A violation fails an assertion.
@see btr_mark_freed_leaves()
@return TRUE */
UNIV_INTERN
ibool
btr_freed_leaves_validate(
/*======================*/
	mtr_t*	mtr)	/*!< in: mini-transaction */
{
	ulint	memo_pos;

	ut_ad(mtr->magic_n == MTR_MAGIC_N);
	ut_ad(mtr->state == MTR_ACTIVE);

	/* Visit the memo slots from the last one to the first one. */
	for (memo_pos = dyn_array_get_data_size(&mtr->memo);
	     memo_pos > 0; ) {
		const mtr_memo_slot_t*	memo_slot;
		const buf_block_t*	leaf;

		memo_pos -= sizeof(mtr_memo_slot_t);
		memo_slot = dyn_array_get_element(&mtr->memo, memo_pos);

		if (memo_slot->type == MTR_MEMO_FREE_CLUST_LEAF) {
			/* A tagged slot implies that the flag was set. */
			ut_a(mtr->freed_clust_leaf);

			/* Because btr_page_alloc() does invoke
			mtr_memo_release on MTR_MEMO_FREE_CLUST_LEAF, all
			blocks tagged with MTR_MEMO_FREE_CLUST_LEAF in the
			memo must still be clustered index leaf tree pages. */
			leaf = memo_slot->object;

			ut_a(fil_page_get_type(buf_block_get_frame(leaf))
			     == FIL_PAGE_INDEX);
			ut_a(page_is_leaf(buf_block_get_frame(leaf)));
		}
	}

	return(TRUE);
}
#endif /* UNIV_DEBUG */
/**************************************************************//**
Sets the child node file address in a node pointer. */
...
...
@@ -1809,7 +1987,7 @@ btr_root_raise_and_insert(
level
=
btr_page_get_level
(
root
,
mtr
);
new_block
=
btr_page_alloc
(
index
,
0
,
FSP_NO_DIR
,
level
,
mtr
);
new_block
=
btr_page_alloc
(
index
,
0
,
FSP_NO_DIR
,
level
,
mtr
,
mtr
);
new_page
=
buf_block_get_frame
(
new_block
);
new_page_zip
=
buf_block_get_page_zip
(
new_block
);
ut_a
(
!
new_page_zip
==
!
root_page_zip
);
...
...
@@ -2545,7 +2723,7 @@ func_start:
/* 2. Allocate a new page to the index */
new_block
=
btr_page_alloc
(
cursor
->
index
,
hint_page_no
,
direction
,
btr_page_get_level
(
page
,
mtr
),
mtr
);
btr_page_get_level
(
page
,
mtr
),
mtr
,
mtr
);
new_page
=
buf_block_get_frame
(
new_block
);
new_page_zip
=
buf_block_get_page_zip
(
new_block
);
btr_page_create
(
new_block
,
new_page_zip
,
cursor
->
index
,
...
...
storage/innobase/btr/btr0cur.c
View file @
79a03447
...
...
@@ -2532,39 +2532,6 @@ return_after_reservations:
return
(
err
);
}
/**************************************************************//**
Commits a mini-transaction and starts it again in such a way that the
x-lock on index->lock and the x-latch on the cursor page are retained
across the commit. */
UNIV_INTERN
void
btr_cur_mtr_commit_and_start(
/*=========================*/
	btr_cur_t*	cursor,	/*!< in: cursor */
	mtr_t*		mtr)	/*!< in/out: mini-transaction */
{
	buf_block_t*	cur_block = btr_cur_get_block(cursor);

	/* The caller must hold both latches in mtr. */
	ut_ad(mtr_memo_contains(mtr, dict_index_get_lock(cursor->index),
				MTR_MEMO_X_LOCK));
	ut_ad(mtr_memo_contains(mtr, cur_block, MTR_MEMO_PAGE_X_FIX));

	/* Acquire each latch once more and buffer-fix the page again,
	so that the locks are kept across the mtr_commit(mtr). */
	rw_lock_x_lock(dict_index_get_lock(cursor->index));
	rw_lock_x_lock(&cur_block->lock);

	mutex_enter(&cur_block->mutex);
	buf_block_buf_fix_inc(cur_block, __FILE__, __LINE__);
	mutex_exit(&cur_block->mutex);

	/* Write out the redo log, then begin a fresh mini-transaction. */
	mtr_commit(mtr);
	mtr_start(mtr);

	/* Reassociate the locks with the mini-transaction.
	They will be released on mtr_commit(mtr). */
	mtr_memo_push(mtr, dict_index_get_lock(cursor->index),
		      MTR_MEMO_X_LOCK);
	mtr_memo_push(mtr, cur_block, MTR_MEMO_PAGE_X_FIX);
}
/*==================== B-TREE DELETE MARK AND UNMARK ===============*/
/****************************************************************//**
...
...
@@ -4190,6 +4157,9 @@ btr_store_big_rec_extern_fields_func(
the "external storage" flags in offsets
will not correspond to rec when
this function returns */
const
big_rec_t
*
big_rec_vec
,
/*!< in: vector containing fields
to be stored externally */
#ifdef UNIV_DEBUG
mtr_t
*
local_mtr
,
/*!< in: mtr containing the
latch to rec and to the tree */
...
...
@@ -4198,9 +4168,11 @@ btr_store_big_rec_extern_fields_func(
ibool
update_in_place
,
/*!< in: TRUE if the record is updated
in place (not delete+insert) */
#endif
/* UNIV_DEBUG || UNIV_BLOB_LIGHT_DEBUG */
const
big_rec_t
*
big_rec_vec
)
/*!< in: vector containing fields
to be stored externally */
mtr_t
*
alloc_mtr
)
/*!< in/out: in an insert, NULL;
in an update, local_mtr for
allocating BLOB pages and
updating BLOB pointers; alloc_mtr
must not have freed any leaf pages */
{
ulint
rec_page_no
;
byte
*
field_ref
;
...
...
@@ -4219,6 +4191,9 @@ btr_store_big_rec_extern_fields_func(
ut_ad
(
rec_offs_validate
(
rec
,
index
,
offsets
));
ut_ad
(
rec_offs_any_extern
(
offsets
));
ut_ad
(
local_mtr
);
ut_ad
(
!
alloc_mtr
||
alloc_mtr
==
local_mtr
);
ut_ad
(
!
update_in_place
||
alloc_mtr
);
ut_ad
(
mtr_memo_contains
(
local_mtr
,
dict_index_get_lock
(
index
),
MTR_MEMO_X_LOCK
));
ut_ad
(
mtr_memo_contains
(
local_mtr
,
rec_block
,
MTR_MEMO_PAGE_X_FIX
));
...
...
@@ -4234,6 +4209,25 @@ btr_store_big_rec_extern_fields_func(
rec_page_no
=
buf_block_get_page_no
(
rec_block
);
ut_a
(
fil_page_get_type
(
page_align
(
rec
))
==
FIL_PAGE_INDEX
);
if
(
alloc_mtr
)
{
/* Because alloc_mtr will be committed after
mtr, it is possible that the tablespace has been
extended when the B-tree record was updated or
inserted, or it will be extended while allocating
pages for big_rec.
TODO: In mtr (not alloc_mtr), write a redo log record
about extending the tablespace to its current size,
and remember the current size. Whenever the tablespace
grows as pages are allocated, write further redo log
records to mtr. (Currently tablespace extension is not
covered by the redo log. If it were, the record would
only be written to alloc_mtr, which is committed after
mtr.) */
}
else
{
alloc_mtr
=
&
mtr
;
}
if
(
UNIV_LIKELY_NULL
(
page_zip
))
{
int
err
;
...
...
@@ -4310,7 +4304,7 @@ btr_store_big_rec_extern_fields_func(
}
block
=
btr_page_alloc
(
index
,
hint_page_no
,
FSP_NO_DIR
,
0
,
&
mtr
);
FSP_NO_DIR
,
0
,
alloc_mtr
,
&
mtr
);
if
(
UNIV_UNLIKELY
(
block
==
NULL
))
{
mtr_commit
(
&
mtr
);
...
...
@@ -4437,11 +4431,15 @@ btr_store_big_rec_extern_fields_func(
goto
next_zip_page
;
}
rec_block
=
buf_page_get
(
space_id
,
zip_size
,
if
(
alloc_mtr
==
&
mtr
)
{
rec_block
=
buf_page_get
(
space_id
,
zip_size
,
rec_page_no
,
RW_X_LATCH
,
&
mtr
);
buf_block_dbg_add_level
(
rec_block
,
buf_block_dbg_add_level
(
rec_block
,
SYNC_NO_ORDER_CHECK
);
}
if
(
err
==
Z_STREAM_END
)
{
mach_write_to_4
(
field_ref
...
...
@@ -4475,7 +4473,8 @@ btr_store_big_rec_extern_fields_func(
page_zip_write_blob_ptr
(
page_zip
,
rec
,
index
,
offsets
,
big_rec_vec
->
fields
[
i
].
field_no
,
&
mtr
);
big_rec_vec
->
fields
[
i
].
field_no
,
alloc_mtr
);
next_zip_page:
prev_page_no
=
page_no
;
...
...
@@ -4520,19 +4519,23 @@ next_zip_page:
extern_len
-=
store_len
;
rec_block
=
buf_page_get
(
space_id
,
zip_size
,
if
(
alloc_mtr
==
&
mtr
)
{
rec_block
=
buf_page_get
(
space_id
,
zip_size
,
rec_page_no
,
RW_X_LATCH
,
&
mtr
);
buf_block_dbg_add_level
(
rec_block
,
buf_block_dbg_add_level
(
rec_block
,
SYNC_NO_ORDER_CHECK
);
}
mlog_write_ulint
(
field_ref
+
BTR_EXTERN_LEN
,
0
,
MLOG_4BYTES
,
&
mtr
);
MLOG_4BYTES
,
alloc_
mtr
);
mlog_write_ulint
(
field_ref
+
BTR_EXTERN_LEN
+
4
,
big_rec_vec
->
fields
[
i
].
len
-
extern_len
,
MLOG_4BYTES
,
&
mtr
);
MLOG_4BYTES
,
alloc_
mtr
);
if
(
prev_page_no
==
FIL_NULL
)
{
btr_blob_dbg_add_blob
(
...
...
@@ -4542,18 +4545,19 @@ next_zip_page:
mlog_write_ulint
(
field_ref
+
BTR_EXTERN_SPACE_ID
,
space_id
,
MLOG_4BYTES
,
&
mtr
);
space_id
,
MLOG_4BYTES
,
alloc_
mtr
);
mlog_write_ulint
(
field_ref
+
BTR_EXTERN_PAGE_NO
,
page_no
,
MLOG_4BYTES
,
&
mtr
);
page_no
,
MLOG_4BYTES
,
alloc_
mtr
);
mlog_write_ulint
(
field_ref
+
BTR_EXTERN_OFFSET
,
FIL_PAGE_DATA
,
MLOG_4BYTES
,
&
mtr
);
MLOG_4BYTES
,
alloc_mtr
);
}
prev_page_no
=
page_no
;
...
...
storage/innobase/buf/buf0buf.c
View file @
79a03447
...
...
@@ -1715,31 +1715,6 @@ buf_page_set_accessed_make_young(
}
}
/********************************************************************//**
Clears the check_index_page_at_flush field of a page, provided that the
page is found in the buffer pool as a file page. The lookup and the
update are done while holding the buffer pool mutex. */
UNIV_INTERN
void
buf_reset_check_index_page_at_flush(
/*================================*/
	ulint	space,	/*!< in: space id */
	ulint	offset)	/*!< in: page number */
{
	buf_pool_t*	pool = buf_pool_get(space, offset);
	buf_block_t*	found;

	buf_pool_mutex_enter(pool);

	found = (buf_block_t*) buf_page_hash_get(pool, space, offset);

	if (found) {
		/* Only blocks in the state BUF_BLOCK_FILE_PAGE
		are touched. */
		if (buf_block_get_state(found) == BUF_BLOCK_FILE_PAGE) {
			ut_ad(!buf_pool_watch_is_sentinel(pool,
							  &found->page));
			found->check_index_page_at_flush = FALSE;
		}
	}

	buf_pool_mutex_exit(pool);
}
/********************************************************************//**
Returns the current state of is_hashed of a page. FALSE if the page is
not in the pool. NOTE that this operation does not fix the page in the
...
...
storage/innobase/fsp/fsp0fsp.c
View file @
79a03447
This diff is collapsed.
Click to expand it.
storage/innobase/include/btr0btr.h
View file @
79a03447
...
...
@@ -568,7 +568,12 @@ btr_page_alloc(
page split is made */
ulint
level
,
/*!< in: level where the page is placed
in the tree */
mtr_t
*
mtr
);
/*!< in: mtr */
mtr_t
*
mtr
,
/*!< in/out: mini-transaction
for the allocation */
mtr_t
*
init_mtr
)
/*!< in/out: mini-transaction
for x-latching and initializing
the page */
__attribute__
((
nonnull
,
warn_unused_result
));
/**************************************************************//**
Frees a file page used in an index tree. NOTE: cannot free field external
storage pages because the page must contain info on its level. */
...
...
@@ -591,6 +596,33 @@ btr_page_free_low(
buf_block_t
*
block
,
/*!< in: block to be freed, x-latched */
ulint
level
,
/*!< in: page level */
mtr_t
*
mtr
);
/*!< in: mtr */
/**************************************************************//**
Marks all MTR_MEMO_FREE_CLUST_LEAF pages nonfree or free.
For invoking btr_store_big_rec_extern_fields() after an update,
we must temporarily mark freed clustered index pages allocated, so
that off-page columns will not be allocated from them. Between the
btr_store_big_rec_extern_fields() and mtr_commit() we have to
mark the pages free again, so that no pages will be leaked. */
UNIV_INTERN
void
btr_mark_freed_leaves
(
/*==================*/
dict_index_t
*
index
,
/*!< in/out: clustered index */
mtr_t
*
mtr
,
/*!< in/out: mini-transaction */
ibool
nonfree
)
/*!< in: TRUE=mark nonfree, FALSE=mark freed */
UNIV_COLD
__attribute__
((
nonnull
));
#ifdef UNIV_DEBUG
/**************************************************************//**
Validates all pages marked MTR_MEMO_FREE_CLUST_LEAF.
@see btr_mark_freed_leaves()
@return TRUE */
UNIV_INTERN
ibool
btr_freed_leaves_validate
(
/*======================*/
mtr_t
*
mtr
)
/*!< in: mini-transaction */
__attribute__
((
nonnull
,
warn_unused_result
));
#endif
/* UNIV_DEBUG */
#ifdef UNIV_BTR_PRINT
/*************************************************************//**
Prints size info of a B-tree. */
...
...
storage/innobase/include/btr0cur.h
View file @
79a03447
...
...
@@ -327,16 +327,6 @@ btr_cur_pessimistic_update(
que_thr_t
*
thr
,
/*!< in: query thread */
mtr_t
*
mtr
);
/*!< in: mtr; must be committed before
latching any further pages */
/*****************************************************************
Commits and restarts a mini-transaction so that it will retain an
x-lock on index->lock and the cursor page. */
UNIV_INTERN
void
btr_cur_mtr_commit_and_start
(
/*=========================*/
btr_cur_t
*
cursor
,
/*!< in: cursor */
mtr_t
*
mtr
)
/*!< in/out: mini-transaction */
UNIV_COLD
__attribute__
((
nonnull
));
/***********************************************************//**
Marks a clustered index record deleted. Writes an undo log record to
undo log on this delete marking. Writes in the trx id field the id
...
...
@@ -528,6 +518,8 @@ btr_store_big_rec_extern_fields_func(
the "external storage" flags in offsets
will not correspond to rec when
this function returns */
const
big_rec_t
*
big_rec_vec
,
/*!< in: vector containing fields
to be stored externally */
#ifdef UNIV_DEBUG
mtr_t
*
local_mtr
,
/*!< in: mtr containing the
latch to rec and to the tree */
...
...
@@ -536,9 +528,12 @@ btr_store_big_rec_extern_fields_func(
ibool
update_in_place
,
/*!< in: TRUE if the record is updated
in place (not delete+insert) */
#endif
/* UNIV_DEBUG || UNIV_BLOB_LIGHT_DEBUG */
const
big_rec_t
*
big_rec_vec
)
/*!< in: vector containing fields
to be stored externally */
__attribute__
((
nonnull
));
mtr_t
*
alloc_mtr
)
/*!< in/out: in an insert, NULL;
in an update, local_mtr for
allocating BLOB pages and
updating BLOB pointers; alloc_mtr
must not have freed any leaf pages */
__attribute__
((
nonnull
(
1
,
2
,
3
,
4
,
5
),
warn_unused_result
));
/** Stores the fields in big_rec_vec to the tablespace and puts pointers to
them in rec. The extern flags in rec will have to be set beforehand.
...
...
@@ -547,21 +542,22 @@ file segment of the index tree.
@param index in: clustered index; MUST be X-latched by mtr
@param b in/out: block containing rec; MUST be X-latched by mtr
@param rec in/out: clustered index record
@param offs
ets
in: rec_get_offsets(rec, index);
@param offs in: rec_get_offsets(rec, index);
the "external storage" flags in offsets will not be adjusted
@param big in: vector containing fields to be stored externally
@param mtr in: mini-transaction that holds x-latch on index and b
@param upd in: TRUE if the record is updated in place (not delete+insert)
@param
big in: vector containing fields to be stored externally
@param
rmtr in/out: in updates, the mini-transaction that holds rec
@return DB_SUCCESS or DB_OUT_OF_FILE_SPACE */
#ifdef UNIV_DEBUG
# define btr_store_big_rec_extern_fields(index,b,rec,offs
ets,mtr,upd,big
) \
btr_store_big_rec_extern_fields_func(index,b,rec,offs
ets,mtr,upd,big
)
# define btr_store_big_rec_extern_fields(index,b,rec,offs
,big,mtr,upd,rmtr
) \
btr_store_big_rec_extern_fields_func(index,b,rec,offs
,big,mtr,upd,rmtr
)
#elif defined UNIV_BLOB_LIGHT_DEBUG
# define btr_store_big_rec_extern_fields(index,b,rec,offs
ets,mtr,upd,big
) \
btr_store_big_rec_extern_fields_func(index,b,rec,offs
ets,upd,big
)
# define btr_store_big_rec_extern_fields(index,b,rec,offs
,big,mtr,upd,rmtr
) \
btr_store_big_rec_extern_fields_func(index,b,rec,offs
,big,upd,rmtr
)
#else
# define btr_store_big_rec_extern_fields(index,b,rec,offs
ets,mtr,upd,big
) \
btr_store_big_rec_extern_fields_func(index,b,rec,offs
ets,big
)
# define btr_store_big_rec_extern_fields(index,b,rec,offs
,big,mtr,upd,rmtr
) \
btr_store_big_rec_extern_fields_func(index,b,rec,offs
,big,rmtr
)
#endif
/*******************************************************************//**
...
...
storage/innobase/include/buf0buf.h
View file @
79a03447
...
...
@@ -491,15 +491,6 @@ buf_page_peek(
/*==========*/
ulint
space
,
/*!< in: space id */
ulint
offset
);
/*!< in: page number */
/********************************************************************//**
Resets the check_index_page_at_flush field of a page if found in the buffer
pool. */
UNIV_INTERN
void
buf_reset_check_index_page_at_flush
(
/*================================*/
ulint
space
,
/*!< in: space id */
ulint
offset
);
/*!< in: page number */
#if defined UNIV_DEBUG_FILE_ACCESSES || defined UNIV_DEBUG
/********************************************************************//**
Sets file_page_was_freed TRUE if the page is found in the buffer pool.
...
...
storage/innobase/include/fsp0fsp.h
View file @
79a03447
/*****************************************************************************
Copyright (c) 1995, 20
09, Innobase Oy
. All Rights Reserved.
Copyright (c) 1995, 20
11, Oracle and/or its affiliates
. All Rights Reserved.
This program is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free Software
...
...
@@ -176,19 +176,18 @@ fseg_n_reserved_pages(
Allocates a single free page from a segment. This function implements
the intelligent allocation strategy which tries to minimize
file space fragmentation.
@return the allocated page offset FIL_NULL if no page could be allocated */
UNIV_INTERN
ulint
fseg_alloc_free_page
(
/*=================*/
fseg_header_t
*
seg_header
,
/*!< in: segment header */
ulint
hint
,
/*!< in: hint of which page would be desirable */
byte
direction
,
/*!< in: if the new page is needed because
@param[in,out] seg_header segment header
@param[in] hint hint of which page would be desirable
@param[in] direction if the new page is needed because
of an index page split, and records are
inserted there in order, into which
direction they go alphabetically: FSP_DOWN,
FSP_UP, FSP_NO_DIR */
mtr_t
*
mtr
);
/*!< in: mtr handle */
FSP_UP, FSP_NO_DIR
@param[in,out] mtr mini-transaction
@return the allocated page offset, or FIL_NULL if no page could be allocated */
/* Convenience wrapper around fseg_alloc_free_page_general(): it passes
FALSE as the fourth argument and passes mtr as both of the last two
arguments. NOTE: the mtr argument is expanded twice, so it must be an
expression without side effects. */
#define fseg_alloc_free_page(seg_header, hint, direction, mtr) \
fseg_alloc_free_page_general(seg_header, hint, direction, \
FALSE, mtr, mtr)
/**********************************************************************//**
Allocates a single free page from a segment. This function implements
the intelligent allocation strategy which tries to minimize file space
...
...
@@ -198,7 +197,7 @@ UNIV_INTERN
ulint
fseg_alloc_free_page_general
(
/*=========================*/
fseg_header_t
*
seg_header
,
/*!< in: segment header */
fseg_header_t
*
seg_header
,
/*!< in
/out
: segment header */
ulint
hint
,
/*!< in: hint of which page would be desirable */
byte
direction
,
/*!< in: if the new page is needed because
of an index page split, and records are
...
...
@@ -210,7 +209,12 @@ fseg_alloc_free_page_general(
with fsp_reserve_free_extents, then there
is no need to do the check for this individual
page */
mtr_t
*
mtr
);
/*!< in: mtr handle */
mtr_t
*
mtr
,
/*!< in/out: mini-transaction */
mtr_t
*
init_mtr
)
/*!< in/out: mtr or another mini-transaction
in which the page should be initialized,
or NULL if this is a "fake allocation" of
a page that was previously freed in mtr */
__attribute__
((
warn_unused_result
,
nonnull
(
1
,
5
)));
/**********************************************************************//**
Reserves free pages from a tablespace. All mini-transactions which may
use several pages from the tablespace should call this function beforehand
...
...
storage/innobase/include/mtr0mtr.h
View file @
79a03447
/*****************************************************************************
Copyright (c) 1995, 20
09, Innobase Oy
. All Rights Reserved.
Copyright (c) 1995, 20
11, Oracle and/or its affiliates
. All Rights Reserved.
This program is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free Software
...
...
@@ -53,6 +53,8 @@ first 3 values must be RW_S_LATCH, RW_X_LATCH, RW_NO_LATCH */
#define MTR_MEMO_MODIFY 54
#define MTR_MEMO_S_LOCK 55
#define MTR_MEMO_X_LOCK 56
/** The mini-transaction freed a clustered index leaf page. */
#define MTR_MEMO_FREE_CLUST_LEAF 57
/** @name Log item types
The log items are declared 'byte' so that the compiler can warn if val
...
...
@@ -378,11 +380,14 @@ struct mtr_struct{
#endif
dyn_array_t
memo
;
/*!< memo stack for locks etc. */
dyn_array_t
log
;
/*!< mini-transaction log */
ibool
inside_ibuf
;
unsigned
inside_ibuf
:
1
;
/*!< TRUE if inside ibuf changes */
ibool
modifications
;
/* TRUE if the mtr made modifications to
buffer pool pages */
unsigned
modifications
:
1
;
/*!< TRUE if the mini-transaction
modified buffer pool pages */
unsigned
freed_clust_leaf
:
1
;
/*!< TRUE if MTR_MEMO_FREE_CLUST_LEAF
was logged in the mini-transaction */
ulint
n_log_recs
;
/* count of how many page initial log records
have been written to the mtr log */
...
...
storage/innobase/include/mtr0mtr.ic
View file @
79a03447
/*****************************************************************************
Copyright (c) 1995, 201
0, Innobase Oy
. All Rights Reserved.
Copyright (c) 1995, 201
1, Oracle and/or its affiliates
. All Rights Reserved.
This program is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free Software
...
...
@@ -43,8 +43,9 @@ mtr_start(
dyn_array_create(&(mtr->log));
mtr->log_mode = MTR_LOG_ALL;
mtr->modifications = FALSE;
mtr->inside_ibuf = FALSE;
mtr->modifications = FALSE;
mtr->freed_clust_leaf = FALSE;
mtr->n_log_recs = 0;
ut_d(mtr->state = MTR_ACTIVE);
...
...
@@ -66,7 +67,8 @@ mtr_memo_push(
ut_ad(object);
ut_ad(type >= MTR_MEMO_PAGE_S_FIX);
ut_ad(type <= MTR_MEMO_X_LOCK);
ut_ad(type <= MTR_MEMO_FREE_CLUST_LEAF);
ut_ad(type != MTR_MEMO_FREE_CLUST_LEAF || mtr->freed_clust_leaf);
ut_ad(mtr);
ut_ad(mtr->magic_n == MTR_MAGIC_N);
ut_ad(mtr->state == MTR_ACTIVE);
...
...
storage/innobase/mtr/mtr0mtr.c
View file @
79a03447
/*****************************************************************************
Copyright (c) 1995, 20
09, Innobase Oy
. All Rights Reserved.
Copyright (c) 1995, 20
11, Oracle and/or its affiliates
. All Rights Reserved.
This program is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free Software
...
...
@@ -64,12 +64,11 @@ mtr_memo_slot_release(
buf_page_release
((
buf_block_t
*
)
object
,
type
);
}
else
if
(
type
==
MTR_MEMO_S_LOCK
)
{
rw_lock_s_unlock
((
rw_lock_t
*
)
object
);
#ifdef UNIV_DEBUG
}
else
if
(
type
!=
MTR_MEMO_X_LOCK
)
{
ut_ad
(
type
==
MTR_MEMO_MODIFY
);
ut_ad
(
type
==
MTR_MEMO_MODIFY
||
type
==
MTR_MEMO_FREE_CLUST_LEAF
);
ut_ad
(
mtr_memo_contains
(
mtr
,
object
,
MTR_MEMO_PAGE_X_FIX
));
#endif
/* UNIV_DEBUG */
}
else
{
rw_lock_x_unlock
((
rw_lock_t
*
)
object
);
}
...
...
storage/innobase/row/row0ins.c
View file @
79a03447
...
...
@@ -2088,15 +2088,20 @@ row_ins_index_entry_low(
if
(
big_rec
)
{
ut_a
(
err
==
DB_SUCCESS
);
/* Write out the externally stored
columns while still x-latching
index->lock and block->lock. We have
to mtr_commit(mtr) first, so that the
redo log will be written in the
correct order. Otherwise, we would run
into trouble on crash recovery if mtr
freed B-tree pages on which some of
the big_rec fields will be written. */
btr_cur_mtr_commit_and_start
(
&
cursor
,
&
mtr
);
columns, but allocate the pages and
write the pointers using the
mini-transaction of the record update.
If any pages were freed in the update,
temporarily mark them allocated so
that off-page columns will not
overwrite them. We must do this,
because we will write the redo log for
the BLOB writes before writing the
redo log for the record update. Thus,
redo log application at crash recovery
will see BLOBs being written to free pages. */
btr_mark_freed_leaves
(
index
,
&
mtr
,
TRUE
);
rec
=
btr_cur_get_rec
(
&
cursor
);
offsets
=
rec_get_offsets
(
...
...
@@ -2105,7 +2110,8 @@ row_ins_index_entry_low(
err
=
btr_store_big_rec_extern_fields
(
index
,
btr_cur_get_block
(
&
cursor
),
rec
,
offsets
,
&
mtr
,
FALSE
,
big_rec
);
rec
,
offsets
,
big_rec
,
&
mtr
,
FALSE
,
&
mtr
);
/* If writing big_rec fails (for
example, because of DB_OUT_OF_FILE_SPACE),
the record will be corrupted. Even if
...
...
@@ -2118,6 +2124,9 @@ row_ins_index_entry_low(
undo log, and thus the record cannot
be rolled back. */
ut_a
(
err
==
DB_SUCCESS
);
/* Free the pages again
in order to avoid a leak. */
btr_mark_freed_leaves
(
index
,
&
mtr
,
FALSE
);
goto
stored_big_rec
;
}
}
else
{
...
...
@@ -2159,7 +2168,7 @@ function_exit:
err
=
btr_store_big_rec_extern_fields
(
index
,
btr_cur_get_block
(
&
cursor
),
rec
,
offsets
,
&
mtr
,
FALSE
,
big_rec
);
rec
,
offsets
,
big_rec
,
&
mtr
,
FALSE
,
NULL
);
stored_big_rec:
if
(
modify
)
{
...
...
@@ -2434,7 +2443,7 @@ row_ins(
node
->
index
=
dict_table_get_next_index
(
node
->
index
);
node
->
entry
=
UT_LIST_GET_NEXT
(
tuple_list
,
node
->
entry
);
/* Skip corrupted secondar index and its entry */
/* Skip corrupted secondary index and its entry */
while
(
node
->
index
&&
dict_index_is_corrupted
(
node
->
index
))
{
node
->
index
=
dict_table_get_next_index
(
node
->
index
);
...
...
storage/innobase/row/row0row.c
View file @
79a03447
...
...
@@ -243,19 +243,20 @@ row_build(
}
#if defined UNIV_DEBUG || defined UNIV_BLOB_LIGHT_DEBUG
/* This condition can occur during crash recovery before
trx_rollback_active() has completed execution.
if
(
rec_offs_any_null_extern
(
rec
,
offsets
))
{
/* This condition can occur during crash recovery
before trx_rollback_active() has completed execution.
This condition is possible if the server crashed
during an insert or update
before
during an insert or update-by-delete-and-insert
before
btr_store_big_rec_extern_fields() did mtr_commit() all
BLOB pointers to the clustered index record.
If the record contains a null BLOB pointer, look up the
transaction that holds the implicit lock on this record, and
assert that it was recovered (and will soon be rolled back). */
ut_a
(
!
rec_offs_any_null_extern
(
rec
,
offsets
)
||
trx_assert_recovered
(
row_get_rec_trx_id
(
rec
,
index
,
offsets
)));
BLOB pointers to the freshly inserted clustered index
record. */
ut_a
(
trx_assert_recovered
(
row_get_rec_trx_id
(
rec
,
index
,
offsets
)));
ut_a
(
trx_undo_roll_ptr_is_insert
(
row_get_rec_roll_ptr
(
rec
,
index
,
offsets
)));
}
#endif
/* UNIV_DEBUG || UNIV_BLOB_LIGHT_DEBUG */
if
(
type
!=
ROW_COPY_POINTERS
)
{
...
...
storage/innobase/row/row0upd.c
View file @
79a03447
...
...
@@ -2008,21 +2008,22 @@ row_upd_clust_rec(
rec_offs_init
(
offsets_
);
ut_a
(
err
==
DB_SUCCESS
);
/* Write out the externally stored columns while still
x-latching index->lock and block->lock. We have to
mtr_commit(mtr) first, so that the redo log will be
written in the correct order. Otherwise, we would run
into trouble on crash recovery if mtr freed B-tree
pages on which some of the big_rec fields will be
written. */
btr_cur_mtr_commit_and_start
(
btr_cur
,
mtr
);
/* Write out the externally stored columns, but
allocate the pages and write the pointers using the
mini-transaction of the record update. If any pages
were freed in the update, temporarily mark them
allocated so that off-page columns will not overwrite
them. We must do this, because we write the redo log
for the BLOB writes before writing the redo log for
the record update. */
btr_mark_freed_leaves
(
index
,
mtr
,
TRUE
);
rec
=
btr_cur_get_rec
(
btr_cur
);
err
=
btr_store_big_rec_extern_fields
(
index
,
btr_cur_get_block
(
btr_cur
),
rec
,
rec_get_offsets
(
rec
,
index
,
offsets_
,
ULINT_UNDEFINED
,
&
heap
),
mtr
,
TRUE
,
big_rec
);
big_rec
,
mtr
,
TRUE
,
mtr
);
/* If writing big_rec fails (for example, because of
DB_OUT_OF_FILE_SPACE), the record will be corrupted.
Even if we did not update any externally stored
...
...
@@ -2032,6 +2033,8 @@ row_upd_clust_rec(
to the undo log, and thus the record cannot be rolled
back. */
ut_a
(
err
==
DB_SUCCESS
);
/* Free the pages again in order to avoid a leak. */
btr_mark_freed_leaves
(
index
,
mtr
,
FALSE
);
}
mtr_commit
(
mtr
);
...
...
storage/innobase/trx/trx0undo.c
View file @
79a03447
/*****************************************************************************
Copyright (c) 1996, 2009, Innobase Oy. All Rights Reserved.
Copyright (c) 1996, 2011, Oracle and/or its affiliates. All Rights Reserved.
This program is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free Software
...
...
@@ -918,7 +918,7 @@ trx_undo_add_page(
page_no
=
fseg_alloc_free_page_general
(
header_page
+
TRX_UNDO_SEG_HDR
+
TRX_UNDO_FSEG_HEADER
,
undo
->
top_page_no
+
1
,
FSP_UP
,
TRUE
,
mtr
);
TRUE
,
mtr
,
mtr
);
fil_space_release_free_extents
(
undo
->
space
,
n_reserved
);
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment