Commit 2945f773 authored by Jon Olav Hauglid's avatar Jon Olav Hauglid

Backport of revno: 2617.68.37

Bug #46654 False deadlock on concurrent DML/DDL with partitions, 
           inconsistent behavior

The problem was that if one connection is running a multi-statement 
transaction which involves a single partitioned table, and another 
connection attempts to alter the table, the first connection gets 
ER_LOCK_DEADLOCK and cannot proceed anymore, even when the ALTER TABLE 
statement in another connection has timed out or failed.

The reason for this was that the prepare phase for ALTER TABLE for 
partitioned tables removed all instances of the table from the table 
definition cache before it started waiting on the lock. The transaction 
running in the first connection would notice this and report ER_LOCK_DEADLOCK. 

This patch changes the prep_alter_part_table() ALTER TABLE code so that 
tdc_remove_table() is no longer called. Instead, only the TABLE instance
changed by prep_alter_part_table() is marked as needing reopen.

The patch also removes an unnecessary call to tdc_remove_table() from 
mysql_unpack_partition() as the changed TABLE object is destroyed by the 
caller at a later point.

Test case added in partition_sync.test.
parent 28b0eeff
# Disabled until Bug#46654 False deadlock on concurrent DML/DDL # Disabled until Bug#46654 False deadlock on concurrent DML/DDL
# with partitions, inconsistent behavior is backported # with partitions, inconsistent behavior is backported
#
# Bug #46654 False deadlock on concurrent DML/DDL
# with partitions, inconsistent behavior
#
DROP TABLE IF EXISTS tbl_with_partitions;
CREATE TABLE tbl_with_partitions ( i INT )
PARTITION BY HASH(i);
INSERT INTO tbl_with_partitions VALUES (1);
# Connection 3
LOCK TABLE tbl_with_partitions READ;
# Connection 1
# Access table with disabled autocommit
SET AUTOCOMMIT = 0;
SELECT * FROM tbl_with_partitions;
i
1
# Connection 2
# Alter table, abort after prepare
set session debug="+d,abort_copy_table";
ALTER TABLE tbl_with_partitions ADD COLUMN f INT;
ERROR HY000: Lock wait timeout exceeded; try restarting transaction
# Connection 1
# Try accessing the table after Alter aborted.
# This used to give ER_LOCK_DEADLOCK.
SELECT * FROM tbl_with_partitions;
i
1
# Connection 3
UNLOCK TABLES;
# Connection 1
# Cleanup
DROP TABLE tbl_with_partitions;
...@@ -39,6 +39,57 @@ ...@@ -39,6 +39,57 @@
#DROP TABLE t1; #DROP TABLE t1;
--echo #
--echo # Bug #46654 False deadlock on concurrent DML/DDL
--echo # with partitions, inconsistent behavior
--echo #
--disable_warnings
DROP TABLE IF EXISTS tbl_with_partitions;
--enable_warnings
CREATE TABLE tbl_with_partitions ( i INT )
PARTITION BY HASH(i);
INSERT INTO tbl_with_partitions VALUES (1);
connect(con2,localhost,root);
connect(con3,localhost,root);
--echo # Connection 3
connection con3;
LOCK TABLE tbl_with_partitions READ;
--echo # Connection 1
--echo # Access table with disabled autocommit
connection default;
SET AUTOCOMMIT = 0;
SELECT * FROM tbl_with_partitions;
--echo # Connection 2
--echo # Alter table, abort after prepare
connection con2;
set session debug="+d,abort_copy_table";
--error ER_LOCK_WAIT_TIMEOUT
ALTER TABLE tbl_with_partitions ADD COLUMN f INT;
--echo # Connection 1
--echo # Try accessing the table after Alter aborted.
--echo # This used to give ER_LOCK_DEADLOCK.
connection default;
SELECT * FROM tbl_with_partitions;
--echo # Connection 3
connection con3;
UNLOCK TABLES;
--echo # Connection 1
--echo # Cleanup
connection default;
disconnect con2;
disconnect con3;
DROP TABLE tbl_with_partitions;
# Check that all connections opened by test cases in this file are really # Check that all connections opened by test cases in this file are really
# gone so execution of other tests won't be affected by their presence. # gone so execution of other tests won't be affected by their presence.
--source include/wait_until_count_sessions.inc --source include/wait_until_count_sessions.inc
...@@ -1530,8 +1530,8 @@ bool close_thread_table(THD *thd, TABLE **table_ptr) ...@@ -1530,8 +1530,8 @@ bool close_thread_table(THD *thd, TABLE **table_ptr)
*table_ptr=table->next; *table_ptr=table->next;
table->mdl_ticket= NULL; table->mdl_ticket= NULL;
if (table->needs_reopen() || if (table->s->needs_reopen() ||
thd->version != refresh_version || !table->db_stat || thd->version != refresh_version || table->needs_reopen() ||
table_def_shutdown_in_progress) table_def_shutdown_in_progress)
{ {
free_cache_entry(table); free_cache_entry(table);
...@@ -8186,13 +8186,13 @@ bool mysql_notify_thread_having_shared_lock(THD *thd, THD *in_use) ...@@ -8186,13 +8186,13 @@ bool mysql_notify_thread_having_shared_lock(THD *thd, THD *in_use)
thd_table= thd_table->next) thd_table= thd_table->next)
{ {
/* /*
Check for TABLE::db_stat is needed since in some places we call Check for TABLE::needs_reopen() is needed since in some places we call
handler::close() for table instance (and set TABLE::db_stat to 0) handler::close() for table instance (and set TABLE::db_stat to 0)
and do not remove such instances from the THD::open_tables and do not remove such instances from the THD::open_tables
for some time, during which other thread can see those instances for some time, during which other thread can see those instances
(e.g. see partitioning code). (e.g. see partitioning code).
*/ */
if (thd_table->db_stat) if (!thd_table->needs_reopen())
signalled|= mysql_lock_abort_for_thread(thd, thd_table); signalled|= mysql_lock_abort_for_thread(thd, thd_table);
} }
pthread_mutex_unlock(&LOCK_open); pthread_mutex_unlock(&LOCK_open);
......
...@@ -820,7 +820,7 @@ void mysql_ha_flush(THD *thd) ...@@ -820,7 +820,7 @@ void mysql_ha_flush(THD *thd)
if (hash_tables->table && if (hash_tables->table &&
(hash_tables->table->mdl_ticket && (hash_tables->table->mdl_ticket &&
hash_tables->table->mdl_ticket->has_pending_conflicting_lock() || hash_tables->table->mdl_ticket->has_pending_conflicting_lock() ||
hash_tables->table->needs_reopen())) hash_tables->table->s->needs_reopen()))
mysql_ha_close_table(thd, hash_tables); mysql_ha_close_table(thd, hash_tables);
} }
......
...@@ -2657,7 +2657,7 @@ bool Delayed_insert::handle_inserts(void) ...@@ -2657,7 +2657,7 @@ bool Delayed_insert::handle_inserts(void)
thd_proc_info(&thd, "insert"); thd_proc_info(&thd, "insert");
max_rows= delayed_insert_limit; max_rows= delayed_insert_limit;
if (thd.killed || table->needs_reopen()) if (thd.killed || table->s->needs_reopen())
{ {
thd.killed= THD::KILL_CONNECTION; thd.killed= THD::KILL_CONNECTION;
max_rows= ULONG_MAX; // Do as much as possible max_rows= ULONG_MAX; // Do as much as possible
......
...@@ -4183,15 +4183,13 @@ bool mysql_unpack_partition(THD *thd, ...@@ -4183,15 +4183,13 @@ bool mysql_unpack_partition(THD *thd,
We need to free any memory objects allocated on item_free_list We need to free any memory objects allocated on item_free_list
by the parser since we are keeping the old info from the first by the parser since we are keeping the old info from the first
parser call in CREATE TABLE. parser call in CREATE TABLE.
We'll ensure that this object isn't put into table cache also
just to ensure we don't get into strange situations with the This table object can not be used any more. However, since
item objects. this is CREATE TABLE, we know that it will be destroyed by the
caller, and rely on that.
*/ */
thd->free_items(); thd->free_items();
part_info= thd->work_part_info; part_info= thd->work_part_info;
tdc_remove_table(thd, TDC_RT_REMOVE_UNUSED,
table->s->db.str,
table->s->table_name.str);
*work_part_info_used= true; *work_part_info_used= true;
} }
table->part_info= part_info; table->part_info= part_info;
...@@ -4484,17 +4482,11 @@ uint prep_alter_part_table(THD *thd, TABLE *table, Alter_info *alter_info, ...@@ -4484,17 +4482,11 @@ uint prep_alter_part_table(THD *thd, TABLE *table, Alter_info *alter_info,
/* /*
We are going to manipulate the partition info on the table object We are going to manipulate the partition info on the table object
so we need to ensure that the table instances cached and all other so we need to ensure that the table instance is removed from the
instances are properly closed. table cache.
*/ */
if (table->part_info) if (table->part_info)
{ table->m_needs_reopen= TRUE;
pthread_mutex_lock(&LOCK_open);
tdc_remove_table(thd, TDC_RT_REMOVE_UNUSED,
table->s->db.str,
table->s->table_name.str);
pthread_mutex_unlock(&LOCK_open);
}
thd->work_part_info= thd->lex->part_info; thd->work_part_info= thd->lex->part_info;
if (thd->work_part_info && if (thd->work_part_info &&
......
...@@ -7049,6 +7049,10 @@ view_err: ...@@ -7049,6 +7049,10 @@ view_err:
new_table->timestamp_field_type= TIMESTAMP_NO_AUTO_SET; new_table->timestamp_field_type= TIMESTAMP_NO_AUTO_SET;
new_table->next_number_field=new_table->found_next_number_field; new_table->next_number_field=new_table->found_next_number_field;
thd_proc_info(thd, "copy to tmp table"); thd_proc_info(thd, "copy to tmp table");
DBUG_EXECUTE_IF("abort_copy_table", {
my_error(ER_LOCK_WAIT_TIMEOUT, MYF(0));
goto err_new_table_cleanup;
});
error= copy_data_between_tables(table, new_table, error= copy_data_between_tables(table, new_table,
alter_info->create_list, ignore, alter_info->create_list, ignore,
order_num, order, &copied, &deleted, order_num, order, &copied, &deleted,
......
...@@ -294,6 +294,8 @@ TABLE_CATEGORY get_table_category(const LEX_STRING *db, ...@@ -294,6 +294,8 @@ TABLE_CATEGORY get_table_category(const LEX_STRING *db,
struct TABLE_share; struct TABLE_share;
extern ulong refresh_version;
/* /*
This structure is shared between different table objects. There is one This structure is shared between different table objects. There is one
instance of table share per one table in the database. instance of table share per one table in the database.
...@@ -503,6 +505,14 @@ struct TABLE_SHARE ...@@ -503,6 +505,14 @@ struct TABLE_SHARE
return table_map_id; return table_map_id;
} }
/*
Must all TABLEs be reopened?
*/
inline bool needs_reopen()
{
return version != refresh_version;
}
/** /**
Convert unrelated members of TABLE_SHARE to one enum Convert unrelated members of TABLE_SHARE to one enum
representing its type. representing its type.
...@@ -605,8 +615,6 @@ struct TABLE_SHARE ...@@ -605,8 +615,6 @@ struct TABLE_SHARE
}; };
extern ulong refresh_version;
/* Information for one open table */ /* Information for one open table */
enum index_hint_type enum index_hint_type
{ {
...@@ -804,6 +812,7 @@ public: ...@@ -804,6 +812,7 @@ public:
my_bool insert_or_update; /* Can be used by the handler */ my_bool insert_or_update; /* Can be used by the handler */
my_bool alias_name_used; /* true if table_name is alias */ my_bool alias_name_used; /* true if table_name is alias */
my_bool get_fields_in_item_tree; /* Signal to fix_field */ my_bool get_fields_in_item_tree; /* Signal to fix_field */
my_bool m_needs_reopen;
REGINFO reginfo; /* field connections */ REGINFO reginfo; /* field connections */
MEM_ROOT mem_root; MEM_ROOT mem_root;
...@@ -853,7 +862,7 @@ public: ...@@ -853,7 +862,7 @@ public:
Is this instance of the table should be reopen? Is this instance of the table should be reopen?
*/ */
inline bool needs_reopen() inline bool needs_reopen()
{ return s->version != refresh_version; } { return !db_stat || m_needs_reopen; }
}; };
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment