Description:
When a xa transaction is commited and the server crashed, then restart the MySQL server, first, do xa start with the exist xid, says: XAER_DUPID: The XID already exists, but this xid has been submitted.
This is why?
slave replication info:
mysql> show slave status\G
*************************** 1. row ***************************
Slave_IO_State:
Master_Host: 172.16.90.233
Master_User: repl
Master_Port: 3390
Connect_Retry: 60
Master_Log_File: my1binlog.000001
Read_Master_Log_Pos: 12598508
Relay_Log_File: relay-log-23490.000010
Relay_Log_Pos: 9748
Relay_Master_Log_File: my1binlog.000001
................
................
Replicate_Wild_Ignore_Table:
Last_Errno: 1440
Last_Error: Error 'XAER_DUPID: The XID already exists' on query. Default database: 'test'. Query: 'XA START X'30',X'',1'
Skip_Counter: 0
................
................
Last_SQL_Errno: 1440
Last_SQL_Error: Error 'XAER_DUPID: The XID already exists' on query. Default database: 'test'. Query: 'XA START X'30',X'',1'
Replicate_Ignore_Server_Ids:
Master_Server_Id: 23390
Master_UUID: 5d94dc1a-8204-11e6-92ee-5254005428f4
Master_Info_File: mysql.slave_master_info
SQL_Delay: 0
................
................
Master_SSL_Crlpath:
Retrieved_Gtid_Set: 5d94dc1a-8204-11e6-92ee-5254005428f4:23380-29377
Executed_Gtid_Set: 5d94dc1a-8204-11e6-92ee-5254005428f4:1-23402
1 row in set (0.00 sec)
master <my1binlog.000001> info:
# at 10246088
#160927 2:53:55 server id 23390 end_log_pos 10246153 CRC32 0x004cd64d GTID last_committed=23359 sequence_number=23369
SET @@SESSION.GTID_NEXT= '5d94dc1a-8204-11e6-92ee-5254005428f4:23369'/*!*/;
# at 10246153
#160927 2:53:55 server id 23390 end_log_pos 10246240 CRC32 0x20efecf6 Query thread_id=187 exec_time=0 error_code=0
SET TIMESTAMP=1474916035/*!*/;
XA START X'30',X'',1
/*!*/;
# at 10246240
#160927 2:53:55 server id 23390 end_log_pos 10246297 CRC32 0xf4e0417e Table_map: `test`.`part_table` mapped to number 119
# at 10246297
#160927 2:53:55 server id 23390 end_log_pos 10246341 CRC32 0xcdc10c06 Write_rows: table id 119 flags: STMT_END_F
BINLOG '
w27pVxNeWwAAOQAAAJlYnAAAAHcAAAAAAAEABHRlc3QACnBhcnRfdGFibGUAAwMDDwI8AAZ+QeD0
w27pVx5eWwAALAAAAMVYnAAAAHcAAAAAAAEAAgAD//yaMwAAgwwAAAYMwc0=
'/*!*/;
### INSERT INTO `test`.`part_table`
### SET
### @1=13210 /* INT meta=0 nullable=0 is_null=0 */
### @2=3203 /* INT meta=0 nullable=1 is_null=0 */
### @3=NULL /* VARSTRING(60) meta=60 nullable=1 is_null=1 */
# at 10246341
#160927 2:53:55 server id 23390 end_log_pos 10246398 CRC32 0xd8d0ee8d Table_map: `test`.`norm_table` mapped to number 118
# at 10246398
#160927 2:53:55 server id 23390 end_log_pos 10246442 CRC32 0x252d14d7 Write_rows: table id 118 flags: STMT_END_F
BINLOG '
w27pVxNeWwAAOQAAAP5YnAAAAHYAAAAAAAEABHRlc3QACm5vcm1fdGFibGUAAwMDDwI8AAaN7tDY
w27pVx5eWwAALAAAACpZnAAAAHYAAAAAAAEAAgAD//yaMwAAgwwAANcULSU=
'/*!*/;
### INSERT INTO `test`.`norm_table`
### SET
### @1=13210 /* INT meta=0 nullable=0 is_null=0 */
### @2=3203 /* INT meta=0 nullable=1 is_null=0 */
### @3=NULL /* VARSTRING(60) meta=60 nullable=1 is_null=1 */
# at 10246442
#160927 2:53:55 server id 23390 end_log_pos 10246527 CRC32 0xbd0250ad Query thread_id=187 exec_time=0 error_code=0
SET TIMESTAMP=1474916035/*!*/;
XA END X'30',X'',1
/*!*/;
# at 10246527
#160927 2:53:55 server id 23390 end_log_pos 10246564 CRC32 0xb2dd9b80 XA PREPARE X'30',X'',1
XA PREPARE X'30',X'',1
/*!*/;
..........
..........
..........
# at 10249978
#160927 2:53:55 server id 23390 end_log_pos 10250043 CRC32 0x1386b346 GTID last_committed=23369 sequence_number=23379
SET @@SESSION.GTID_NEXT= '5d94dc1a-8204-11e6-92ee-5254005428f4:23379'/*!*/;
# at 10250043
#160927 2:53:55 server id 23390 end_log_pos 10250131 CRC32 0x8722aed0 Query thread_id=187 exec_time=0 error_code=0
SET TIMESTAMP=1474916035/*!*/;
XA COMMIT X'30',X'',1
/*!*/;
Here you can see the master has been submitted.
slave binary log:
# at 1941042
#160927 2:53:55 server id 23390 end_log_pos 1941107 CRC32 0x2bce1b66 GTID last_committed=4771 sequence_number=4772
SET @@SESSION.GTID_NEXT= '5d94dc1a-8204-11e6-92ee-5254005428f4:23369'/*!*/;
# at 1941107
#160927 2:53:55 server id 23390 end_log_pos 1941185 CRC32 0xf3bce965 Query thread_id=187 exec_time=12 error_code=0
SET TIMESTAMP=1474916035/*!*/;
SET @@session.sql_mode=524288/*!*/;
XA START X'30',X'',1
/*!*/;
# at 1941185
#160927 2:53:55 server id 23390 end_log_pos 1941242 CRC32 0xeadf1e6a Table_map: `test`.`part_table` mapped to number 108
# at 1941242
#160927 2:53:55 server id 23390 end_log_pos 1941286 CRC32 0xad5c60d7 Write_rows: table id 108 flags: STMT_END_F
BINLOG '
w27pVxNeWwAAOQAAAPqeHQAAAGwAAAAAAAEABHRlc3QACnBhcnRfdGFibGUAAwMDDwI8AAZqHt/q
w27pVx5eWwAALAAAACafHQAAAGwAAAAAAAEAAgAD//yaMwAAgwwAANdgXK0=
'/*!*/;
### INSERT INTO `test`.`part_table`
### SET
### @1=13210 /* INT meta=0 nullable=0 is_null=0 */
### @2=3203 /* INT meta=0 nullable=1 is_null=0 */
### @3=NULL /* VARSTRING(60) meta=60 nullable=1 is_null=1 */
# at 1941286
#160927 2:53:55 server id 23390 end_log_pos 1941343 CRC32 0xa21c9d71 Table_map: `test`.`norm_table` mapped to number 109
# at 1941343
#160927 2:53:55 server id 23390 end_log_pos 1941387 CRC32 0xdd164306 Write_rows: table id 109 flags: STMT_END_F
BINLOG '
w27pVxNeWwAAOQAAAF+fHQAAAG0AAAAAAAEABHRlc3QACm5vcm1fdGFibGUAAwMDDwI8AAZxnRyi
w27pVx5eWwAALAAAAIufHQAAAG0AAAAAAAEAAgAD//yaMwAAgwwAAAZDFt0=
'/*!*/;
### INSERT INTO `test`.`norm_table`
### SET
### @1=13210 /* INT meta=0 nullable=0 is_null=0 */
### @2=3203 /* INT meta=0 nullable=1 is_null=0 */
### @3=NULL /* VARSTRING(60) meta=60 nullable=1 is_null=1 */
# at 1941387
#160927 2:53:55 server id 23390 end_log_pos 1941463 CRC32 0x70cde740 Query thread_id=187 exec_time=12 error_code=0
SET TIMESTAMP=1474916035/*!*/;
SET @@session.sql_mode=1436549152/*!*/;
XA END X'30',X'',1
/*!*/;
# at 1941463
#160927 2:53:55 server id 23390 end_log_pos 1941500 CRC32 0xf1c4290a XA PREPARE X'30',X'',1
XA PREPARE X'30',X'',1
..........
..........
..........
# at 1944806
#160927 2:53:55 server id 23390 end_log_pos 1944871 CRC32 0x51aaf46a GTID last_committed=4781 sequence_number=4782
SET @@SESSION.GTID_NEXT= '5d94dc1a-8204-11e6-92ee-5254005428f4:23379'/*!*/;
# at 1944871
#160927 2:53:55 server id 23390 end_log_pos 1944959 CRC32 0x91c3b6e4 Query thread_id=187 exec_time=13 error_code=0
SET TIMESTAMP=1474916035/*!*/;
XA COMMIT X'30',X'',1
/*!*/;
ROLLBACK /* added by mysqlbinlog */ /*!*/;
SET @@SESSION.GTID_NEXT= 'AUTOMATIC' /* added by mysqlbinlog */ /*!*/;
DELIMITER ;
# End of log file
/*!50003 SET COMPLETION_TYPE=@OLD_COMPLETION_TYPE*/;
/*!50530 SET @@SESSION.PSEUDO_SLAVE_MODE=0*/;
Here you can see the xa '30' in slave has been submitted.
Query table data from the slave:
mysql> select * from part_table where c1=13210;
Empty set (0.00 sec)
mysql> select * from norm_table where c1=13210;
Empty set (0.00 sec)
mysql> xa recover;
Empty set (0.00 sec)
Here has been submitted, but no data,this is why?
Before the XID has been submitted, and then begin a the same XID's XA transaction should be OK,but there is a error,says:Error 'XAER_DUPID: The XID already exists' on query.
And the execution of "xa recover", did not return the result.
MySQL has been lost before the transaction has been submitted?
How to repeat:
Reproducing method:
1.Create test table
create table norm_table(c1 int auto_increment primary key, c2 int, c3 varchar(20));
create table part_table(c1 int auto_increment primary key, c2 int, c3 varchar(20));
2.Perform sysbench in master database
sysbench --test=./tests/db/xa.lua --mysql-user=root --mysql-password=abc123 \
--mysql-db=test --mysql-host=127.0.0.1 --mysql-port=3390 --oltp-read-only=off --report-interval=10 \
--rand-type=uniform --max-time=60 --num-threads=5 --max-requests=0 --percentile=99 run
xa.lua文件:
pathtest = string.match(test, "(.*/)") or ""
dofile(pathtest .. "common.lua")
function thread_init(thread_id)
set_vars()
local ids
ids = sb_rand(0,10000)
local ids2
ids2 = sb_rand(10002,20000)
if (db_driver == "mysql" and mysql_table_engine == "myisam") then
begin_query = "LOCK TABLES test WRITE"
commit_query = "UNLOCK TABLES"
else
begin_query = "xa start " .. "'" .. ids .. "'"
commit_query1 = "xa end " .. "'" .. ids .. "'"
commit_query2 = "xa PREPARE " .. "'" .. ids .. "'"
commit_query3 = "xa commit " .. "'" .. ids .. "'"
begin_query2 = "xa start " .. "'" .. ids2 .. "'"
commit_query4 = "xa end " .. "'" .. ids2 .. "'"
commit_query5 = "xa commit " .. "'" .. ids2 .. "' ONE PHASE"
end
end
function event(thread_id)
local id
id = sb_rand(0,5000)
local ids3
ids3 = sb_rand(50001,10000)
if not oltp_skip_trx then
db_query(begin_query)
end
db_query("UPDATE test.norm_table SET c2 = c2 + 1 where c1 = " .. id )
db_query("UPDATE test.part_table SET c2 = c2 + 1 where c1 = " .. id )
db_query("delete from test.norm_table where c1 = " .. id )
db_query("delete from test.part_table where c1 = " .. id )
db_query("insert into test.part_table(c2) values(" .. id .. ")" )
db_query("insert into test.norm_table(c2) values(" .. id .. ")" )
db_query("delete from test.norm_table where c1 = " .. id )
db_query("delete from test.part_table where c1 = " .. id )
db_query("SELECT * FROM test.norm_table where sleep(0.3)=0 and c1 = " .. id )
if not oltp_skip_trx then
db_query(commit_query1)
db_query(commit_query2)
db_query(commit_query3)
end
if not oltp_skip_trx then
db_query(begin_query2)
end
db_query("UPDATE test.norm_table SET c2 = c2 + 1 where c1 = " .. ids3 )
db_query("UPDATE test.part_table SET c2 = c2 + 1 where c1 = " .. ids3 )
db_query("delete from test.norm_table where c1 = " .. ids3 )
db_query("delete from test.part_table where c1 = " .. ids3 )
db_query("insert into test.part_table(c2) values(" .. ids3 .. ")" )
db_query("insert into test.norm_table(c2) values(" .. ids3 .. ")" )
db_query("delete from test.norm_table where c1 = " .. ids3 )
db_query("delete from test.part_table where c1 = " .. ids3 )
db_query("SELECT * FROM test.norm_table where sleep(0.3)=0 and c1 = " .. ids3 )
if not oltp_skip_trx then
db_query(commit_query4)
db_query(commit_query5)
end
end
3.When the sysbench is executed in master,and slave server power off(The power down).Neither init 0 nor shutdown.
And then open slave server,slave database replication will be interrupted,Error occurred.
This phenomenon is accidental,But the probability is high.