#8 0x00005566b296b16a in wsrep::transaction::after_statement (this=this@entry=0x1490b00078a8) at /test/mtest/10.8_dbg/wsrep-lib/src/transaction.cpp:890
#9 0x00005566b2950fd8 in wsrep::client_state::after_statement (this=this@entry=0x1490b0007840) at /test/mtest/10.8_dbg/wsrep-lib/src/client_state.cpp:272
#10 0x00005566b1ee5c78 in wsrep_after_statement (thd=0x1490b0000ff8) at /test/mtest/10.8_dbg/sql/sql_class.h:5330
#11 rpt_handle_event (qev=qev@entry=0x1490c003bfb8, rpt=rpt@entry=0x1490c000eaa0) at /test/mtest/10.8_dbg/sql/rpl_parallel.cc:66
#12 0x00005566b1eeb555 in handle_rpl_parallel_thread (arg=arg@entry=0x1490c000eaa0) at /test/mtest/10.8_dbg/sql/rpl_parallel.cc:1376
#13 0x00005566b22e5601 in pfs_spawn_thread (arg=0x1490c000fd08) at /test/mtest/10.8_dbg/storage/perfschema/pfs.cc:2201
#14 0x000014914c45b609 in start_thread (arg=<optimized out>) at pthread_create.c:477
#15 0x000014914c049293 in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:95
(gdb)
Ramesh Sivaraman
added a comment - Node1 crashes with a similar assertion in a different place when we run RQG with a simple grammar file.
perl gentest.pl --dsn=dbi:mysql:host=127.0.0.1:port=4040:socket=/home/ramesh/rpl/data/socket.sock:user=root:database=test --gendata=conf/examples/example.zz --grammar=conf/examples/example.yy --threads=8 --duration=300 --queries=100000
10.8.0 cf7cc376bacb3f49f5afa2cce144dace82602546
Core was generated by `/home/ramesh/rpl/mariadb-10.8.0-linux-x86_64_one/bin/mysqld --defaults-file=/ho'.
--Type <RET> for more, q to quit, c to continue without paging--
Program terminated with signal SIGABRT, Aborted.
#0 __pthread_kill (threadid=<optimized out>, signo=signo@entry=6) at ../sysdeps/unix/sysv/linux/pthread_kill.c:56
56 ../sysdeps/unix/sysv/linux/pthread_kill.c: No such file or directory.
[Current thread is 1 (Thread 0x149138272700 (LWP 324518))]
(gdb) bt
#0 __pthread_kill (threadid=<optimized out>, signo=signo@entry=6) at ../sysdeps/unix/sysv/linux/pthread_kill.c:56
#1 0x00005566b28071cd in my_write_core (sig=sig@entry=6) at /test/mtest/10.8_dbg/mysys/stacktrace.c:424
#2 0x00005566b1fe42d5 in handle_fatal_signal (sig=6) at /test/mtest/10.8_dbg/sql/signal_handler.cc:345
#3 <signal handler called>
#4 __GI_raise (sig=sig@entry=6) at ../sysdeps/unix/sysv/linux/raise.c:50
#5 0x000014914bf4c859 in __GI_abort () at abort.c:79
#6 0x000014914bf4c729 in __assert_fail_base (fmt=0x14914c0e2588 "%s%s%s:%u: %s%sAssertion `%s' failed.\n%n",
assertion=0x5566b2f50420 "state() == s_executing || state() == s_prepared || state() == s_committed || state() == s_aborted || state() == s_must_abort || state() == s_cert_failed || state() == s_must_replay", file=0x5566b2f4ed98 "/test/mtest/10.8_dbg/wsrep-lib/src/transaction.cpp", line=810, function=<optimized out>) at assert.c:92
#7 0x000014914bf5df36 in __GI___assert_fail (
assertion=assertion@entry=0x5566b2f50420 "state() == s_executing || state() == s_prepared || state() == s_committed || state() == s_aborted || state() == s_must_abort || state() == s_cert_failed || state() == s_must_replay", file=file@entry=0x5566b2f4ed98 "/test/mtest/10.8_dbg/wsrep-lib/src/transaction.cpp", line=line@entry=810, function=function@entry=0x5566b2f503f0 "int wsrep::transaction::after_statement()")
at assert.c:101
#8 0x00005566b296b16a in wsrep::transaction::after_statement (this=this@entry=0x1490b00078a8) at /test/mtest/10.8_dbg/wsrep-lib/src/transaction.cpp:890
#9 0x00005566b2950fd8 in wsrep::client_state::after_statement (this=this@entry=0x1490b0007840) at /test/mtest/10.8_dbg/wsrep-lib/src/client_state.cpp:272
#10 0x00005566b1ee5c78 in wsrep_after_statement (thd=0x1490b0000ff8) at /test/mtest/10.8_dbg/sql/sql_class.h:5330
#11 rpt_handle_event (qev=qev@entry=0x1490c003bfb8, rpt=rpt@entry=0x1490c000eaa0) at /test/mtest/10.8_dbg/sql/rpl_parallel.cc:66
#12 0x00005566b1eeb555 in handle_rpl_parallel_thread (arg=arg@entry=0x1490c000eaa0) at /test/mtest/10.8_dbg/sql/rpl_parallel.cc:1376
#13 0x00005566b22e5601 in pfs_spawn_thread (arg=0x1490c000fd08) at /test/mtest/10.8_dbg/storage/perfschema/pfs.cc:2201
#14 0x000014914c45b609 in start_thread (arg=<optimized out>) at pthread_create.c:477
#15 0x000014914c049293 in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:95
(gdb)
2022-03-19 17:03:42 23 [ERROR] Slave SQL: Node has dropped from cluster, Gtid 0-11-88, Internal MariaDB error code: 1047
2022-03-19 17:03:42 23 [Note] WSREP: wsrep_after_statement for 23 client_state exec client_mode local trans_state ordered_commit
2022-03-19 17:03:42 23 [ERROR] Slave (additional info): An attempt was made to binlog GTID 0-11-88 which would create an out-of-order sequence number with existing GTID 0-11-90, and gtid strict mode is enabled Error_code: 1950
2022-03-19 17:03:42 23 [Warning] Slave: An attempt was made to binlog GTID 0-11-88 which would create an out-of-order sequence number with existing GTID 0-11-90, and gtid strict mode is enabled Error_code: 1950
2022-03-19 17:03:42 23 [ERROR] Error running query, slave SQL thread aborted. Fix the problem, and restart the slave SQL thread with "SLAVE START". We stopped at log 'binlog.000001' position 68458343; GTID position '0-11-90'
2022-03-19 17:03:42 22 [Note] WSREP: wsrep_after_statement for 22 client_state exec client_mode local trans_state executing
Ramesh Sivaraman
added a comment - jplindst Replication breaks in 10.4 optimized build even after fixing MDEV-27568
10.4.25 c519aa3d7aea1afb7754ccf70aa5b276ff5fbf87
2022-03-19 17:03:42 23 [Note] WSREP: wsrep_after_prepare: 1
2022-03-19 17:03:42 23 [Note] WSREP: wsrep_before_commit: 1, 91
2022-03-19 17:03:42 23 [Note] WSREP: wsrep_ordered_commit: 1
2022-03-19 17:03:42 23 [ERROR] mysqld: Error writing file 'binlog' (errno: 1950 "Unknown error 1950")
2022-03-19 17:03:42 22 [Note] WSREP: wsrep_after_statement for 22 client_state exec client_mode local trans_state executing
2022-03-19 17:03:42 23 [Note] WSREP: log_and_order has failed 23 0
2022-03-19 17:03:42 23 [Note] WSREP: rollback skipped 0x148128035300 1
2022-03-19 17:03:42 23 [Note] WSREP: SQL apply failed, res 1 conflict state: ordered_commit
2022-03-19 17:03:42 23 [ERROR] Slave SQL: Node has dropped from cluster, Gtid 0-11-88, Internal MariaDB error code: 1047
2022-03-19 17:03:42 23 [Note] WSREP: wsrep_after_statement for 23 client_state exec client_mode local trans_state ordered_commit
2022-03-19 17:03:42 23 [ERROR] Slave (additional info): An attempt was made to binlog GTID 0-11-88 which would create an out-of-order sequence number with existing GTID 0-11-90, and gtid strict mode is enabled Error_code: 1950
2022-03-19 17:03:42 23 [Warning] Slave: An attempt was made to binlog GTID 0-11-88 which would create an out-of-order sequence number with existing GTID 0-11-90, and gtid strict mode is enabled Error_code: 1950
2022-03-19 17:03:42 23 [Warning] Slave: Error writing file 'binlog' (errno: 1950 "Unknown error 1950") Error_code: 1026
2022-03-19 17:03:42 23 [ERROR] Error running query, slave SQL thread aborted. Fix the problem, and restart the slave SQL thread with "SLAVE START". We stopped at log 'binlog.000001' position 68458343; GTID position '0-11-90'
2022-03-19 17:03:42 22 [Note] WSREP: wsrep_after_statement for 22 client_state exec client_mode local trans_state executing
The error "Error writing file 'binlog' (errno: 1950 "Unknown error 1950")" is reported because there is an attempt to write a gtid event to the binlog and the gtid is out of order (1950 is ER_GTID_STRICT_OUT_OF_ORDER). The error is raised in this case because gtid_strict_mode is enabled.
Currently, the combination of slave_parallel_threads > 1 and Galera acting as a slave does not guarantee that the replication order of Galera matches the order given by the async replication master.
Daniele Sciascia
added a comment - The error "Error writing file 'binlog' (errno: 1950 "Unknown error 1950")" is reported because there is an attempt to write a gtid event to the binlog and the gtid is out of order (1950 is ER_GTID_STRICT_OUT_OF_ORDER). The error is raised in this case because gtid_strict_mode is enabled.
Currently, the combination of slave_parallel_threads > 1 and Galera acting as a slave does not guarantee that the replication order of Galera matches the order given by the async replication master.
Node1 crashes with a similar assertion in a different place when we run RQG with a simple grammar file.
perl gentest.pl --dsn=dbi:mysql:host=127.0.0.1:port=4040:socket=/home/ramesh/rpl/data/socket.sock:user=root:database=test --gendata=conf/examples/example.zz --grammar=conf/examples/example.yy --threads=8 --duration=300 --queries=100000
10.8.0 cf7cc376bacb3f49f5afa2cce144dace82602546
Core was generated by `/home/ramesh/rpl/mariadb-10.8.0-linux-x86_64_one/bin/mysqld --defaults-file=/ho'.
--Type <RET> for more, q to quit, c to continue without paging--
Program terminated with signal SIGABRT, Aborted.
#0 __pthread_kill (threadid=<optimized out>, signo=signo@entry=6) at ../sysdeps/unix/sysv/linux/pthread_kill.c:56
56 ../sysdeps/unix/sysv/linux/pthread_kill.c: No such file or directory.
[Current thread is 1 (Thread 0x149138272700 (LWP 324518))]
(gdb) bt
#0 __pthread_kill (threadid=<optimized out>, signo=signo@entry=6) at ../sysdeps/unix/sysv/linux/pthread_kill.c:56
#1 0x00005566b28071cd in my_write_core (sig=sig@entry=6) at /test/mtest/10.8_dbg/mysys/stacktrace.c:424
#2 0x00005566b1fe42d5 in handle_fatal_signal (sig=6) at /test/mtest/10.8_dbg/sql/signal_handler.cc:345
#3 <signal handler called>
#4 __GI_raise (sig=sig@entry=6) at ../sysdeps/unix/sysv/linux/raise.c:50
#5 0x000014914bf4c859 in __GI_abort () at abort.c:79
#6 0x000014914bf4c729 in __assert_fail_base (fmt=0x14914c0e2588 "%s%s%s:%u: %s%sAssertion `%s' failed.\n%n",
assertion=0x5566b2f50420 "state() == s_executing || state() == s_prepared || state() == s_committed || state() == s_aborted || state() == s_must_abort || state() == s_cert_failed || state() == s_must_replay", file=0x5566b2f4ed98 "/test/mtest/10.8_dbg/wsrep-lib/src/transaction.cpp", line=810, function=<optimized out>) at assert.c:92
#7 0x000014914bf5df36 in __GI___assert_fail (
assertion=assertion@entry=0x5566b2f50420 "state() == s_executing || state() == s_prepared || state() == s_committed || state() == s_aborted || state() == s_must_abort || state() == s_cert_failed || state() == s_must_replay", file=file@entry=0x5566b2f4ed98 "/test/mtest/10.8_dbg/wsrep-lib/src/transaction.cpp", line=line@entry=810, function=function@entry=0x5566b2f503f0 "int wsrep::transaction::after_statement()")
at assert.c:101
#8 0x00005566b296b16a in wsrep::transaction::after_statement (this=this@entry=0x1490b00078a8) at /test/mtest/10.8_dbg/wsrep-lib/src/transaction.cpp:890
#9 0x00005566b2950fd8 in wsrep::client_state::after_statement (this=this@entry=0x1490b0007840) at /test/mtest/10.8_dbg/wsrep-lib/src/client_state.cpp:272
#10 0x00005566b1ee5c78 in wsrep_after_statement (thd=0x1490b0000ff8) at /test/mtest/10.8_dbg/sql/sql_class.h:5330
#11 rpt_handle_event (qev=qev@entry=0x1490c003bfb8, rpt=rpt@entry=0x1490c000eaa0) at /test/mtest/10.8_dbg/sql/rpl_parallel.cc:66
#12 0x00005566b1eeb555 in handle_rpl_parallel_thread (arg=arg@entry=0x1490c000eaa0) at /test/mtest/10.8_dbg/sql/rpl_parallel.cc:1376
#13 0x00005566b22e5601 in pfs_spawn_thread (arg=0x1490c000fd08) at /test/mtest/10.8_dbg/storage/perfschema/pfs.cc:2201
#14 0x000014914c45b609 in start_thread (arg=<optimized out>) at pthread_create.c:477
#15 0x000014914c049293 in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:95
(gdb)