Uploaded image for project: 'MariaDB Server'
  1. MariaDB Server
  2. MDEV-34049

InnoDB: Failing assertion: table->get_ref_count() == 0 in dict_sys_t::remove on DROP

Details

    Description

      Possibly related: MDEV-25850, MDEV-26636, MDEV-29277, MDEV-29507, MDEV-30337

      # MYEXTRA="--no-defaults --sql_mode="
      # REPL_EXTRA="--gtid_strict_mode=1 --relay-log=relaylog"  # used for both master & slave
      # MASTER_EXTRA="--log_bin=binlog --binlog_format=STATEMENT --log_bin_trust_function_creators=1 --server_id=1"
      # SLAVE_EXTRA="--slave-parallel-threads=11 --slave-parallel-mode=aggressive --slave-parallel-max-queued=1073741827 --slave_run_triggers_for_rbr=LOGGING --slave_skip_errors=ALL --server_id=2"
      CREATE TABLE t1 (a1 VARCHAR(1), a2 VARCHAR(1)) ENGINE=InnoDB;
      XA START 'a';
      CREATE TEMPORARY TABLE t1 (c1 INT) ENGINE=InnoDB;
      INSERT INTO t1 VALUES ('a');
      INSERT IGNORE INTO t1 VALUES (@inserted_value);
      XA END 'a';
      XA ROLLBACK 'a';
      SET SESSION gtid_domain_id=102;
      

      Leads, very sporadically, to:

      10.6.18 0ccdf54b644352f42e1768bc660be7ab50c1e9d2 (Debug)

      Core was generated by `/test/MD240424-mariadb-10.6.18-linux-x86_64-dbg/bin/mariadbd --no-defaults --ba'.
      Program terminated with signal SIGABRT, Aborted.
      #0  __pthread_kill_implementation (no_tid=0, signo=6, threadid=<optimized out>)at ./nptl/pthread_kill.c:44
      [Current thread is 1 (LWP 2457798)]
      (gdb) bt
      #0  __pthread_kill_implementation (no_tid=0, signo=6, threadid=<optimized out>)at ./nptl/pthread_kill.c:44
      #1  __pthread_kill_internal (signo=6, threadid=<optimized out>)at ./nptl/pthread_kill.c:78
      #2  __GI___pthread_kill (threadid=<optimized out>, signo=signo@entry=6)at ./nptl/pthread_kill.c:89
      #3  0x00001508c683c406 in __GI_raise (sig=sig@entry=6)at ../sysdeps/posix/raise.c:26
      #4  0x00001508c682287c in __GI_abort () at ./stdlib/abort.c:79
      #5  0x000055b283f69902 in ut_dbg_assertion_failed (expr=expr@entry=0x55b2845e0fe1 "table->get_ref_count() == 0", file=file@entry=0x55b2845e1250 "/test/10.6_dbg/storage/innobase/dict/dict0dict.cc", line=line@entry=1826)at /test/10.6_dbg/storage/innobase/ut/ut0dbg.cc:60
      #6  0x000055b28401cfab in dict_sys_t::remove (this=this@entry=0x55b284bfa980 <dict_sys>, table=0x150850021e38, lru=lru@entry=false, keep=keep@entry=false)at /test/10.6_dbg/storage/innobase/dict/dict0dict.cc:1826
      #7  0x000055b283d5f650 in ha_innobase::delete_table (this=<optimized out>, name=<optimized out>)at /test/10.6_dbg/storage/innobase/handler/ha_innodb.cc:13528
      #8  0x000055b2839c79c1 in hton_drop_table (hton=<optimized out>, path=<optimized out>) at /test/10.6_dbg/sql/handler.cc:573
      #9  0x000055b28392bc8b in THD::rm_temporary_table (this=<optimized out>, base=0x55b286f5cc18, path=0x150850020f70 "/dev/shm/1714686204629124488/subreducer/289/tmp_slave/#sql-temptable-25632b-c-0") at /test/10.6_dbg/sql/temporary_tables.cc:705
      #10 0x000055b28392c31e in THD::free_tmp_table_share (this=this@entry=0x150854000d58, share=share@entry=0x150850020958, delete_table=delete_table@entry=true)at /test/10.6_dbg/sql/temporary_tables.cc:1473
      #11 0x000055b28392db50 in THD::drop_temporary_table (this=this@entry=0x150854000d58, table=<optimized out>, is_trans=is_trans@entry=0x1508a1964be7, delete_table=delete_table@entry=true)at /test/10.6_dbg/sql/temporary_tables.cc:673
      #12 0x000055b2837c1c9e in mysql_rm_table_no_locks (thd=thd@entry=0x150854000d58, tables=tables@entry=0x15085400ae78, current_db=current_db@entry=0x150854000df8, ddl_log_state=0x1508a1964c40, ddl_log_state@entry=0x0, if_exists=if_exists@entry=true, drop_temporary=drop_temporary@entry=true, drop_view=false, drop_sequence=false, dont_log_query=false, dont_free_locks=false)at /test/10.6_dbg/sql/sql_table.cc:1321
      #13 0x000055b2837c450f in mysql_rm_table (thd=thd@entry=0x150854000d58, tables=tables@entry=0x15085400ae78, if_exists=<optimized out>, drop_temporary=<optimized out>, drop_sequence=<optimized out>, dont_log_query=dont_log_query@entry=false)at /test/10.6_dbg/sql/sql_table.cc:1069
      #14 0x000055b283706796 in mysql_execute_command (thd=thd@entry=0x150854000d58, is_called_from_prepared_stmt=is_called_from_prepared_stmt@entry=false)at /test/10.6_dbg/sql/sql_parse.cc:5030
      #15 0x000055b28370b0b4 in mysql_parse (thd=0x150854000d58, rawbuf=<optimized out>, length=<optimized out>, parser_state=parser_state@entry=0x1508a19658b0)at /test/10.6_dbg/sql/sql_parse.cc:8146
      #16 0x000055b283b2ffe2 in Query_log_event::do_apply_event (this=0x15086c037098, rgi=0x15086c02edc0, query_arg=0x15086c037203 "DROP /*!40005 TEMPORARY */ TABLE IF EXISTS `t1`", q_len_arg=<optimized out>) at /test/10.6_dbg/sql/sql_class.h:240
      #17 0x000055b283b3091e in Query_log_event::do_apply_event (this=<optimized out>, rgi=<optimized out>)at /test/10.6_dbg/sql/log_event_server.cc:1609
      #18 0x000055b28362c4e5 in Log_event::apply_event (rgi=0x15086c02edc0, this=0x15086c037098) at /test/10.6_dbg/sql/log_event.h:1509
      #19 apply_event_and_update_pos_apply (ev=ev@entry=0x15086c037098, thd=thd@entry=0x150854000d58, rgi=rgi@entry=0x15086c02edc0, reason=reason@entry=0) at /test/10.6_dbg/sql/slave.cc:3906
      #20 0x000055b28363672c in apply_event_and_update_pos_for_parallel (ev=ev@entry=0x15086c037098, thd=thd@entry=0x150854000d58, rgi=rgi@entry=0x15086c02edc0) at /test/10.6_dbg/sql/slave.cc:4102
      #21 0x000055b2838d6508 in rpt_handle_event (qev=qev@entry=0x15086c02e968, rpt=rpt@entry=0x15086c00f7c0) at /test/10.6_dbg/sql/rpl_parallel.cc:64
      #22 0x000055b2838db02b in handle_rpl_parallel_thread (arg=arg@entry=0x15086c00f7c0) at /test/10.6_dbg/sql/rpl_parallel.cc:1525
      #23 0x000055b283ca0f78 in pfs_spawn_thread (arg=0x15086c012c38)at /test/10.6_dbg/storage/perfschema/pfs.cc:2201
      #24 0x00001508c688f18a in start_thread (arg=<optimized out>)at ./nptl/pthread_create.c:444
      #25 0x00001508c691dbd0 in clone3 ()at ../sysdeps/unix/sysv/linux/x86_64/clone3.S:81
      

      Note the crashing query from the stack:

      DROP /*!40005 TEMPORARY */ TABLE IF EXISTS `t1`
      

      Is not directly part of the testcase.

      NTS: ~/MDEV-34049 | sc30985

      Attachments

        Issue Links

          Activity

            Proposed patch (10.6-based) to fix this issue:

            diff --git a/sql/sys_vars.cc b/sql/sys_vars.cc
            index 115bbdf499b..e9baed59cd7 100644
            --- a/sql/sys_vars.cc
            +++ b/sql/sys_vars.cc
            @@ -1808,12 +1808,32 @@ Sys_pseudo_thread_id(
             static bool
             check_gtid_domain_id(sys_var *self, THD *thd, set_var *var)
             {
            -  if (var->type != OPT_GLOBAL &&
            -      error_if_in_trans_or_substatement(thd,
            +  if (var->type != OPT_GLOBAL)
            +  {
            +    if (error_if_in_trans_or_substatement(thd,
                       ER_STORED_FUNCTION_PREVENTS_SWITCH_GTID_DOMAIN_ID_SEQ_NO,
                       ER_INSIDE_TRANSACTION_PREVENTS_SWITCH_GTID_DOMAIN_ID_SEQ_NO))
                 return true;
            -
            +    /*
            +      All binlogged statements on a temporary table must be binlogged in the
            +      same domain_id; it is not safe to run them in parallel in different
            +      domains, temporary table must be exclusive to a single thread.
            +      In row-based binlogging, temporary tables do not end up in the binlog,
            +      so there is no such issue.
            +
            +      ToDo: When merging to next (non-GA) release, introduce a more specific
            +      error that describes that the problem is changing gtid_domain_id with
            +      open temporary tables in statement/mixed binlogging mode; it is not
            +      really due to doing it inside a "transaction".
            +    */
            +    if (thd->has_thd_temporary_tables() &&
            +        !thd->is_current_stmt_binlog_format_row())
            +    {
            +      my_error(ER_INSIDE_TRANSACTION_PREVENTS_SWITCH_GTID_DOMAIN_ID_SEQ_NO,
            +               MYF(0));
            +        return true;
            +    }
            +  }
               return false;
             }
             
            

            knielsen Kristian Nielsen added a comment - Proposed patch (10.6-based) to fix this issue: diff --git a/sql/sys_vars.cc b/sql/sys_vars.cc index 115bbdf499b..e9baed59cd7 100644 --- a/sql/sys_vars.cc +++ b/sql/sys_vars.cc @@ -1808,12 +1808,32 @@ Sys_pseudo_thread_id( static bool check_gtid_domain_id(sys_var *self, THD *thd, set_var *var) { - if (var->type != OPT_GLOBAL && - error_if_in_trans_or_substatement(thd, + if (var->type != OPT_GLOBAL) + { + if (error_if_in_trans_or_substatement(thd, ER_STORED_FUNCTION_PREVENTS_SWITCH_GTID_DOMAIN_ID_SEQ_NO, ER_INSIDE_TRANSACTION_PREVENTS_SWITCH_GTID_DOMAIN_ID_SEQ_NO)) return true; - + /* + All binlogged statements on a temporary table must be binlogged in the + same domain_id; it is not safe to run them in parallel in different + domains, temporary table must be exclusive to a single thread. + In row-based binlogging, temporary tables do not end up in the binlog, + so there is no such issue. + + ToDo: When merging to next (non-GA) release, introduce a more specific + error that describes that the problem is changing gtid_domain_id with + open temporary tables in statement/mixed binlogging mode; it is not + really due to doing it inside a "transaction". + */ + if (thd->has_thd_temporary_tables() && + !thd->is_current_stmt_binlog_format_row()) + { + my_error(ER_INSIDE_TRANSACTION_PREVENTS_SWITCH_GTID_DOMAIN_ID_SEQ_NO, + MYF(0)); + return true; + } + } return false; }
            knielsen Kristian Nielsen added a comment - Proposed patch for review: https://lists.mariadb.org/hyperkitty/list/commits@lists.mariadb.org/thread/DN2LQ53HWTUQSAQHR6PT5OYDIFXI6BYB/

            Thank you very much knielsen

            Roel Roel Van de Paar added a comment - Thank you very much knielsen

            Looks good, thanks knielsen!

            bnestere Brandon Nesterenko added a comment - Looks good, thanks knielsen !

            Pushed to 10.6

            knielsen Kristian Nielsen added a comment - Pushed to 10.6

            People

              knielsen Kristian Nielsen
              Roel Roel Van de Paar
              Votes:
              0 Vote for this issue
              Watchers:
              4 Start watching this issue

              Dates

                Created:
                Updated:
                Resolved:

                Git Integration

                  Error rendering 'com.xiplink.jira.git.jira_git_plugin:git-issue-webpanel'. Please contact your Jira administrators.