In an environment running Galera Cluster with 6 MariaDB nodes, 1 arbitrator node, some replicas, and ProxySQL, a network issue triggered a state transfer on two nodes.
Afterwards, for an unknown reason, almost all transactions hang in one of the following states:
- "starting" state, on the COMMIT statement or on an empty statement ("").
- "acquiring total order isolation" state, on the "KILL CONNECTION" statement (the "KILL CONNECTION" was requested by ProxySQL).
We tried to restart the service, but it hung while stopping. ProxySQL detected this node as down and switched the traffic to another node.
Looking at the backtrace, it seems that we have a kind of "pthread_cond_wait() deadlock": the wait is reached via lock.wait() in the enter() function of the commit monitor, during the commit order critical section.
Unfortunately, we didn't find a way to reproduce the problem.
{"report":{"fcp":826.8999996185303,"ttfb":275.3999996185303,"pageVisibility":"visible","entityId":113664,"key":"jira.project.issue.view-issue","isInitial":true,"threshold":1000,"elementTimings":{},"userDeviceMemory":8,"userDeviceProcessors":32,"apdex":1,"journeyId":"0fd77c99-4d28-4984-9e8f-fe79664d3704","navigationType":0,"readyForUser":902.6999998092651,"redirectCount":0,"resourceLoadedEnd":553.8999996185303,"resourceLoadedStart":280.2999997138977,"resourceTiming":[{"duration":11.5,"initiatorType":"link","name":"https://jira.mariadb.org/s/2c21342762a6a02add1c328bed317ffd-CDN/lu2cib/820016/12ta74/0a8bac35585be7fc6c9cc5a0464cd4cf/_/download/contextbatch/css/_super/batch.css","startTime":280.2999997138977,"connectEnd":0,"connectStart":0,"domainLookupEnd":0,"domainLookupStart":0,"fetchStart":280.2999997138977,"redirectEnd":0,"redirectStart":0,"requestStart":0,"responseEnd":291.7999997138977,"responseStart":0,"secureConnectionStart":0},{"duration":16.09999990463257,"initiatorType":"link","name":"https://jira.mariadb.org/s/7ebd35e77e471bc30ff0eba799ebc151-CDN/lu2cib/820016/12ta74/494e4c556ecbb29f90a3d3b4f09cb99c/_/download/contextbatch/css/jira.browse.project,project.issue.navigator,jira.view.issue,jira.general,jira.global,atl.general,-_super/batch.css?agile_global_admin_condition=true&jag=true&jira.create.linked.issue=true&slack-enabled=true&whisper-enabled=true","startTime":280.59999990463257,"connectEnd":0,"connectStart":0,"domainLookupEnd":0,"domainLookupStart":0,"fetchStart":280.59999990463257,"redirectEnd":0,"redirectStart":0,"requestStart":0,"responseEnd":296.69999980926514,"responseStart":0,"secureConnectionStart":0},{"duration":61.09999990463257,"initiatorType":"script","name":"https://jira.mariadb.org/s/0917945aaa57108d00c5076fea35e069-CDN/lu2cib/820016/12ta74/0a8bac35585be7fc6c9cc5a0464cd4cf/_/download/contextbatch/js/_super/batch.js?locale=en","startTime":280.7999997138977,"connectEnd":280.7999997138977,"connectStart":280.7999997138977,"domainLookupEnd":280.7
999997138977,"domainLookupStart":280.7999997138977,"fetchStart":280.7999997138977,"redirectEnd":0,"redirectStart":0,"requestStart":301.2999997138977,"responseEnd":341.8999996185303,"responseStart":315.59999990463257,"secureConnectionStart":280.7999997138977},{"duration":90.5,"initiatorType":"script","name":"https://jira.mariadb.org/s/2d8175ec2fa4c816e8023260bd8c1786-CDN/lu2cib/820016/12ta74/494e4c556ecbb29f90a3d3b4f09cb99c/_/download/contextbatch/js/jira.browse.project,project.issue.navigator,jira.view.issue,jira.general,jira.global,atl.general,-_super/batch.js?agile_global_admin_condition=true&jag=true&jira.create.linked.issue=true&locale=en&slack-enabled=true&whisper-enabled=true","startTime":281,"connectEnd":281,"connectStart":281,"domainLookupEnd":281,"domainLookupStart":281,"fetchStart":281,"redirectEnd":0,"redirectStart":0,"requestStart":301.3999996185303,"responseEnd":371.5,"responseStart":320.8999996185303,"secureConnectionStart":281},{"duration":34.40000009536743,"initiatorType":"script","name":"https://jira.mariadb.org/s/a9324d6758d385eb45c462685ad88f1d-CDN/lu2cib/820016/12ta74/c92c0caa9a024ae85b0ebdbed7fb4bd7/_/download/contextbatch/js/atl.global,-_super/batch.js?locale=en","startTime":281.09999990463257,"connectEnd":281.09999990463257,"connectStart":281.09999990463257,"domainLookupEnd":281.09999990463257,"domainLookupStart":281.09999990463257,"fetchStart":281.09999990463257,"redirectEnd":0,"redirectStart":0,"requestStart":302.19999980926514,"responseEnd":315.5,"responseStart":314.5,"secureConnectionStart":281.09999990463257},{"duration":52.40000009536743,"initiatorType":"script","name":"https://jira.mariadb.org/s/d41d8cd98f00b204e9800998ecf8427e-CDN/lu2cib/820016/12ta74/1.0/_/download/batch/jira.webresources:calendar-en/jira.webresources:calendar-en.js","startTime":281.2999997138977,"connectEnd":281.2999997138977,"connectStart":281.2999997138977,"domainLookupEnd":281.2999997138977,"domainLookupStart":281.2999997138977,"fetchStart":281.2999997138977,"redi
rectEnd":0,"redirectStart":0,"requestStart":305,"responseEnd":333.69999980926514,"responseStart":333.09999990463257,"secureConnectionStart":281.2999997138977},{"duration":54.299999713897705,"initiatorType":"script","name":"https://jira.mariadb.org/s/d41d8cd98f00b204e9800998ecf8427e-CDN/lu2cib/820016/12ta74/1.0/_/download/batch/jira.webresources:calendar-localisation-moment/jira.webresources:calendar-localisation-moment.js","startTime":281.5,"connectEnd":281.5,"connectStart":281.5,"domainLookupEnd":281.5,"domainLookupStart":281.5,"fetchStart":281.5,"redirectEnd":0,"redirectStart":0,"requestStart":306.09999990463257,"responseEnd":335.7999997138977,"responseStart":335.2999997138977,"secureConnectionStart":281.5},{"duration":23.09999990463257,"initiatorType":"link","name":"https://jira.mariadb.org/s/b04b06a02d1959df322d9cded3aeecc1-CDN/lu2cib/820016/12ta74/a2ff6aa845ffc9a1d22fe23d9ee791fc/_/download/contextbatch/css/jira.global.look-and-feel,-_super/batch.css","startTime":281.69999980926514,"connectEnd":0,"connectStart":0,"domainLookupEnd":0,"domainLookupStart":0,"fetchStart":281.69999980926514,"redirectEnd":0,"redirectStart":0,"requestStart":0,"responseEnd":304.7999997138977,"responseStart":0,"secureConnectionStart":0},{"duration":48.80000019073486,"initiatorType":"script","name":"https://jira.mariadb.org/rest/api/1.0/shortcuts/820016/47140b6e0a9bc2e4913da06536125810/shortcuts.js?context=issuenavigation&context=issueaction","startTime":281.7999997138977,"connectEnd":316.2999997138977,"connectStart":316.2999997138977,"domainLookupEnd":316.2999997138977,"domainLookupStart":316.2999997138977,"fetchStart":281.7999997138977,"redirectEnd":0,"redirectStart":0,"requestStart":318.8999996185303,"responseEnd":330.59999990463257,"responseStart":329.5,"secureConnectionStart":316.2999997138977},{"duration":34.19999980926514,"initiatorType":"link","name":"https://jira.mariadb.org/s/3ac36323ba5e4eb0af2aa7ac7211b4bb-CDN/lu2cib/820016/12ta74/d176f0986478cc64f24226b3d20c140d/_/download/c
ontextbatch/css/com.atlassian.jira.projects.sidebar.init,-_super,-project.issue.navigator,-jira.view.issue/batch.css?jira.create.linked.issue=true","startTime":282,"connectEnd":0,"connectStart":0,"domainLookupEnd":0,"domainLookupStart":0,"fetchStart":282,"redirectEnd":0,"redirectStart":0,"requestStart":0,"responseEnd":316.19999980926514,"responseStart":0,"secureConnectionStart":0},{"duration":54.59999990463257,"initiatorType":"script","name":"https://jira.mariadb.org/s/5d5e8fe91fbc506585e83ea3b62ccc4b-CDN/lu2cib/820016/12ta74/d176f0986478cc64f24226b3d20c140d/_/download/contextbatch/js/com.atlassian.jira.projects.sidebar.init,-_super,-project.issue.navigator,-jira.view.issue/batch.js?jira.create.linked.issue=true&locale=en","startTime":282.09999990463257,"connectEnd":282.09999990463257,"connectStart":282.09999990463257,"domainLookupEnd":282.09999990463257,"domainLookupStart":282.09999990463257,"fetchStart":282.09999990463257,"redirectEnd":0,"redirectStart":0,"requestStart":319.8999996185303,"responseEnd":336.69999980926514,"responseStart":331.3999996185303,"secureConnectionStart":282.09999990463257},{"duration":259,"initiatorType":"script","name":"https://jira.mariadb.org/s/d41d8cd98f00b204e9800998ecf8427e-CDN/lu2cib/820016/12ta74/1.0/_/download/batch/jira.webresources:bigpipe-js/jira.webresources:bigpipe-js.js","startTime":294.7999997138977,"connectEnd":294.7999997138977,"connectStart":294.7999997138977,"domainLookupEnd":294.7999997138977,"domainLookupStart":294.7999997138977,"fetchStart":294.7999997138977,"redirectEnd":0,"redirectStart":0,"requestStart":351.09999990463257,"responseEnd":553.7999997138977,"responseStart":549.7999997138977,"secureConnectionStart":294.7999997138977},{"duration":257.5,"initiatorType":"script","name":"https://jira.mariadb.org/s/d41d8cd98f00b204e9800998ecf8427e-CDN/lu2cib/820016/12ta74/1.0/_/download/batch/jira.webresources:bigpipe-init/jira.webresources:bigpipe-init.js","startTime":296.3999996185303,"connectEnd":296.3999996185303,"connec
tStart":296.3999996185303,"domainLookupEnd":296.3999996185303,"domainLookupStart":296.3999996185303,"fetchStart":296.3999996185303,"redirectEnd":0,"redirectStart":0,"requestStart":360.09999990463257,"responseEnd":553.8999996185303,"responseStart":550.2999997138977,"secureConnectionStart":296.3999996185303},{"duration":193.60000038146973,"initiatorType":"xmlhttprequest","name":"https://jira.mariadb.org/rest/webResources/1.0/resources","startTime":565.3999996185303,"connectEnd":565.3999996185303,"connectStart":565.3999996185303,"domainLookupEnd":565.3999996185303,"domainLookupStart":565.3999996185303,"fetchStart":565.3999996185303,"redirectEnd":0,"redirectStart":0,"requestStart":726.6999998092651,"responseEnd":759,"responseStart":758.3999996185303,"secureConnectionStart":565.3999996185303},{"duration":141,"initiatorType":"script","name":"https://www.google-analytics.com/analytics.js","startTime":797,"connectEnd":0,"connectStart":0,"domainLookupEnd":0,"domainLookupStart":0,"fetchStart":797,"redirectEnd":0,"redirectStart":0,"requestStart":0,"responseEnd":938,"responseStart":0,"secureConnectionStart":0},{"duration":181,"initiatorType":"xmlhttprequest","name":"https://jira.mariadb.org/rest/webResources/1.0/resources","startTime":818.2999997138977,"connectEnd":818.2999997138977,"connectStart":818.2999997138977,"domainLookupEnd":818.2999997138977,"domainLookupStart":818.2999997138977,"fetchStart":818.2999997138977,"redirectEnd":0,"redirectStart":0,"requestStart":964,"responseEnd":999.2999997138977,"responseStart":998.5999999046326,"secureConnectionStart":818.2999997138977}],"fetchStart":0,"domainLookupStart":0,"domainLookupEnd":0,"connectStart":0,"connectEnd":0,"requestStart":18,"responseStart":275,"responseEnd":295,"domLoading":279,"domInteractive":965,"domContentLoadedEventStart":965,"domContentLoadedEventEnd":1007,"domComplete":1269,"loadEventStart":1269,"loadEventEnd":1269,"userAgent":"Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; ClaudeBot/1.0; 
+claudebot@anthropic.com)","marks":[{"name":"bigPipe.sidebar-id.start","time":940.0999999046326},{"name":"bigPipe.sidebar-id.end","time":940.6999998092651},{"name":"bigPipe.activity-panel-pipe-id.start","time":940.8999996185303},{"name":"bigPipe.activity-panel-pipe-id.end","time":942.2999997138977},{"name":"activityTabFullyLoaded","time":1029.6999998092651}],"measures":[],"correlationId":"cc495ab0b60aa","effectiveType":"4g","downlink":10,"rtt":0,"serverDuration":170,"dbReadsTimeInMs":21,"dbConnsTimeInMs":31,"applicationHash":"9d11dbea5f4be3d4cc21f03a88dd11d8c8687422","experiments":[]}}
I see that it has been previously claimed that this bug does not affect MariaDB Server 10.6 or later. Please clarify what should be done on merge to 10.6. If it is anything other than a null-merge (discarding the changes), we need to review and test the 10.6 version as well.
Am I right that this is basically yet another attempt at fixing MDEV-23328?