Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

bugfix: fix tcc dead lock #6769

Merged
merged 6 commits into from
Aug 22, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions changes/en-us/2.x.md
Original file line number Diff line number Diff line change
Expand Up @@ -24,6 +24,7 @@ Add changes here for all PR submitted to the 2.x branch.
- [[#6714](https://github.com/apache/incubator-seata/pull/6714)] fix dameng delete undo fail
- [[#6701](https://github.com/apache/incubator-seata/pull/6728)] fix support serialization for dm.jdbc.driver.DmdbTimestamp
- [[#6757](https://github.com/apache/incubator-seata/pull/6757)] the bug where multiple nodes cannot be retrieved from the naming server
- [[#6769](https://github.com/apache/incubator-seata/pull/6769)] fix tcc fence deadLock


### optimize:
Expand Down
2 changes: 1 addition & 1 deletion changes/zh-cn/2.x.md
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@
- [[#6714](https://github.com/apache/incubator-seata/pull/6714)] 修复达梦数据库的delete sql回滚失败的问题
- [[#6701](https://github.com/apache/incubator-seata/pull/6728)] 修复达梦数据库的对dm.jdbc.driver.DmdbTimestamp的支持
- [[#6757](https://github.com/apache/incubator-seata/pull/6757)] 修复client通过namingserver只能获取到一个tc节点的bug

- [[#6769](https://github.com/apache/incubator-seata/pull/6769)] 修复tcc fence死锁

### optimize:
- [[#6499](https://github.com/apache/incubator-seata/pull/6499)] 拆分 committing 和 rollbacking 状态的任务线程池
Expand Down
10 changes: 10 additions & 0 deletions common/src/main/java/org/apache/seata/common/Constants.java
Original file line number Diff line number Diff line change
Expand Up @@ -225,4 +225,14 @@ public interface Constants {
*/
String JACKSON_JSON_TEXT_PREFIX = "{\"@class\":";

/**
* The constant DEAD_LOCK_SQL_STATE
*/
String DEAD_LOCK_SQL_STATE = "40001";

/**
* The constant DEAD_LOCK_ERROR_CODE
*/
int DEAD_LOCK_ERROR_CODE = 1213;

}
Original file line number Diff line number Diff line change
Expand Up @@ -18,8 +18,12 @@

import java.lang.reflect.Method;
import java.sql.Connection;
import java.sql.SQLException;
import java.util.ArrayList;
import java.util.Date;
import java.util.Map;
import java.util.Objects;
import java.util.Optional;
import java.util.Set;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.LinkedBlockingQueue;
Expand All @@ -28,6 +32,7 @@

import javax.sql.DataSource;

import org.apache.seata.common.Constants;
import org.apache.seata.common.exception.ExceptionUtil;
import org.apache.seata.common.exception.FrameworkErrorCode;
import org.apache.seata.common.exception.SkipCallbackWrapperException;
Expand All @@ -41,10 +46,14 @@
import org.apache.seata.integration.tx.api.fence.store.CommonFenceStore;
import org.apache.seata.integration.tx.api.fence.store.db.CommonFenceStoreDataBaseDAO;
import org.apache.seata.integration.tx.api.remoting.TwoPhaseResult;
import org.apache.seata.rm.tcc.api.BusinessActionContext;
import org.apache.seata.rm.tcc.api.BusinessActionContextUtil;
import org.apache.seata.rm.tcc.utils.MethodUtils;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.jdbc.datasource.DataSourceUtils;
import org.springframework.transaction.TransactionStatus;
import org.springframework.transaction.annotation.Transactional;
import org.springframework.transaction.support.TransactionTemplate;

/**
Expand Down Expand Up @@ -108,7 +117,8 @@ public static void setTransactionTemplate(TransactionTemplate transactionTemplat
*/
@Override
public Object prepareFence(String xid, Long branchId, String actionName, Callback<Object> targetCallback) {
return transactionTemplate.execute(status -> {
TransactionTemplate template = createTransactionTemplateForTransactionalMethod(null);
return template.execute(status -> {
try {
Connection conn = DataSourceUtils.getConnection(dataSource);
boolean result = insertCommonFenceLog(conn, xid, branchId, actionName, CommonFenceConstant.STATUS_TRIED);
Expand Down Expand Up @@ -146,7 +156,8 @@ public Object prepareFence(String xid, Long branchId, String actionName, Callbac
@Override
public boolean commitFence(Method commitMethod, Object targetTCCBean,
String xid, Long branchId, Object[] args) {
return transactionTemplate.execute(status -> {
TransactionTemplate template = createTransactionTemplateForTransactionalMethod(MethodUtils.getTransactionalAnnotationByMethod(commitMethod, targetTCCBean));
return template.execute(status -> {
try {
Connection conn = DataSourceUtils.getConnection(dataSource);
CommonFenceDO commonFenceDO = COMMON_FENCE_DAO.queryCommonFenceDO(conn, xid, branchId);
Expand Down Expand Up @@ -188,7 +199,8 @@ public boolean commitFence(Method commitMethod, Object targetTCCBean,
@Override
public boolean rollbackFence(Method rollbackMethod, Object targetTCCBean,
String xid, Long branchId, Object[] args, String actionName) {
return transactionTemplate.execute(status -> {
TransactionTemplate template = createTransactionTemplateForTransactionalMethod(MethodUtils.getTransactionalAnnotationByMethod(rollbackMethod, targetTCCBean));
return template.execute(status -> {
try {
Connection conn = DataSourceUtils.getConnection(dataSource);
CommonFenceDO commonFenceDO = COMMON_FENCE_DAO.queryCommonFenceDO(conn, xid, branchId);
Expand Down Expand Up @@ -218,6 +230,16 @@ public boolean rollbackFence(Method rollbackMethod, Object targetTCCBean,
return result;
} catch (Throwable t) {
status.setRollbackOnly();
Throwable cause = t.getCause();
if (cause != null && cause instanceof SQLException) {
SQLException sqlException = (SQLException) cause;
String sqlState = sqlException.getSQLState();
int errorCode = sqlException.getErrorCode();
if (Constants.DEAD_LOCK_SQL_STATE.equals(sqlState) && Constants.DEAD_LOCK_ERROR_CODE == errorCode) {
// MySQL deadlock exception
LOGGER.error("Common fence rollback fail. xid: {}, branchId: {}, This exception may be due to the deadlock caused by the transaction isolation level being Repeatable Read. The seata server will try to roll back again, so you can ignore this exception. (To avoid this exception, you can set transaction isolation to Read Committed.)", xid, branchId);
}
}
throw new SkipCallbackWrapperException(t);
}
});
Expand Down Expand Up @@ -353,6 +375,31 @@ private static void addToLogCleanQueue(final String xid, final long branchId) {
}
}

/**
* Creating a transactionTemplate with business transactional attributes
* @param transactional Transactional annotation
* @return
*/
private TransactionTemplate createTransactionTemplateForTransactionalMethod(Transactional transactional) {
Map<String, Object> businessActionContext = Optional.ofNullable(BusinessActionContextUtil.getContext()).map(BusinessActionContext::getActionContext).orElse(null);
if (transactional == null && businessActionContext == null) {
return transactionTemplate;
}
if (transactional != null) {
TransactionTemplate template = new TransactionTemplate(Objects.requireNonNull(transactionTemplate.getTransactionManager()));
template.setIsolationLevel(transactional.isolation().value());
return template;
} else {
boolean containIsolation = businessActionContext.containsKey(Constants.TX_ISOLATION);
if (!containIsolation) {
return transactionTemplate;
}
TransactionTemplate template = new TransactionTemplate(Objects.requireNonNull(transactionTemplate.getTransactionManager()));
template.setIsolationLevel((int) businessActionContext.get(Constants.TX_ISOLATION));
return template;
}
}

/**
* clean fence log that has the final status runnable.
*
Expand Down
10 changes: 10 additions & 0 deletions tcc/src/main/java/org/apache/seata/rm/tcc/TCCResourceManager.java
Original file line number Diff line number Diff line change
Expand Up @@ -119,6 +119,8 @@ public BranchStatus branchCommit(BranchType branchType, String xid, long branchI
applicationData);

Object[] args = this.getTwoPhaseCommitArgs(tccResource, businessActionContext);
//share actionContext implicitly
BusinessActionContextUtil.setContext(businessActionContext);
Object ret;
boolean result;
// add idempotent and anti hanging
Expand Down Expand Up @@ -146,6 +148,9 @@ public BranchStatus branchCommit(BranchType branchType, String xid, long branchI
String msg = String.format("commit TCC resource error, resourceId: %s, xid: %s.", resourceId, xid);
LOGGER.error(msg, ExceptionUtil.unwrap(t));
return BranchStatus.PhaseTwo_CommitFailed_Retryable;
} finally {
// clear the action context
BusinessActionContextUtil.clear();
}
}

Expand Down Expand Up @@ -177,6 +182,8 @@ public BranchStatus branchRollback(BranchType branchType, String xid, long branc
BusinessActionContext businessActionContext = BusinessActionContextUtil.getBusinessActionContext(xid, branchId, resourceId,
applicationData);
Object[] args = this.getTwoPhaseRollbackArgs(tccResource, businessActionContext);
//share actionContext implicitly
BusinessActionContextUtil.setContext(businessActionContext);
Object ret;
boolean result;
// add idempotent and anti hanging
Expand Down Expand Up @@ -205,6 +212,9 @@ public BranchStatus branchRollback(BranchType branchType, String xid, long branc
String msg = String.format("rollback TCC resource error, resourceId: %s, xid: %s.", resourceId, xid);
LOGGER.error(msg, ExceptionUtil.unwrap(t));
return BranchStatus.PhaseTwo_RollbackFailed_Retryable;
} finally {
// clear the action context
BusinessActionContextUtil.clear();
}
}

Expand Down
Loading