TDengine/source/dnode/mnode/impl/src/mndSync.c

195 lines
5.1 KiB
C
Raw Normal View History

2021-12-17 06:20:32 +00:00
/*
* Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
*
* This program is free software: you can use, redistribute, and/or modify
* it under the terms of the GNU Affero General Public License, version 3
* or later ("AGPL"), as published by the Free Software Foundation.
*
* This program is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
#define _DEFAULT_SOURCE
2021-12-25 06:40:43 +00:00
#include "mndSync.h"
2022-01-03 13:36:31 +00:00
#include "mndTrans.h"
2021-12-17 06:20:32 +00:00
2022-01-03 13:36:31 +00:00
/*
 * Open the mnode write-ahead log and remember the handle in the sync manager.
 *
 * The WAL directory is "<pMnode->path><TD_DIRSEP>wal".
 *
 * Returns 0 when walOpen() yields a handle, -1 when it returns NULL.
 */
static int32_t mndInitWal(SMnode *pMnode) {
  /* Fixed WAL settings used by the mnode. */
  SWalCfg walCfg = {
      .vgId = 1,
      .fsyncPeriod = 0,
      .rollPeriod = -1,
      .segSize = -1,
      .retentionPeriod = -1,
      .retentionSize = -1,
      .level = TAOS_WAL_FSYNC,
  };

  char walDir[PATH_MAX] = {0};
  snprintf(walDir, sizeof(walDir), "%s%swal", pMnode->path, TD_DIRSEP);

  pMnode->syncMgmt.pWal = walOpen(walDir, &walCfg);
  return (pMnode->syncMgmt.pWal == NULL) ? -1 : 0;
}
/*
 * Close the WAL handle held by the sync manager, if there is one, and reset
 * the stored pointer to NULL so a second call does nothing.
 */
static void mndCloseWal(SMnode *pMnode) {
  SWal **ppWal = &pMnode->syncMgmt.pWal;
  if (*ppWal == NULL) return;

  walClose(*ppWal);
  *ppWal = NULL;
}
/*
 * Replay WAL entries into the sdb, pull up transactions, and, if the sdb
 * version moved, write the sdb file and commit/snapshot the WAL at that version.
 *
 * Replay starts at max(sdb version + 1, first WAL version) and runs through the
 * last WAL version. Every entry must be exactly one version ahead of the sdb;
 * otherwise terrno is set to TSDB_CODE_SDB_INVALID_WAl_VER and the restore fails.
 *
 * Returns 0 on success and -1 on any failure. Once the read handle has been
 * opened it is closed on every exit path.
 */
static int32_t mndRestoreWal(SMnode *pMnode) {
  SSdb   *pSdb = pMnode->pSdb;
  SWal   *pWal = pMnode->syncMgmt.pWal;
  int64_t startVer = sdbUpdateVer(pSdb, 0); /* delta 0: used here only to read the version */
  int32_t ret = -1;

  SWalReadHandle *pReader = walOpenReadHandle(pWal);
  if (pReader == NULL) return -1;

  int64_t firstVer = walGetFirstVer(pWal);
  int64_t lastVer = walGetLastVer(pWal);
  mDebug("start to restore wal, sdbver:%" PRId64 ", first:%" PRId64 " last:%" PRId64, startVer, firstVer, lastVer);

  /* Skip entries the sdb already contains. */
  firstVer = TMAX(startVer + 1, firstVer);

  for (int64_t walVer = firstVer; walVer >= 0 && walVer <= lastVer; ++walVer) {
    if (walReadWithHandle(pReader, walVer) < 0) {
      mError("ver:%" PRId64 ", failed to read from wal since %s", walVer, terrstr());
      goto _OVER;
    }

    SWalHead *pEntry = pReader->pHead;

    /* The entry being applied must be the immediate successor of the sdb version. */
    int64_t curVer = sdbUpdateVer(pSdb, 0);
    if (curVer + 1 != walVer) {
      terrno = TSDB_CODE_SDB_INVALID_WAl_VER;
      mError("ver:%" PRId64 ", failed to write to sdb, since inconsistent with sdbver:%" PRId64, walVer, curVer);
      goto _OVER;
    }

    mTrace("ver:%" PRId64 ", will be restored, content:%p", walVer, pEntry->head.body);
    if (sdbWriteWithoutFree(pSdb, (void *)pEntry->head.body) < 0) {
      mError("ver:%" PRId64 ", failed to write to sdb since %s", walVer, terrstr());
      goto _OVER;
    }

    /* Advance the sdb version only after the entry was applied. */
    sdbUpdateVer(pSdb, 1);
    mDebug("ver:%" PRId64 ", is restored", walVer);
  }

  int64_t endVer = sdbUpdateVer(pSdb, 0);
  mDebug("restore wal finished, sdbver:%" PRId64, endVer);

  mndTransPullup(pMnode);
  endVer = sdbUpdateVer(pSdb, 0);
  mDebug("pullup trans finished, sdbver:%" PRId64, endVer);

  if (endVer != startVer) {
    mInfo("sdb restored from %" PRId64 " to %" PRId64 ", write file", startVer, endVer);

    /* Short-circuit evaluation keeps the order: write file, commit, begin snapshot, end snapshot. */
    if (sdbWriteFile(pSdb) != 0 || walCommit(pWal, endVer) != 0 || walBeginSnapshot(pWal, endVer) < 0 ||
        walEndSnapshot(pWal) < 0) {
      goto _OVER;
    }
  }

  ret = 0;

_OVER:
  walCloseReadHandle(pReader);
  return ret;
}
/*
 * Initialize the mnode sync manager: create the sync semaphore, open the WAL,
 * and replay it into the sdb.
 *
 * When pMnode->selfId is 1 the sync state is set to TAOS_SYNC_STATE_LEADER;
 * for any other id the state field is left as it was. pSyncNode is reset to NULL.
 *
 * Returns 0 on success, -1 if opening or restoring the WAL fails. No cleanup is
 * performed here on failure.
 */
int32_t mndInitSync(SMnode *pMnode) {
  SSyncMgmt *pSync = &pMnode->syncMgmt;

  tsem_init(&pSync->syncSem, 0, 0);

  if (mndInitWal(pMnode) < 0) {
    mError("failed to open wal since %s", terrstr());
    return -1;
  }

  if (mndRestoreWal(pMnode) < 0) {
    mError("failed to restore wal since %s", terrstr());
    return -1;
  }

  pSync->pSyncNode = NULL;
  if (pMnode->selfId == 1) {
    pSync->state = TAOS_SYNC_STATE_LEADER;
  }

  return 0;
}
/*
 * Tear down the sync manager: destroy the sync semaphore, then close the WAL.
 */
void mndCleanupSync(SMnode *pMnode) {
  tsem_destroy(&pMnode->syncMgmt.syncSem);
  mndCloseWal(pMnode);
}
/*
 * Sync apply callback. pData is the SMnode; fsm, index and buf are not used.
 * Clears the sync manager's error code and posts the sync semaphore.
 * Always returns 0.
 */
static int32_t mndSyncApplyCb(struct SSyncFSM *fsm, SyncIndex index, const SSyncBuffer *buf, void *pData) {
  SMnode *pMnode = pData;

  pMnode->syncMgmt.errCode = 0;
  tsem_post(&pMnode->syncMgmt.syncSem);
  return 0;
}
2021-12-17 06:20:32 +00:00
/*
 * Append a raw sdb record to the WAL under the next sdb version, then commit
 * and fsync the WAL.
 *
 * The sdb version is bumped before the write and rolled back by one if
 * walWrite() fails. The results of walCommit() and walFsync() are not checked.
 *
 * Returns 0 on success, -1 if the WAL write fails. The replication path in the
 * #else branch is currently compiled out.
 */
int32_t mndSyncPropose(SMnode *pMnode, SSdbRaw *pRaw) {
  SSdb   *pSdb = pMnode->pSdb;
  SWal   *pWal = pMnode->syncMgmt.pWal;
  int64_t newVer = sdbUpdateVer(pSdb, 1);

  if (walWrite(pWal, newVer, 1, pRaw, sdbGetRawTotalSize(pRaw)) < 0) {
    /* Undo the version bump taken above. */
    sdbUpdateVer(pSdb, -1);
    mError("ver:%" PRId64 ", failed to write raw:%p to wal since %s", newVer, pRaw, terrstr());
    return -1;
  }

  mTrace("ver:%" PRId64 ", write to wal, raw:%p", newVer, pRaw);
  walCommit(pWal, newVer);
  walFsync(pWal, true);

#if 1
  return 0;
#else
  if (pMnode->replica == 1) return 0;

  SSyncMgmt *pMgmt = &pMnode->syncMgmt;
  pMgmt->errCode = 0;

  SSyncBuffer buf = {.data = pRaw, .len = sdbGetRawTotalSize(pRaw)};

  bool    isWeak = false;
  int32_t code = syncPropose(pMgmt->pSyncNode, &buf, pMnode, isWeak);

  if (code != 0) return code;

  tsem_wait(&pMgmt->syncSem);
  return pMgmt->errCode;
#endif
}
2021-12-23 06:47:46 +00:00
/*
 * Report whether this mnode's sync state is TAOS_SYNC_STATE_LEADER.
 */
bool mndIsMaster(SMnode *pMnode) {
  return pMnode->syncMgmt.state == TAOS_SYNC_STATE_LEADER;
}