TDengine/source/libs/executor/src/scanoperator.c

4698 lines
166 KiB
C
Raw Normal View History

2022-04-04 06:54:39 +00:00
/*
* Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
*
* This program is free software: you can use, redistribute, and/or modify
* it under the terms of the GNU Affero General Public License, version 3
* or later ("AGPL"), as published by the Free Software Foundation.
*
* This program is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
2023-04-28 03:42:34 +00:00
#include "executorInt.h"
2022-08-05 09:40:40 +00:00
#include "filter.h"
2022-05-26 08:29:52 +00:00
#include "function.h"
#include "functionMgt.h"
2022-08-16 04:11:56 +00:00
#include "os.h"
2022-04-04 06:54:39 +00:00
#include "querynodes.h"
2024-05-16 08:24:58 +00:00
#include "streamexecutorInt.h"
2024-07-19 08:15:37 +00:00
#include "systable.h"
2022-04-04 06:54:39 +00:00
#include "tname.h"
#include "tdatablock.h"
#include "tmsg.h"
2024-10-16 04:16:59 +00:00
#include "ttime.h"
2022-04-04 06:54:39 +00:00
2024-07-19 08:15:37 +00:00
#include "operator.h"
2022-04-04 06:54:39 +00:00
#include "query.h"
2024-07-19 08:15:37 +00:00
#include "querytask.h"
2022-04-04 06:54:39 +00:00
#include "tcompare.h"
#include "thash.h"
#include "ttypes.h"
#include "storageapi.h"
#include "wal.h"
2025-04-19 02:26:32 +00:00
#include "function.h"
2023-03-28 09:40:46 +00:00
int32_t scanDebug = 0;
2024-07-19 08:15:37 +00:00
// NOTE(review): presumably the table-count threshold for multi-reader scans; the use site is not in this part of the file.
#define MULTI_READER_MAX_TABLE_NUM 5000
// Set the scanFlag field of a scan-info object to REVERSE_SCAN.
#define SET_REVERSE_SCAN_FLAG(_info) ((_info)->scanFlag = REVERSE_SCAN)
// Toggle an order lvalue in place between TSDB_ORDER_ASC and TSDB_ORDER_DESC.
// The argument is evaluated more than once, so it must be free of side effects.
#define SWITCH_ORDER(n) (((n) = ((n) == TSDB_ORDER_ASC) ? TSDB_ORDER_DESC : TSDB_ORDER_ASC))
// Name strings associated with the stream scan operator (operator, fill-history state, checkpoint).
#define STREAM_SCAN_OP_NAME "StreamScanOperator"
#define STREAM_SCAN_OP_STATE_NAME "StreamScanFillHistoryState"
#define STREAM_SCAN_OP_CHECKPOINT_NAME "StreamScanOperator_Checkpoint"
2022-04-06 09:59:08 +00:00
2022-11-04 10:46:48 +00:00
// Execution statistics bundle for the table merge scan: block-load counters plus sort statistics.
typedef struct STableMergeScanExecInfo {
// file block load counters (same recorder type that loadDataBlock updates for plain table scans)
SFileBlockLoadRecorder blockRecorder;
// statistics of the sort stage
SSortExecInfo sortExecInfo;
} STableMergeScanExecInfo;
// Per-source parameter handed to the sort stage of the table merge scan.
// NOTE(review): field meanings below are inferred from names/types; confirm against the merge-scan code.
typedef struct STableMergeScanSortSourceParam {
  SOperatorInfo* pOperator;  // operator this sort source belongs to
  int32_t        readerIdx;  // index of the reader used by this source
  uint64_t       uid;        // table uid associated with this source
  STsdbReader*   reader;     // tsdb reader handle
} STableMergeScanSortSourceParam;
2023-04-03 09:47:48 +00:00
// Runtime state of the table-count scan operator.
typedef struct STableCountScanOperatorInfo {
// handle used to reach the underlying storage/meta APIs
SReadHandle readHandle;
// result block
SSDataBlock* pRes;
STableCountScanSupp supp;
// NOTE(review): presumably the index of the group currently being emitted; confirm in doTableCountScanNext
int32_t currGrpIdx;
SArray* stbUidList; // when group by db_name and/or stable_name
} STableCountScanOperatorInfo;
// Forward declaration (internal linkage); the definition follows below in this file.
static bool processBlockWithProbability(const SSampleExecInfo* pInfo);
2024-08-27 09:04:44 +00:00
// Forward declaration of a file-local function; it returns a status code and hands its result block back through ppRes.
static int32_t doTableCountScanNext(SOperatorInfo* pOperator, SSDataBlock** ppRes);
2022-11-04 14:13:40 +00:00
/**
 * Decide whether the current block should be processed under sampling.
 *
 * The sampling logic is compiled out, so every block is accepted and pInfo is not read.
 *
 * @param pInfo  sampling parameters (only used by the disabled code path)
 * @return always true in the current build configuration
 */
bool processBlockWithProbability(const SSampleExecInfo* pInfo) {
#if 0
  // disabled: accept a block with probability `sampleRatio`
  if (pInfo->sampleRatio == 1) {
    return true;
  }

  uint32_t val = taosRandR((uint32_t*) &pInfo->seed);
  return (val % ((uint32_t)(1/pInfo->sampleRatio))) == 0;
#endif
  return true;
}
2022-05-03 15:23:49 +00:00
/**
 * Flip the scan order (ASC <-> DESC) stored in each of the first numOfOutput function contexts.
 *
 * @param pCtx         array of function contexts
 * @param numOfOutput  number of contexts to update; nothing happens when it is <= 0
 */
static void switchCtxOrder(SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  int32_t idx = 0;
  while (idx < numOfOutput) {
    SWITCH_ORDER(pCtx[idx].order);
    idx += 1;
  }
}
2024-08-06 10:10:46 +00:00
/**
 * Check whether a data block's time range straddles an interval-window boundary.
 *
 * Starting from the window aligned to the block's first key (ascending) or last key (descending),
 * windows are walked in scan order until they leave the block's range. The block "overlaps" when
 * it is not fully contained in a single window.
 *
 * @param pInterval   interval definition; interval == 0 means the upstream operator is not an interval operator
 * @param pBlockInfo  block whose [window.skey, window.ekey] range is tested
 * @param order       TSDB_ORDER_ASC for ascending; any other value takes the descending branch
 * @param overlap     [out] true when the block spans more than one window; only written on success
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR when a computed window violates
 *         the expected ordering invariants
 */
static int32_t overlapWithTimeWindow(SInterval* pInterval, SDataBlockInfo* pBlockInfo, int32_t order, bool* overlap) {
  int32_t     code = TSDB_CODE_SUCCESS;
  STimeWindow w = {0};

  // 0 by default, which means the upstream operator is not an interval operator.
  if (pInterval->interval == 0) {
    *overlap = false;
    return code;
  }

  if (order == TSDB_ORDER_ASC) {
    w = getAlignQueryTimeWindow(pInterval, pBlockInfo->window.skey);
    if (w.ekey < pBlockInfo->window.skey) {
      qError("w.ekey:%" PRId64 " < pBlockInfo->window.skey:%" PRId64, w.ekey, pBlockInfo->window.skey);
      return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
    }

    // the first window ends inside the block, so the block continues into the next window
    if (w.ekey < pBlockInfo->window.ekey) {
      *overlap = true;
      return code;
    }

    while (1) {
      getNextTimeWindow(pInterval, &w, order);
      if (w.skey > pBlockInfo->window.ekey) {
        break;
      }

      if (w.ekey <= pBlockInfo->window.ekey) {
        qError("w.ekey:%" PRId64 " <= pBlockInfo->window.ekey:%" PRId64, w.ekey, pBlockInfo->window.ekey);
        return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
      }

      if (TMAX(w.skey, pBlockInfo->window.skey) <= pBlockInfo->window.ekey) {
        *overlap = true;
        return code;
      }
    }
  } else {
    w = getAlignQueryTimeWindow(pInterval, pBlockInfo->window.ekey);
    if (w.skey > pBlockInfo->window.ekey) {
      // the message now names the field that is actually compared and printed (window.ekey)
      qError("w.skey:%" PRId64 " > pBlockInfo->window.ekey:%" PRId64, w.skey, pBlockInfo->window.ekey);
      return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
    }

    // the first window starts inside the block, so the block continues into the previous window
    if (w.skey > pBlockInfo->window.skey) {
      *overlap = true;
      return code;
    }

    while (1) {
      getNextTimeWindow(pInterval, &w, order);
      if (w.ekey < pBlockInfo->window.skey) {
        break;
      }

      if (w.skey >= pBlockInfo->window.skey) {
        qError("w.skey:%" PRId64 " >= pBlockInfo->window.skey:%" PRId64, w.skey, pBlockInfo->window.skey);
        return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
      }

      if (pBlockInfo->window.skey <= TMIN(w.ekey, pBlockInfo->window.ekey)) {
        *overlap = true;
        return code;
      }
    }
  }

  *overlap = false;
  return code;
}
// this function is for table scanner to extract temporary results of upstream aggregate results.
/**
 * Look up the upstream aggregate's temporary result row for a group, on behalf of the table scanner.
 *
 * @param pOperator  operator to inspect; anything other than a table scan yields NULL
 * @param groupId    group whose result row is wanted
 * @param pPage      [out] buffer page holding the row; written only once a hash entry was found,
 *                   and may then be NULL if the page could not be obtained. On success the caller
 *                   releases it with releaseBufPage (see doDynamicPruneDataBlock).
 * @return pointer to the result row inside *pPage, or NULL when unavailable
 */
static SResultRow* getTableGroupOutputBuf(SOperatorInfo* pOperator, uint64_t groupId, SFilePage** pPage) {
  if (pOperator->operatorType != QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN) {
    return NULL;
  }

  // build the hash key for this group
  int64_t key[2] = {0};
  SET_RES_WINDOW_KEY((char*)key, &groupId, sizeof(groupId), groupId);

  STableScanInfo*     pScan = pOperator->info;
  SResultRowPosition* pPos = (SResultRowPosition*)tSimpleHashGet(pScan->base.pdInfo.pAggSup->pResultRowHashTable, key,
                                                                 GET_RES_WINDOW_KEY_LEN(sizeof(groupId)));
  if (pPos == NULL) {
    return NULL;
  }

  *pPage = getBufPage(pScan->base.pdInfo.pAggSup->pResultBuf, pPos->pageId);
  return (*pPage == NULL) ? NULL : (SResultRow*)((char*)(*pPage) + pPos->offset);
}
/**
 * Record a table uid in the scan's ignore set, creating the set on first use.
 *
 * The value stored under the uid is the current scanTimes. An already-present uid
 * (TSDB_CODE_DUP_KEY) is not treated as an error.
 *
 * @return TSDB_CODE_SUCCESS, terrno when the hash cannot be created, or the taosHashPut error code
 */
static int32_t insertTableToScanIgnoreList(STableScanInfo* pTableScanInfo, uint64_t uid) {
  if (pTableScanInfo->pIgnoreTables == NULL) {
    // size the hash by the number of tables in the scan list
    int32_t numOfTables = taosArrayGetSize(pTableScanInfo->base.pTableListInfo->pTableList);
    pTableScanInfo->pIgnoreTables =
        taosHashInit(numOfTables, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), true, HASH_NO_LOCK);
    if (pTableScanInfo->pIgnoreTables == NULL) {
      return terrno;
    }
  }

  int32_t putRes = taosHashPut(pTableScanInfo->pIgnoreTables, &uid, sizeof(uid), &pTableScanInfo->scanTimes,
                               sizeof(pTableScanInfo->scanTimes));
  if (putRes == TSDB_CODE_SUCCESS || putRes == TSDB_CODE_DUP_KEY) {
    return TSDB_CODE_SUCCESS;
  }

  qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(putRes));
  return putRes;
}
/**
 * Use the upstream aggregate's intermediate results to decide whether a block can be skipped.
 *
 * Every pushed-down function is asked, via fmFuncDynDataRequired, whether it still needs this
 * block. If none does, *status becomes FUNC_DATA_REQUIRED_NOT_LOAD and the block's table is added
 * to the ignore list. *status is left untouched in all other cases.
 *
 * @return TSDB_CODE_SUCCESS, or the error from insertTableToScanIgnoreList
 */
static int32_t doDynamicPruneDataBlock(SOperatorInfo* pOperator, SDataBlockInfo* pBlockInfo, uint32_t* status) {
  STableScanInfo* pScan = pOperator->info;
  SExprSupp*      pSup = pScan->base.pdInfo.pExprSup;

  // nothing was pushed down: no pruning possible
  if (pSup == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  SFilePage*  pPage = NULL;
  SResultRow* pRow = getTableGroupOutputBuf(pOperator, pBlockInfo->id.groupId, &pPage);
  if (pRow == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  // stop at the first function that still requires the block
  int32_t idx = 0;
  for (; idx < pSup->numOfExprs; ++idx) {
    SResultRowEntryInfo* pEntry = getResultEntryInfo(pRow, idx, pSup->rowEntryInfoOffset);
    if (fmFuncDynDataRequired(pSup->pCtx[idx].functionId, pEntry, pBlockInfo) != FUNC_DATA_REQUIRED_NOT_LOAD) {
      break;
    }
  }
  bool skipBlock = (idx >= pSup->numOfExprs);

  // release buffer pages
  releaseBufPage(pScan->base.pdInfo.pAggSup->pResultBuf, pPage);

  if (!skipBlock) {
    return TSDB_CODE_SUCCESS;
  }

  *status = FUNC_DATA_REQUIRED_NOT_LOAD;
  return insertTableToScanIgnoreList(pScan, pBlockInfo->id.uid);
}
/**
 * Evaluate the filter against block-level aggregates (SMA) to see if the block can be dropped.
 *
 * @param keep  [out] false when the filter proves no row can match; set to true when either the
 *              aggregates or the filter are missing, since nothing can be proven then
 * @return TSDB_CODE_SUCCESS or the error from filterRangeExecute
 */
static int32_t doFilterByBlockSMA(SFilterInfo* pFilterInfo, SColumnDataAgg* pColsAgg, int32_t numOfCols,
                                  int32_t numOfRows, bool* keep) {
  if (pColsAgg != NULL && pFilterInfo != NULL) {
    return filterRangeExecute(pFilterInfo, pColsAgg, numOfCols, numOfRows, keep);
  }

  *keep = true;
  return TSDB_CODE_SUCCESS;
}
/**
 * Retrieve the block-level aggregate (SMA) information for the current block from the reader.
 *
 * @param pTableScanInfo  scan state owning the data reader
 * @param pBlock          block that receives the SMA information
 * @param pTaskInfo       task providing the storage API
 * @param pLoad           [out, optional] true only when every column has SMA data and no SMA entry
 *                        is NULL; false otherwise, including on failure. May be NULL.
 * @return TSDB_CODE_SUCCESS or the reader's error code
 */
static int32_t doLoadBlockSMA(STableScanBase* pTableScanInfo, SSDataBlock* pBlock, SExecTaskInfo* pTaskInfo,
                              bool* pLoad) {
  SStorageAPI* pAPI = &pTaskInfo->storageAPI;
  bool         allColumnsHaveAgg = true;
  bool         hasNullSMA = false;

  if (pLoad != NULL) {
    *pLoad = false;
  }

  int32_t code = pAPI->tsdReader.tsdReaderRetrieveBlockSMAInfo(pTableScanInfo->dataReader, pBlock, &allColumnsHaveAgg,
                                                               &hasNullSMA);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  // pLoad is optional: guard the final write exactly like the initial reset above
  if (pLoad != NULL) {
    *pLoad = allColumnsHaveAgg && !hasNullSMA;
  }

  return code;
}
/**
 * Fill the tag / pseudo columns of a block when the scan has pseudo-column expressions.
 *
 * TSDB_CODE_PAR_TABLE_NOT_EXIST is swallowed because the table may have been dropped while the
 * scan was running; for tasks with a stream state the block is additionally cleaned up.
 *
 * @return 0 on success or when the table no longer exists, otherwise the error from
 *         addTagPseudoColumnData
 */
static int32_t doSetTagColumnData(STableScanBase* pTableScanInfo, SSDataBlock* pBlock, SExecTaskInfo* pTaskInfo,
                                  int32_t rows) {
  SExprSupp* pPseudo = &pTableScanInfo->pseudoSup;
  if (pPseudo->numOfExprs <= 0) {
    return 0;
  }

  int32_t code = addTagPseudoColumnData(&pTableScanInfo->readHandle, pPseudo->pExprInfo, pPseudo->numOfExprs, pBlock,
                                        rows, pTaskInfo, &pTableScanInfo->metaCache);
  if (code != TSDB_CODE_PAR_TABLE_NOT_EXIST) {
    return code;
  }

  // ignore the table not exists error, since this table may have been dropped during the scan procedure.
  if (pTaskInfo->streamInfo.pState) {
    blockDataCleanup(pBlock);
  }
  return 0;
}
2023-01-20 10:08:34 +00:00
/**
 * Apply the remaining OFFSET and the LIMIT to a result block in place.
 *
 * OFFSET is consumed first: a block that lies entirely within the remaining offset is emptied and
 * the function returns false; otherwise the leading rows are trimmed. LIMIT is then enforced by
 * keeping only as many rows as are still allowed.
 *
 * A failure while trimming rows is stored in pTaskInfo->code and raised through T_LONG_JMP.
 *
 * @return true when the output limit has been reached with this block, false otherwise
 */
bool applyLimitOffset(SLimitInfo* pLimitInfo, SSDataBlock* pBlock, SExecTaskInfo* pTaskInfo) {
  const char* id = GET_TASKID(pTaskInfo);
  SLimit*     pLimit = &pLimitInfo->limit;

  if (pLimitInfo->remainOffset > 0) {
    if (pLimitInfo->remainOffset >= pBlock->info.rows) {
      // the whole block is swallowed by the offset
      pLimitInfo->remainOffset -= pBlock->info.rows;
      blockDataEmpty(pBlock);
      qDebug("current block ignore due to offset, current:%" PRId64 ", %s", pLimitInfo->remainOffset, id);
      return false;
    }

    int32_t code = blockDataTrimFirstRows(pBlock, pLimitInfo->remainOffset);
    if (code != TSDB_CODE_SUCCESS) {
      qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(code));
      pTaskInfo->code = code;
      T_LONG_JMP(pTaskInfo->env, code);
    }
    pLimitInfo->remainOffset = 0;
  }

  bool limitHit = (pLimit->limit != -1) && (pLimit->limit <= (pLimitInfo->numOfOutputRows + pBlock->info.rows));
  if (limitHit) {
    // limit the output rows
    int32_t keep = (int32_t)(pLimit->limit - pLimitInfo->numOfOutputRows);
    blockDataKeepFirstNRows(pBlock, keep);
  }

  pLimitInfo->numOfOutputRows += pBlock->info.rows;

  if (limitHit) {
    qDebug("output limit %" PRId64 " has reached, %s", pLimit->limit, id);
  }
  return limitHit;
}
// True when the operator runs as a dynamic task and its table-scan info is flagged as a virtual
// super-table scan. pOperator->info is read as STableScanInfo only for dynamic tasks.
static bool isDynVtbScan(SOperatorInfo* pOperator) {
  if (!pOperator->dynamicTask) {
    return false;
  }

  STableScanInfo* pScanInfo = (STableScanInfo*)(pOperator->info);
  return pScanInfo->virtualStableScan ? true : false;
}
2022-11-18 01:47:26 +00:00
/**
 * Decide how the reader's current block has to be materialized and load it accordingly.
 *
 * The requirement starts from pTableScanInfo->dataBlockLoadFlag and is upgraded to a full data load
 * when a filter is attached or when the block spans several interval windows. Depending on the
 * final requirement the block is:
 *   - dropped (FUNC_DATA_REQUIRED_FILTEROUT),
 *   - skipped with only tag columns filled (FUNC_DATA_REQUIRED_NOT_LOAD),
 *   - answered from block SMA (FUNC_DATA_REQUIRED_SMA_LOAD, falling back to a data load when SMA
 *     is not available for all columns),
 *   - or fully loaded, after trying to discard it via SMA-based filtering and dynamic pruning.
 * A fully loaded block then gets its tag columns, the row filter and limit/offset applied.
 *
 * @param pOperator       scan operator (filter info, task info, operator type)
 * @param pTableScanInfo  scan state: reader, cost recorder, limit info, pseudo columns
 * @param pBlock          block being loaded; its pBlockAgg is released by this function
 * @param status          [out] final load requirement. FUNC_DATA_REQUIRED_FILTEROUT and
 *                        FUNC_DATA_REQUIRED_ALL_FILTEROUT tell the caller the block carries no data.
 * @return TSDB_CODE_SUCCESS or an error code
 */
static int32_t loadDataBlock(SOperatorInfo* pOperator, STableScanBase* pTableScanInfo, SSDataBlock* pBlock,
                             uint32_t* status) {
  int32_t                 code = TSDB_CODE_SUCCESS;
  int32_t                 lino = 0;
  SExecTaskInfo*          pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*            pAPI = &pTaskInfo->storageAPI;
  bool                    loadSMA = false;
  SFileBlockLoadRecorder* pCost = &pTableScanInfo->readRecorder;

  pCost->totalBlocks += 1;
  pCost->totalRows += pBlock->info.rows;
  *status = pTableScanInfo->dataBlockLoadFlag;

  if (pOperator->exprSupp.pFilterInfo != NULL) {
    // a row filter needs the actual data
    (*status) = FUNC_DATA_REQUIRED_DATA_LOAD;
  } else {
    bool overlap = false;
    int  ret =
        overlapWithTimeWindow(&pTableScanInfo->pdInfo.interval, &pBlock->info, pTableScanInfo->cond.order, &overlap);
    if (ret != TSDB_CODE_SUCCESS) {
      return ret;
    }

    // a block spanning several windows cannot be answered from block-level statistics
    if (overlap) {
      (*status) = FUNC_DATA_REQUIRED_DATA_LOAD;
    }
  }

  SDataBlockInfo* pBlockInfo = &pBlock->info;
  taosMemoryFreeClear(pBlock->pBlockAgg);

  if (*status == FUNC_DATA_REQUIRED_FILTEROUT) {
    qDebug("%s data block filter out, brange:%" PRId64 "-%" PRId64 ", rows:%" PRId64, GET_TASKID(pTaskInfo),
           pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
    pCost->filterOutBlocks += 1;
    // NOTE(review): totalRows was already increased for this block above; confirm the second add is intended
    pCost->totalRows += pBlock->info.rows;
    pAPI->tsdReader.tsdReaderReleaseDataBlock(pTableScanInfo->dataReader);
    return TSDB_CODE_SUCCESS;
  } else if (*status == FUNC_DATA_REQUIRED_NOT_LOAD) {
    qDebug("%s data block skipped, brange:%" PRId64 "-%" PRId64 ", rows:%" PRId64 ", uid:%" PRIu64,
           GET_TASKID(pTaskInfo), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows,
           pBlockInfo->id.uid);
    code = doSetTagColumnData(pTableScanInfo, pBlock, pTaskInfo, pBlock->info.rows);
    pCost->skipBlocks += 1;
    pAPI->tsdReader.tsdReaderReleaseDataBlock(pTableScanInfo->dataReader);
    return code;
  } else if (*status == FUNC_DATA_REQUIRED_SMA_LOAD) {
    pCost->loadBlockStatis += 1;
    loadSMA = true;  // mark the operation of load sma;
    bool success = true;
    code = doLoadBlockSMA(pTableScanInfo, pBlock, pTaskInfo, &success);
    if (code) {
      pAPI->tsdReader.tsdReaderReleaseDataBlock(pTableScanInfo->dataReader);
      qError("%s failed to retrieve sma info", GET_TASKID(pTaskInfo));
      QUERY_CHECK_CODE(code, lino, _end);
    }

    if (success) {
      // block SMA is available for all columns: the statistics are enough, no data load needed
      qDebug("%s data block SMA loaded, brange:%" PRId64 "-%" PRId64 ", rows:%" PRId64, GET_TASKID(pTaskInfo),
             pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
      code = doSetTagColumnData(pTableScanInfo, pBlock, pTaskInfo, pBlock->info.rows);
      pAPI->tsdReader.tsdReaderReleaseDataBlock(pTableScanInfo->dataReader);
      return code;
    } else {
      // block statistics do not exist for every column, load the data block instead
      qDebug("%s failed to load SMA, since not all columns have SMA", GET_TASKID(pTaskInfo));
      *status = FUNC_DATA_REQUIRED_DATA_LOAD;
    }
  }

  if (*status != FUNC_DATA_REQUIRED_DATA_LOAD) {
    pAPI->tsdReader.tsdReaderReleaseDataBlock(pTableScanInfo->dataReader);
    qError("%s loadDataBlock invalid status:%d", GET_TASKID(pTaskInfo), *status);
    return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
  }

  // try to filter data block according to sma info
  if (pOperator->exprSupp.pFilterInfo != NULL && (!loadSMA)) {
    bool success = true;
    code = doLoadBlockSMA(pTableScanInfo, pBlock, pTaskInfo, &success);
    if (code) {
      pAPI->tsdReader.tsdReaderReleaseDataBlock(pTableScanInfo->dataReader);
      qError("%s failed to retrieve sma info", GET_TASKID(pTaskInfo));
      QUERY_CHECK_CODE(code, lino, _end);
    }

    if (success) {
      size_t size = taosArrayGetSize(pBlock->pDataBlock);
      bool   keep = false;
      code = doFilterByBlockSMA(pOperator->exprSupp.pFilterInfo, pBlock->pBlockAgg, size, pBlockInfo->rows, &keep);
      if (code) {
        pAPI->tsdReader.tsdReaderReleaseDataBlock(pTableScanInfo->dataReader);
        qError("%s failed to do filter by block sma, code:%s", GET_TASKID(pTaskInfo), tstrerror(code));
        QUERY_CHECK_CODE(code, lino, _end);
      }

      if (!keep) {
        qDebug("%s data block filter out by block SMA, brange:%" PRId64 "-%" PRId64 ", rows:%" PRId64,
               GET_TASKID(pTaskInfo), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
        pCost->filterOutBlocks += 1;
        (*status) = FUNC_DATA_REQUIRED_FILTEROUT;
        taosMemoryFreeClear(pBlock->pBlockAgg);

        pAPI->tsdReader.tsdReaderReleaseDataBlock(pTableScanInfo->dataReader);
        return TSDB_CODE_SUCCESS;
      }
    }
  }

  // free the sma info, since it should not be involved in *later computing process.
  taosMemoryFreeClear(pBlock->pBlockAgg);

  // try to filter data block according to current results
  code = doDynamicPruneDataBlock(pOperator, pBlockInfo, status);
  if (code) {
    pAPI->tsdReader.tsdReaderReleaseDataBlock(pTableScanInfo->dataReader);
    QUERY_CHECK_CODE(code, lino, _end);
  }

  if (*status == FUNC_DATA_REQUIRED_NOT_LOAD) {
    qDebug("%s data block skipped due to dynamic prune, brange:%" PRId64 "-%" PRId64 ", rows:%" PRId64,
           GET_TASKID(pTaskInfo), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
    pCost->skipBlocks += 1;
    pAPI->tsdReader.tsdReaderReleaseDataBlock(pTableScanInfo->dataReader);

    // once every table of the scan is in the ignore list, report that everything is filtered out
    STableScanInfo* p1 = pOperator->info;
    if (taosHashGetSize(p1->pIgnoreTables) == taosArrayGetSize(p1->base.pTableListInfo->pTableList)) {
      *status = FUNC_DATA_REQUIRED_ALL_FILTEROUT;
    } else {
      *status = FUNC_DATA_REQUIRED_FILTEROUT;
    }
    return TSDB_CODE_SUCCESS;
  }

  pCost->totalCheckedRows += pBlock->info.rows;
  pCost->loadBlocks += 1;

  SSDataBlock* p = NULL;
  code = pAPI->tsdReader.tsdReaderRetrieveDataBlock(pTableScanInfo->dataReader, &p, NULL);
  if (p == NULL || code != TSDB_CODE_SUCCESS || p != pBlock) {
    return code;
  }

  if ((pOperator->operatorType == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN) &&
      ((STableScanInfo*)pOperator->info)->ignoreTag) {
    // do nothing
  } else {
    // dyn vtb scan do not read tag from origin tables.
    code = doSetTagColumnData(pTableScanInfo, pBlock, pTaskInfo, pBlock->info.rows);
    if (code) {
      return code;
    }
  }

  // restore the previous value
  pCost->totalRows -= pBlock->info.rows;

  if (pOperator->exprSupp.pFilterInfo != NULL) {
    // start the timer BEFORE filtering so that the elapsed time covers doFilter itself
    int64_t st = taosGetTimestampUs();
    code = doFilter(pBlock, pOperator->exprSupp.pFilterInfo, &pTableScanInfo->matchInfo);
    QUERY_CHECK_CODE(code, lino, _end);

    double el = (taosGetTimestampUs() - st) / 1000.0;
    pTableScanInfo->readRecorder.filterTime += el;

    if (pBlock->info.rows == 0) {
      pCost->filterOutBlocks += 1;
      qDebug("%s data block filter out, brange:%" PRId64 "-%" PRId64 ", rows:%" PRId64 ", elapsed time:%.2f ms",
             GET_TASKID(pTaskInfo), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, el);
    } else {
      qDebug("%s data block filter applied, elapsed time:%.2f ms", GET_TASKID(pTaskInfo), el);
    }
  }

  bool limitReached = applyLimitOffset(&pTableScanInfo->limitInfo, pBlock, pTaskInfo);
  if (limitReached) {  // set operator flag is done
    setOperatorCompleted(pOperator);
  }

  pCost->totalRows += pBlock->info.rows;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2022-11-18 01:47:26 +00:00
/**
 * Switch a table scan into descending mode: set the reverse-scan flag, flip the order of every
 * function context, force the query order to DESC and swap the query time window's bounds.
 */
static void prepareForDescendingScan(STableScanBase* pTableScanInfo, SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  SET_REVERSE_SCAN_FLAG(pTableScanInfo);
  switchCtxOrder(pCtx, numOfOutput);

  pTableScanInfo->cond.order = TSDB_ORDER_DESC;

  // the window bounds are exchanged for the reverse pass
  TSWAP(pTableScanInfo->cond.twindows.skey, pTableScanInfo->cond.twindows.ekey);
}
// Table meta entry kept in the scan's LRU meta cache: the table name and its tag data.
// When created by createTableCacheVal both members are heap copies owned by the entry.
typedef struct STableCachedVal {
// table name
const char* pName;
// tag data; createTableCacheVal leaves this NULL unless the table is a (virtual) child table
STag* pTags;
} STableCachedVal;
2022-11-07 03:53:23 +00:00
// Release a heap-allocated STableCachedVal together with its name and tag buffers. NULL is a no-op.
static void freeTableCachedVal(void* param) {
  STableCachedVal* pCached = param;
  if (pCached != NULL) {
    taosMemoryFree((void*)pCached->pName);
    taosMemoryFree(pCached->pTags);
    taosMemoryFree(pCached);
  }
}
2024-08-12 10:21:35 +00:00
/**
 * Build a heap-allocated cache entry (name + tags) from the table entry held by a meta reader.
 *
 * @param pMetaReader  reader positioned on the table entry
 * @param ppResVal     [out] receives the new entry on success; left untouched on failure
 * @return TSDB_CODE_SUCCESS, or the allocation error (terrno); a partially built entry is freed
 */
static int32_t createTableCacheVal(const SMetaReader* pMetaReader, STableCachedVal** ppResVal) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;

  STableCachedVal* pEntry = taosMemoryMalloc(sizeof(STableCachedVal));
  QUERY_CHECK_NULL(pEntry, code, lino, _end, terrno);

  // clear pTags first so the error path can free the entry safely
  pEntry->pTags = NULL;
  pEntry->pName = taosStrdup(pMetaReader->me.name);
  QUERY_CHECK_NULL(pEntry->pName, code, lino, _end, terrno);

  // only child table has tag value
  bool hasTags = (pMetaReader->me.type == TSDB_CHILD_TABLE) || (pMetaReader->me.type == TSDB_VIRTUAL_CHILD_TABLE);
  if (hasTags) {
    STag* pSrcTag = (STag*)pMetaReader->me.ctbEntry.pTags;
    pEntry->pTags = taosMemoryMalloc(pSrcTag->len);
    QUERY_CHECK_NULL(pEntry->pTags, code, lino, _end, terrno);
    memcpy(pEntry->pTags, pSrcTag, pSrcTag->len);
  }

  (*ppResVal) = pEntry;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    freeTableCachedVal(pEntry);
  }
  return code;
}
// const void *key, size_t keyLen, void *value
2023-06-26 10:43:00 +00:00
// LRU-cache deleter for table meta entries: only the value is released, the key and the user data
// are not used.
static void freeCachedMetaItem(const void* key, size_t keyLen, void* value, void* ud) {
  (void)ud;
  (void)keyLen;
  (void)key;

  freeTableCachedVal(value);
}
2022-11-07 03:53:23 +00:00
// Mark rows [0, pBlock->info.rows) as NULL in the destination column of every expression.
static void doSetNullValue(SSDataBlock* pBlock, const SExprInfo* pExpr, int32_t numOfExpr) {
  int32_t idx = 0;
  while (idx < numOfExpr) {
    SColumnInfoData* pDstCol = taosArrayGet(pBlock->pDataBlock, pExpr[idx].base.resSchema.slotId);
    colDataSetNNULL(pDstCol, 0, pBlock->info.rows);
    ++idx;
  }
}
2024-08-13 06:35:49 +00:00
// Release the buffers owned by a cached value; the STableCachedVal object itself is not freed.
static void freeTableCachedValObj(STableCachedVal* pVal) {
  void* pNameBuf = (void*)pVal->pName;
  taosMemoryFree(pNameBuf);
  taosMemoryFree(pVal->pTags);
}
/**
 * Fill the tag columns and scan pseudo columns (tbname, vgId, vgVer) of a block.
 *
 * The table's name and tags are fetched through the meta reader, or through the LRU meta cache
 * when pCache is given. A cache miss builds a new entry that is inserted into the cache before
 * returning. While the columns are filled, pBlock->info.rows is temporarily replaced by `rows`;
 * the original value is put back on every exit path.
 *
 * @param pHandle    read handle giving access to the meta APIs
 * @param pExpr      pseudo/tag column expressions
 * @param numOfExpr  number of expressions; <= 0 makes the call a no-op
 * @param pBlock     block whose destination columns are filled
 * @param rows       number of rows to fill
 * @param pTask      task (id string and vgId)
 * @param pCache     optional table meta cache; NULL reads the meta entry directly
 * @return TSDB_CODE_SUCCESS or an error code. For TSDB_CODE_PAR_TABLE_NOT_EXIST the destination
 *         columns have been set to NULL first, because callers may ignore that error and proceed.
 */
int32_t addTagPseudoColumnData(SReadHandle* pHandle, const SExprInfo* pExpr, int32_t numOfExpr, SSDataBlock* pBlock,
                               int32_t rows, SExecTaskInfo* pTask, STableMetaCacheInfo* pCache) {
  int32_t          code = TSDB_CODE_SUCCESS;
  int32_t          lino = 0;
  bool             freeReader = false;
  LRUHandle*       h = NULL;
  STableCachedVal  val = {0};
  SMetaReader      mr = {0};
  const char*      idStr = pTask->id.str;
  int32_t          insertRet = TAOS_LRU_STATUS_OK;
  STableCachedVal* pVal = NULL;

  // currently only the tbname pseudo column
  if (numOfExpr <= 0) {
    return TSDB_CODE_SUCCESS;
  }

  // todo: opt if only require the vgId and the vgVer;

  // backup the rows; kept 64-bit wide so the saved count is never truncated
  int64_t backupRows = pBlock->info.rows;
  pBlock->info.rows = rows;

  // todo refactor: extract method
  // the handling of the null data should be packed in the extracted method

  // 1. check if it is existed in meta cache
  if (pCache == NULL) {
    pHandle->api.metaReaderFn.initReader(&mr, pHandle->vnode, META_READER_LOCK, &pHandle->api.metaFn);
    code = pHandle->api.metaReaderFn.getEntryGetUidCache(&mr, pBlock->info.id.uid);
    if (code != TSDB_CODE_SUCCESS) {
      // when encounter the TSDB_CODE_PAR_TABLE_NOT_EXIST error, we proceed.
      if (code == TSDB_CODE_PAR_TABLE_NOT_EXIST) {
        qWarn("failed to get table meta, table may have been dropped, uid:0x%" PRIx64 ", code:%s, %s",
              pBlock->info.id.uid, tstrerror(code), idStr);

        // append null value before return to caller, since the caller will ignore this error code and proceed
        doSetNullValue(pBlock, pExpr, numOfExpr);
      } else {
        qError("failed to get table meta, uid:0x%" PRIx64 ", code:%s, %s", pBlock->info.id.uid, tstrerror(code), idStr);
      }
      pHandle->api.metaReaderFn.clearReader(&mr);
      pBlock->info.rows = backupRows;
      return code;
    }

    pHandle->api.metaReaderFn.readerReleaseLock(&mr);

    // val borrows the reader's buffers, so the reader is cleared only at the end
    val.pName = mr.me.name;
    val.pTags = (STag*)mr.me.ctbEntry.pTags;

    freeReader = true;
  } else {
    pCache->metaFetch += 1;

    h = taosLRUCacheLookup(pCache->pTableMetaEntryCache, &pBlock->info.id.uid, sizeof(pBlock->info.id.uid));
    if (h == NULL) {
      pHandle->api.metaReaderFn.initReader(&mr, pHandle->vnode, META_READER_LOCK, &pHandle->api.metaFn);
      freeReader = true;
      code = pHandle->api.metaReaderFn.getEntryGetUidCache(&mr, pBlock->info.id.uid);
      if (code != TSDB_CODE_SUCCESS) {
        if (code == TSDB_CODE_PAR_TABLE_NOT_EXIST) {
          qWarn("failed to get table meta, table may have been dropped, uid:0x%" PRIx64 ", code:%s, %s",
                pBlock->info.id.uid, tstrerror(code), idStr);
          // append null value before return to caller, since the caller will ignore this error code and proceed
          doSetNullValue(pBlock, pExpr, numOfExpr);
        } else {
          qError("failed to get table meta, uid:0x%" PRIx64 ", code:%s, %s", pBlock->info.id.uid, tstrerror(code),
                 idStr);
        }
        pHandle->api.metaReaderFn.clearReader(&mr);
        pBlock->info.rows = backupRows;
        return code;
      }

      pHandle->api.metaReaderFn.readerReleaseLock(&mr);

      // pVal is handed over to the cache at _end
      code = createTableCacheVal(&mr, &pVal);
      QUERY_CHECK_CODE(code, lino, _end);

      val = *pVal;
    } else {
      pCache->cacheHit += 1;
      STableCachedVal* pValTmp = taosLRUCacheValue(pCache->pTableMetaEntryCache, h);
      val = *pValTmp;

      bool bRes = taosLRUCacheRelease(pCache->pTableMetaEntryCache, h, false);
      qTrace("release LRU cache, res %d", bRes);
    }

    qDebug("retrieve table meta from cache:%" PRIu64 ", hit:%" PRIu64 " miss:%" PRIu64 ", %s", pCache->metaFetch,
           pCache->cacheHit, (pCache->metaFetch - pCache->cacheHit), idStr);
  }

  for (int32_t j = 0; j < numOfExpr; ++j) {
    const SExprInfo* pExpr1 = &pExpr[j];
    int32_t          dstSlotId = pExpr1->base.resSchema.slotId;

    SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, dstSlotId);
    colInfoDataCleanup(pColInfoData, pBlock->info.rows);

    int32_t functionId = pExpr1->pExpr->_function.functionId;

    // this is to handle the tbname
    if (fmIsScanPseudoColumnFunc(functionId)) {
      int32_t fType = pExpr1->pExpr->_function.functionType;
      if (fType == FUNCTION_TYPE_TBNAME) {
        code = setTbNameColData(pBlock, pColInfoData, functionId, val.pName);
        QUERY_CHECK_CODE(code, lino, _end);
      } else if (fType == FUNCTION_TYPE_VGID) {
        code = setVgIdColData(pBlock, pColInfoData, functionId, pTask->id.vgId);
        QUERY_CHECK_CODE(code, lino, _end);
      } else if (fType == FUNCTION_TYPE_VGVER) {
        code = setVgVerColData(pBlock, pColInfoData, functionId, pBlock->info.version);
        QUERY_CHECK_CODE(code, lino, _end);
      }
    } else {  // these are tags
      STagVal tagVal = {0};
      tagVal.cid = pExpr1->base.pParam[0].pCol->colId;
      const char* p = pHandle->api.metaFn.extractTagVal(val.pTags, pColInfoData->info.type, &tagVal);

      char* data = NULL;
      if (pColInfoData->info.type != TSDB_DATA_TYPE_JSON && p != NULL) {
        data = tTagValToData((const STagVal*)p, false);
      } else {
        data = (char*)p;
      }

      bool isNullVal = (data == NULL) || (pColInfoData->info.type == TSDB_DATA_TYPE_JSON && tTagIsJsonNull(data));
      if (isNullVal) {
        colDataSetNNULL(pColInfoData, 0, pBlock->info.rows);
      } else if (pColInfoData->info.type != TSDB_DATA_TYPE_JSON) {
        code = colDataSetNItems(pColInfoData, 0, data, pBlock->info.rows, false);
        if (IS_VAR_DATA_TYPE(((const STagVal*)p)->type)) {
          // NUL-terminated copy of the value, used for the debug log only
          char* tmp = taosMemoryCalloc(1, varDataLen(data) + 1);
          if (tmp != NULL) {
            memcpy(tmp, varDataVal(data), varDataLen(data));
            qDebug("get tag value:%s, cid:%d, table name:%s, uid%" PRIu64, tmp, tagVal.cid, val.pName,
                   pBlock->info.id.uid);
            taosMemoryFree(tmp);
          }
          // the converted buffer is released here for variable-length types
          taosMemoryFree(data);
        }
        // checked only after `data` has been released above
        QUERY_CHECK_CODE(code, lino, _end);
      } else {  // todo opt for json tag
        for (int32_t i = 0; i < pBlock->info.rows; ++i) {
          code = colDataSetVal(pColInfoData, i, data, false);
          QUERY_CHECK_CODE(code, lino, _end);
        }
      }
    }
  }

_end:
  // restore the rows on the success path and on every error path reaching this label
  pBlock->info.rows = backupRows;

  if (NULL != pVal) {
    insertRet = taosLRUCacheInsert(pCache->pTableMetaEntryCache, &pBlock->info.id.uid, sizeof(uint64_t), pVal,
                                   sizeof(STableCachedVal), freeCachedMetaItem, NULL, NULL, TAOS_LRU_PRIORITY_LOW, NULL);
    if (insertRet != TAOS_LRU_STATUS_OK) {
      qWarn("failed to put meta into lru cache, code:%d, %s", insertRet, idStr);
    }
  }

  if (freeReader) {
    pHandle->api.metaReaderFn.clearReader(&mr);
  }
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-07-19 08:15:37 +00:00
/**
 * Fill a destination column with the table name by running the tbname scalar function.
 *
 * The name is wrapped into a one-row temporary VARCHAR column which serves as the function's input;
 * the function is run with numOfRows = pBlock->info.rows and writes into pColInfoData.
 *
 * @param pBlock        block providing the row count
 * @param pColInfoData  destination column
 * @param functionId    id used to look up the scalar function implementation
 * @param name          NUL-terminated table name
 * @return TSDB_CODE_SUCCESS or an error code. A missing process callback is only logged.
 */
int32_t setTbNameColData(const SSDataBlock* pBlock, SColumnInfoData* pColInfoData, int32_t functionId,
                         const char* name) {
  int32_t                     code = TSDB_CODE_SUCCESS;
  int32_t                     lino = 0;
  struct SScalarFuncExecFuncs fpSet = {0};

  // the temporary column does not exist yet, so a failure here bypasses its cleanup
  code = fmGetScalarFuncExecFuncs(functionId, &fpSet);
  QUERY_CHECK_CODE(code, lino, _end);

  size_t len = TSDB_TABLE_FNAME_LEN + VARSTR_HEADER_SIZE;
  char   buf[TSDB_TABLE_FNAME_LEN + VARSTR_HEADER_SIZE] = {0};
  STR_TO_VARSTR(buf, name)

  SColumnInfoData infoData = createColumnInfoData(TSDB_DATA_TYPE_VARCHAR, len, 1);

  // from here on every failure goes through _cleanup so the temporary column is always released
  code = colInfoDataEnsureCapacity(&infoData, 1, false);
  QUERY_CHECK_CODE(code, lino, _cleanup);

  code = colDataSetVal(&infoData, 0, buf, false);
  QUERY_CHECK_CODE(code, lino, _cleanup);

  SScalarParam srcParam = {.numOfRows = pBlock->info.rows, .columnData = &infoData};
  SScalarParam param = {.columnData = pColInfoData};

  if (fpSet.process != NULL) {
    code = fpSet.process(&srcParam, 1, &param);
    QUERY_CHECK_CODE(code, lino, _cleanup);
  } else {
    qError("failed to get the corresponding callback function, functionId:%d", functionId);
  }

_cleanup:
  colDataDestroy(&infoData);

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-07-19 08:15:37 +00:00
/**
 * Fill the destination column with a vgroup id by running a scalar function.
 *
 * A temporary one-row column with the same type and byte width as
 * `pColInfoData` is built from `vgId` and passed as the single input parameter
 * of the scalar function returned by fmGetScalarFuncExecFuncs().
 *
 * @param pBlock        block whose info.rows is used as numOfRows of the input parameter
 * @param pColInfoData  column passed to the scalar function as its output parameter
 * @param functionId    id used to look up the scalar function
 * @param vgId          value stored in row 0 of the temporary column
 * @return TSDB_CODE_SUCCESS, or the code of the first failing step
 */
int32_t setVgIdColData(const SSDataBlock* pBlock, SColumnInfoData* pColInfoData, int32_t functionId, int32_t vgId) {
  int32_t                     code = TSDB_CODE_SUCCESS;
  int32_t                     lino = 0;
  struct SScalarFuncExecFuncs fpSet = {0};
  // Must be initialised before the first goto: _end destroys it unconditionally,
  // and a failed function lookup would otherwise skip its initialisation.
  SColumnInfoData             infoData = {0};

  code = fmGetScalarFuncExecFuncs(functionId, &fpSet);
  QUERY_CHECK_CODE(code, lino, _end);

  infoData = createColumnInfoData(pColInfoData->info.type, pColInfoData->info.bytes, 1);

  code = colInfoDataEnsureCapacity(&infoData, 1, false);
  QUERY_CHECK_CODE(code, lino, _end);

  code = colDataSetVal(&infoData, 0, (const char*)&vgId, false);
  QUERY_CHECK_CODE(code, lino, _end);

  SScalarParam srcParam = {.numOfRows = pBlock->info.rows, .columnData = &infoData};
  SScalarParam param = {.columnData = pColInfoData};

  if (fpSet.process != NULL) {
    code = fpSet.process(&srcParam, 1, &param);
    QUERY_CHECK_CODE(code, lino, _end);
  } else {
    qError("failed to get the corresponding callback function, functionId:%d", functionId);
  }

_end:
  colDataDestroy(&infoData);
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-07-19 08:15:37 +00:00
/**
 * Fill the destination column with a vgroup version by running a scalar function.
 *
 * A temporary one-row column with the same type and byte width as
 * `pColInfoData` is built from `vgVer` and passed as the single input parameter
 * of the scalar function returned by fmGetScalarFuncExecFuncs().
 *
 * @param pBlock        block whose info.rows is used as numOfRows of the input parameter
 * @param pColInfoData  column passed to the scalar function as its output parameter
 * @param functionId    id used to look up the scalar function
 * @param vgVer         value stored in row 0 of the temporary column
 * @return TSDB_CODE_SUCCESS, or the code of the first failing step
 */
int32_t setVgVerColData(const SSDataBlock* pBlock, SColumnInfoData* pColInfoData, int32_t functionId, int64_t vgVer) {
  int32_t                     code = TSDB_CODE_SUCCESS;
  int32_t                     lino = 0;
  struct SScalarFuncExecFuncs fpSet = {0};
  // Must be initialised before the first goto: _end destroys it unconditionally,
  // and a failed function lookup would otherwise skip its initialisation.
  SColumnInfoData             infoData = {0};

  code = fmGetScalarFuncExecFuncs(functionId, &fpSet);
  QUERY_CHECK_CODE(code, lino, _end);

  infoData = createColumnInfoData(pColInfoData->info.type, pColInfoData->info.bytes, 1);

  code = colInfoDataEnsureCapacity(&infoData, 1, false);
  QUERY_CHECK_CODE(code, lino, _end);

  code = colDataSetVal(&infoData, 0, (const char*)&vgVer, false);
  QUERY_CHECK_CODE(code, lino, _end);

  SScalarParam srcParam = {.numOfRows = pBlock->info.rows, .columnData = &infoData};
  SScalarParam param = {.columnData = pColInfoData};

  if (fpSet.process != NULL) {
    code = fpSet.process(&srcParam, 1, &param);
    QUERY_CHECK_CODE(code, lino, _end);
  } else {
    qError("failed to get the corresponding callback function, functionId:%d", functionId);
  }

_end:
  colDataDestroy(&infoData);
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2023-12-28 17:40:17 +00:00
2024-07-19 08:15:37 +00:00
/**
 * Prepare the scan state for the group identified by pInfo->currentGroupId.
 *
 * Fetches the group's table list into (*pKeyInfo, *size), records the first and
 * last table index of the group, resets the blank-fill flag and block
 * aggregates of the result block, and resets the empty-table count state.
 *
 * @return TSDB_CODE_SUCCESS, or the code returned by tableListGetGroupList()
 */
static int32_t initNextGroupScan(STableScanInfo* pInfo, STableKeyInfo** pKeyInfo, int32_t* size) {
  int32_t lino = 0;
  int32_t code = tableListGetGroupList(pInfo->base.pTableListInfo, pInfo->currentGroupId, pKeyInfo, size);
  if (code != TSDB_CODE_SUCCESS) {
    lino = __LINE__;
    goto _end;
  }

  // index range [tableStartIndex, tableEndIndex] of this group inside the table list
  pInfo->tableStartIndex = TARRAY_ELEM_IDX(pInfo->base.pTableListInfo->pTableList, *pKeyInfo);
  pInfo->tableEndIndex = (pInfo->tableStartIndex + (*size) - 1);

  pInfo->pResBlock->info.blankFill = false;
  taosMemoryFreeClear(pInfo->pResBlock->pBlockAgg);

  pInfo->countState = pInfo->needCountEmptyTable ? TABLE_COUNT_STATE_SCAN : TABLE_COUNT_STATE_END;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-01-02 07:45:03 +00:00
/**
 * Record that the given group has produced output.
 *
 * Does nothing when the count state is already TABLE_COUNT_STATE_END. When the
 * table list has a group offset, the count state becomes
 * TABLE_COUNT_STATE_PROCESSED; otherwise the group id is removed from the
 * remainGroups hash, and a failed removal is only logged at debug level.
 */
void markGroupProcessed(STableScanInfo* pInfo, uint64_t groupId) {
  if (pInfo->countState == TABLE_COUNT_STATE_END) {
    return;
  }

  if (pInfo->base.pTableListInfo->groupOffset) {
    pInfo->countState = TABLE_COUNT_STATE_PROCESSED;
    return;
  }

  int32_t rc = taosHashRemove(pInfo->base.pTableListInfo->remainGroups, &groupId, sizeof(groupId));
  if (rc != TSDB_CODE_SUCCESS) {
    qDebug("%s failed at line %d since %s", __func__, __LINE__, tstrerror(rc));
  }
}
2023-12-28 08:18:38 +00:00
/**
 * Turn pBlock into a single-row, blank-filled block for the given table.
 *
 * The block is emptied, its row count set to 1, its uid/groupId taken from
 * tbInfo, and row 0 of every column set to NULL before the tag/tbname columns
 * are filled by doSetTagColumnData(). The result of that call is stored in
 * terrno; the block is returned in any case.
 */
static SSDataBlock* getOneRowResultBlock(SExecTaskInfo* pTaskInfo, STableScanBase* pBase, SSDataBlock* pBlock,
                                         const STableKeyInfo* tbInfo) {
  blockDataEmpty(pBlock);

  pBlock->info.rows = 1;
  pBlock->info.id.uid = tbInfo->uid;
  pBlock->info.id.groupId = tbInfo->groupId;
  pBlock->info.blankFill = true;

  // the single row carries NULL in every column
  int32_t numOfCols = blockDataGetNumOfCols(pBlock);
  int32_t colIdx = 0;
  while (colIdx < numOfCols) {
    SColumnInfoData* pCol = taosArrayGet(pBlock->pDataBlock, colIdx);
    colDataSetNULL(pCol, 0);
    ++colIdx;
  }

  // fill tag/tbname columns
  terrno = doSetTagColumnData(pBase, pBlock, pTaskInfo, 1);
  return pBlock;
}
/**
 * Build the one-row placeholder block for a table without data, using the
 * operator's result block, and count it in the operator's total rows.
 */
static SSDataBlock* getBlockForEmptyTable(SOperatorInfo* pOperator, const STableKeyInfo* tbInfo) {
  STableScanInfo* pScan = pOperator->info;
  SSDataBlock*    pRes = getOneRowResultBlock(pOperator->pTaskInfo, &pScan->base, pScan->pResBlock, tbInfo);

  pOperator->resultInfo.totalRows += 1;
  return pRes;
}
2024-07-24 08:17:28 +00:00
/**
 * Pull data blocks from the tsdb reader until one survives sampling and
 * filtering, and hand it back through ppRes.
 *
 * *ppRes stays NULL when the reader is exhausted, the operator is already
 * done, or loadDataBlock() reports FUNC_DATA_REQUIRED_ALL_FILTEROUT.
 * On failure (including a killed task whose code is non-zero) the code is
 * stored in pTaskInfo->code and control leaves through T_LONG_JMP.
 */
static int32_t doTableScanImplNext(SOperatorInfo* pOperator, SSDataBlock** ppRes) {
  int32_t         code = TSDB_CODE_SUCCESS;
  int32_t         lino = 0;
  STableScanInfo* pScan = pOperator->info;
  STableScanBase* pBase = &pScan->base;
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*    pAPI = &pTaskInfo->storageAPI;
  SSDataBlock*    pBlock = pScan->pResBlock;
  bool            more = false;
  int64_t         startUs = taosGetTimestampUs();

  QRY_PARAM_CHECK(ppRes);
  pBlock->info.dataLoad = false;

  for (;;) {
    code = pAPI->tsdReader.tsdNextDataBlock(pBase->dataReader, &more);
    if (code != TSDB_CODE_SUCCESS) {
      pAPI->tsdReader.tsdReaderReleaseDataBlock(pBase->dataReader);
      lino = __LINE__;
      goto _end;
    }

    if (!more) {
      break;
    }

    if (isTaskKilled(pTaskInfo)) {
      pAPI->tsdReader.tsdReaderReleaseDataBlock(pBase->dataReader);
      code = pTaskInfo->code;
      goto _end;
    }

    if (pOperator->status == OP_EXEC_DONE) {
      pAPI->tsdReader.tsdReaderReleaseDataBlock(pBase->dataReader);
      break;
    }

    // process this data block based on the probabilities
    if (!processBlockWithProbability(&pScan->sample)) {
      continue;
    }

    if (pBlock->info.id.uid) {
      pBlock->info.id.groupId = tableListGetTableGroupId(pBase->pTableListInfo, pBlock->info.id.uid);
    }

    uint32_t loadStatus = 0;
    code = loadDataBlock(pOperator, pBase, pBlock, &loadStatus);
    QUERY_CHECK_CODE(code, lino, _end);

    if (loadStatus == FUNC_DATA_REQUIRED_ALL_FILTEROUT) {
      break;
    }

    // current block is filtered out by the filter condition, continue with the next block
    if (loadStatus == FUNC_DATA_REQUIRED_FILTEROUT || pBlock->info.rows == 0) {
      continue;
    }

    pOperator->resultInfo.totalRows = pBase->readRecorder.totalRows;
    pBase->readRecorder.elapsedTime += (taosGetTimestampUs() - startUs) / 1000.0;
    pOperator->cost.totalCost = pBase->readRecorder.elapsedTime;
    pBlock->info.scanFlag = pBase->scanFlag;

    (*ppRes) = pBlock;
    return code;
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  }
  return code;
}
2024-08-27 09:04:44 +00:00
/**
 * Produce the next block for the current table group.
 *
 * Runs the ascending passes first (scanInfo.numOfAsc times), then the
 * descending passes (scanInfo.numOfDesc times), resetting the reader between
 * passes. When all passes are finished and empty tables must be counted
 * (countState below TABLE_COUNT_STATE_END), a one-row placeholder block may be
 * returned for the group instead.
 *
 * *pBlock is left NULL when there is nothing more to return. On failure the
 * code is also stored in pTaskInfo->code.
 */
static int32_t doGroupedTableScan(SOperatorInfo* pOperator, SSDataBlock** pBlock) {
  int32_t         code = TSDB_CODE_SUCCESS;
  int32_t         lino = 0;
  STableScanInfo* pScan = pOperator->info;
  STableScanBase* pBase = &pScan->base;
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*    pAPI = &pTaskInfo->storageAPI;

  QRY_PARAM_CHECK(pBlock);

  // The read handle is not initialized yet, since no qualified tables exists
  if (pBase->dataReader == NULL || pOperator->status == OP_EXEC_DONE) {
    return code;
  }

  // do the ascending order traverse in the first place.
  while (pScan->scanTimes < pScan->scanInfo.numOfAsc) {
    SSDataBlock* pNext = NULL;
    code = doTableScanImplNext(pOperator, &pNext);
    QUERY_CHECK_CODE(code, lino, _end);

    if (pNext != NULL) {
      markGroupProcessed(pScan, pNext->info.id.groupId);
      *pBlock = pNext;
      return code;
    }

    pScan->scanTimes += 1;
    taosHashClear(pScan->pIgnoreTables);

    if (pScan->scanTimes < pScan->scanInfo.numOfAsc) {
      setTaskStatus(pTaskInfo, TASK_NOT_COMPLETED);
      pBase->scanFlag = MAIN_SCAN;
      pBase->dataBlockLoadFlag = FUNC_DATA_REQUIRED_DATA_LOAD;
      qDebug("start to repeat ascending order scan data blocks due to query func required, %s", GET_TASKID(pTaskInfo));

      // do prepare for the next round table scan operation
      code = pAPI->tsdReader.tsdReaderResetStatus(pBase->dataReader, &pBase->cond);
      QUERY_CHECK_CODE(code, lino, _end);
    }
  }

  int32_t totalPasses = pScan->scanInfo.numOfAsc + pScan->scanInfo.numOfDesc;
  if (pScan->scanTimes < totalPasses) {
    if (pBase->cond.order == TSDB_ORDER_ASC) {
      prepareForDescendingScan(pBase, pOperator->exprSupp.pCtx, 0);
      code = pAPI->tsdReader.tsdReaderResetStatus(pBase->dataReader, &pBase->cond);
      QUERY_CHECK_CODE(code, lino, _end);
      qDebug("%s start to descending order scan data blocks due to query func required", GET_TASKID(pTaskInfo));
    }

    while (pScan->scanTimes < totalPasses) {
      SSDataBlock* pNext = NULL;
      code = doTableScanImplNext(pOperator, &pNext);
      QUERY_CHECK_CODE(code, lino, _end);

      if (pNext != NULL) {
        markGroupProcessed(pScan, pNext->info.id.groupId);
        *pBlock = pNext;
        return code;
      }

      pScan->scanTimes += 1;
      taosHashClear(pScan->pIgnoreTables);

      if (pScan->scanTimes < totalPasses) {
        setTaskStatus(pTaskInfo, TASK_NOT_COMPLETED);
        pBase->scanFlag = MAIN_SCAN;

        qDebug("%s start to repeat descending order scan data blocks", GET_TASKID(pTaskInfo));
        code = pAPI->tsdReader.tsdReaderResetStatus(pBase->dataReader, &pBase->cond);
        QUERY_CHECK_CODE(code, lino, _end);
      }
    }
  }

  if (pScan->countState < TABLE_COUNT_STATE_END) {
    STableListInfo* pTableListInfo = pBase->pTableListInfo;

    if (pTableListInfo->groupOffset) {  // group by tbname, group by tag + sort
      if (pScan->countState < TABLE_COUNT_STATE_PROCESSED) {
        pScan->countState = TABLE_COUNT_STATE_PROCESSED;

        STableKeyInfo* pFirst = (STableKeyInfo*)tableListGetInfo(pBase->pTableListInfo, pScan->tableStartIndex);
        if (pFirst != NULL) {
          *pBlock = getBlockForEmptyTable(pOperator, pFirst);
        }
        return code;
      }
    } else {  // group by tag + no sort
      int32_t numOfTables = 0;
      code = tableListGetSize(pTableListInfo, &numOfTables);
      QUERY_CHECK_CODE(code, lino, _end);

      if (pScan->tableEndIndex + 1 >= numOfTables) {
        // get empty group, mark processed & rm from hash
        void* pIter = taosHashIterate(pTableListInfo->remainGroups, NULL);
        if (pIter != NULL) {
          size_t        keyLen = 0;
          uint64_t*     pGroupId = taosHashGetKey(pIter, &keyLen);
          STableKeyInfo emptyInfo = {.uid = *(uint64_t*)pIter, .groupId = *pGroupId};

          taosHashCancelIterate(pTableListInfo->remainGroups, pIter);
          markGroupProcessed(pScan, *pGroupId);
          *pBlock = getBlockForEmptyTable(pOperator, &emptyInfo);
          return code;
        }
      }
    }

    pScan->countState = TABLE_COUNT_STATE_END;
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
  }
  return code;
}
2023-09-01 05:24:47 +00:00
/**
 * Add the table uids carried by the operator's get-param to the scan table list.
 *
 * With tableSeq set, every table forms its own group and a non-empty existing
 * list is cleared (the operator is then marked OP_EXEC_DONE). Otherwise all
 * tables go into a single output group. Uids already present in the map are
 * skipped.
 *
 * @return 0 on success, TSDB_CODE_INVALID_PARA for an empty uid list, or terrno
 *         when an array/hash operation fails
 */
static int32_t createTableListInfoFromParam(SOperatorInfo* pOperator) {
  STableScanInfo*          pScan = pOperator->info;
  SExecTaskInfo*           pTaskInfo = pOperator->pTaskInfo;
  int32_t                  code = 0;
  STableListInfo*          pTables = pScan->base.pTableListInfo;
  STableScanOperatorParam* pParam = (STableScanOperatorParam*)pOperator->pOperatorGetParam->value;

  int32_t numOfUids = taosArrayGetSize(pParam->pUidList);
  if (numOfUids <= 0) {
    qError("empty table scan uid list");
    return TSDB_CODE_INVALID_PARA;
  }

  qDebug("vgId:%d add total %d dynamic tables to scan, tableSeq:%d, exist num:%" PRId64 ", operator status:%d",
         pTaskInfo->id.vgId, numOfUids, pParam->tableSeq, (int64_t)taosArrayGetSize(pTables->pTableList),
         pOperator->status);

  if (!pParam->tableSeq) {
    pTables->oneTableForEachGroup = false;
    pTables->numOfOuputGroups = 1;
  } else {
    pTables->oneTableForEachGroup = true;
    if (taosArrayGetSize(pTables->pTableList) > 0) {
      taosHashClear(pTables->map);
      taosArrayClear(pTables->pTableList);
      pOperator->status = OP_EXEC_DONE;
    }
  }

  STableKeyInfo keyInfo = {.groupId = 0};
  int32_t       nextIdx = 0;

  for (int32_t k = 0; k < numOfUids; ++k) {
    uint64_t* pUid = taosArrayGet(pParam->pUidList, k);
    if (pUid == NULL) {
      qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(terrno));
      return terrno;
    }

    if (taosHashPut(pTables->map, pUid, sizeof(uint64_t), &nextIdx, sizeof(int32_t)) != 0) {
      if (terrno != TSDB_CODE_DUP_KEY) {
        return terrno;
      }
      continue;  // uid already registered
    }

    keyInfo.uid = *pUid;
    if (taosArrayPush(pTables->pTableList, &keyInfo) == NULL) {
      return terrno;
    }

    nextIdx++;
    qDebug("add dynamic table scan uid:%" PRIu64 ", %s", keyInfo.uid, GET_TASKID(pTaskInfo));
  }

  return code;
}
/**
 * Initialise the scan state for the current group and open a tsdb reader on
 * that group's tables.
 *
 * @param pNum   receives the number of tables in the group
 * @param pList  receives the first table key of the group
 * @return 0 on success; TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR when a reader is
 *         already attached; otherwise the code of the failing step
 */
static int32_t doInitReader(STableScanInfo* pInfo, SExecTaskInfo* pTaskInfo, SStorageAPI* pAPI, int32_t* pNum,
                            STableKeyInfo** pList) {
  const char* taskId = GET_TASKID(pTaskInfo);

  int32_t rc = initNextGroupScan(pInfo, pList, pNum);
  if (rc != 0) {
    qError("%s failed to init groupScan Info, code:%s at line:%d", taskId, tstrerror(rc), __LINE__);
    return rc;
  }

  if (pInfo->base.dataReader != NULL) {
    qError("%s tsdb reader should be null", taskId);
    return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
  }

  rc = pAPI->tsdReader.tsdReaderOpen(pInfo->base.readHandle.vnode, &pInfo->base.cond, *pList, *pNum, pInfo->pResBlock,
                                     (void**)&pInfo->base.dataReader, taskId, &pInfo->pIgnoreTables);
  if (rc != 0) {
    qError("%s failed to open tsdbReader, code:%s at line:%d", taskId, tstrerror(rc), __LINE__);
  }

  return rc;
}
int compareColIdPair(const void* elem1, const void* elem2) {
SColIdPair* node1 = (SColIdPair*)elem1;
SColIdPair* node2 = (SColIdPair*)elem2;
if (node1->orgColId < node2->orgColId) {
return -1;
}
return node1->orgColId > node2->orgColId;
}
/**
 * Re-target the table scan operator at the origin table named in the
 * operator's get-param (virtual table scan).
 *
 * Steps, in order:
 *  - drop the current query condition and close the current tsdb reader;
 *  - look up the origin table by name (the part after the first '.') and pick
 *    its schema: the super table's schema for a child table, its own schema
 *    for a normal table;
 *  - build the (virtual column id -> origin column id) pairs from the param's
 *    column map, plus the primary timestamp column;
 *  - rebuild pResBlock and the query condition from those pairs;
 *  - replace the table list with the single origin table and open a new reader.
 *
 * @return 0 on success; TSDB_CODE_INVALID_PARA when the table name has no '.'
 *         separator or the table type is unsupported; otherwise the code of
 *         the failing step
 */
static int32_t createVTableScanInfoFromParam(SOperatorInfo* pOperator) {
  int32_t                  code = 0;
  int32_t                  lino = 0;
  STableScanInfo*          pInfo = pOperator->info;
  SExecTaskInfo*           pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*             pAPI = &pTaskInfo->storageAPI;
  STableListInfo*          pListInfo = pInfo->base.pTableListInfo;
  STableScanOperatorParam* pParam = (STableScanOperatorParam*)pOperator->pOperatorGetParam->value;
  SMetaReader              orgTable = {0};
  SMetaReader              superTable = {0};
  SSchemaWrapper*          schema = NULL;
  SArray*                  pColArray = NULL;
  SArray*                  pBlockColArray = NULL;
  int32_t                  num = 0;
  STableKeyInfo*           pList = NULL;

  cleanupQueryTableDataCond(&pInfo->base.cond);
  if (pAPI->tsdReader.tsdReaderClose) {
    pAPI->tsdReader.tsdReaderClose(pInfo->base.dataReader);
    // the reader is gone; do not leave a dangling pointer behind if a later step fails
    pInfo->base.dataReader = NULL;
  }

  pAPI->metaReaderFn.initReader(&orgTable, pInfo->base.readHandle.vnode, META_READER_LOCK, &pAPI->metaFn);

  // the name lookup uses the part after the first '.'; reject names without one
  // instead of doing pointer arithmetic on NULL
  const char* pDot = strstr(pParam->pOrgTbInfo->tbName, ".");
  if (pDot == NULL) {
    qError("invalid origin table name:%s", pParam->pOrgTbInfo->tbName);
    code = TSDB_CODE_INVALID_PARA;
    lino = __LINE__;
    goto _return;
  }

  code = pAPI->metaReaderFn.getTableEntryByName(&orgTable, pDot + 1);
  QUERY_CHECK_CODE(code, lino, _return);

  switch (orgTable.me.type) {
    case TSDB_CHILD_TABLE:
      pAPI->metaReaderFn.initReader(&superTable, pInfo->base.readHandle.vnode, META_READER_LOCK, &pAPI->metaFn);
      code = pAPI->metaReaderFn.getTableEntryByUid(&superTable, orgTable.me.ctbEntry.suid);
      QUERY_CHECK_CODE(code, lino, _return);
      schema = &superTable.me.stbEntry.schemaRow;
      break;
    case TSDB_NORMAL_TABLE:
      schema = &orgTable.me.ntbEntry.schemaRow;
      break;
    default:
      qError("invalid table type:%d", orgTable.me.type);
      // leave through _return so that orgTable, initialised with META_READER_LOCK, is cleared
      code = TSDB_CODE_INVALID_PARA;
      lino = __LINE__;
      goto _return;
  }

  pColArray = taosArrayInit(schema->nCols, sizeof(SColIdPair));
  QUERY_CHECK_NULL(pColArray, code, lino, _return, terrno);
  pBlockColArray = taosArrayInit(schema->nCols, sizeof(int32_t));
  QUERY_CHECK_NULL(pBlockColArray, code, lino, _return, terrno);

  // virtual table's origin table scan do not has ts column.
  SColIdPair tsPair = {.vtbColId = PRIMARYKEY_TIMESTAMP_COL_ID, .orgColId = PRIMARYKEY_TIMESTAMP_COL_ID};
  QUERY_CHECK_NULL(taosArrayPush(pColArray, &tsPair), code, lino, _return, terrno);

  // match each mapped column name against the origin schema; the origin column id
  // is taken as the 1-based position of the column in that schema
  for (int32_t i = 0; i < taosArrayGetSize(pParam->pOrgTbInfo->colMap); ++i) {
    SColIdNameKV* kv = taosArrayGet(pParam->pOrgTbInfo->colMap, i);
    for (int32_t j = 0; j < schema->nCols; j++) {
      if (strcmp(kv->colName, schema->pSchema[j].name) == 0) {
        SColIdPair pPair = {.vtbColId = kv->colId, .orgColId = (col_id_t)(j + 1)};
        QUERY_CHECK_NULL(taosArrayPush(pColArray, &pPair), code, lino, _return, terrno);
        break;
      }
    }
  }

  // translate virtual column ids into destination slot ids of the output block
  for (int32_t i = 0; i < taosArrayGetSize(pColArray); i++) {
    SColIdPair* pPair = (SColIdPair*)taosArrayGet(pColArray, i);
    for (int32_t j = 0; j < taosArrayGetSize(pInfo->base.matchInfo.pList); j++) {
      SColMatchItem* pItem = taosArrayGet(pInfo->base.matchInfo.pList, j);
      if (pItem->colId == pPair->vtbColId) {
        SColIdPair tmpPair = {.orgColId = pPair->orgColId, .vtbColId = pItem->dstSlotId};
        QUERY_CHECK_NULL(taosArrayPush(pBlockColArray, &tmpPair), code, lino, _return, terrno);
        break;
      }
    }
  }

  if (pInfo->pResBlock) {
    blockDataDestroy(pInfo->pResBlock);
    pInfo->pResBlock = NULL;
  }

  taosArraySort(pColArray, compareColIdPair);
  taosArraySort(pBlockColArray, compareColIdPair);

  code = createOneDataBlockWithColArray(pInfo->pOrgBlock, pBlockColArray, &pInfo->pResBlock);
  QUERY_CHECK_CODE(code, lino, _return);
  code = initQueryTableDataCondWithColArray(&pInfo->base.cond, &pInfo->base.orgCond, &pInfo->base.readHandle, pColArray);
  QUERY_CHECK_CODE(code, lino, _return);

  pInfo->base.cond.twindows.skey = pParam->window.ekey + 1;
  pInfo->base.cond.suid = orgTable.me.type == TSDB_CHILD_TABLE ? superTable.me.uid : 0;
  pInfo->currentGroupId = 0;
  pInfo->base.dataReader = NULL;
  pInfo->ignoreTag = true;

  // the table list now holds exactly the origin table
  pListInfo->oneTableForEachGroup = true;
  taosHashClear(pListInfo->map);
  taosArrayClear(pListInfo->pTableList);

  uint64_t      pUid = orgTable.me.uid;
  STableKeyInfo info = {.groupId = 0, .uid = pUid};
  int32_t       tableIdx = 0;
  code = taosHashPut(pListInfo->map, &pUid, sizeof(uint64_t), &tableIdx, sizeof(int32_t));
  QUERY_CHECK_CODE(code, lino, _return);
  QUERY_CHECK_NULL(taosArrayPush(pListInfo->pTableList, &info), code, lino, _return, terrno);
  qDebug("add dynamic table scan uid:%" PRIu64 ", %s", info.uid, GET_TASKID(pTaskInfo));

  pOperator->status = OP_OPENED;

  taosRLockLatch(&pTaskInfo->lock);
  code = doInitReader(pInfo, pTaskInfo, pAPI, &num, &pList);
  taosRUnLockLatch(&pTaskInfo->lock);
  QUERY_CHECK_CODE(code, lino, _return);

  if (pInfo->pResBlock->info.capacity > pOperator->resultInfo.capacity) {
    pOperator->resultInfo.capacity = pInfo->pResBlock->info.capacity;
  }

  pInfo->currentGroupId = -1;

_return:
  if (code) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  taosArrayDestroy(pColArray);
  taosArrayDestroy(pBlockColArray);
  pAPI->metaReaderFn.clearReader(&superTable);
  pAPI->metaReaderFn.clearReader(&orgTable);
  return code;
}
2024-08-27 09:04:44 +00:00
/**
 * Advance to the next table group and return its first block, if any.
 *
 * When no group is left the operator is marked completed (and, for a dynamic
 * task, the table list and map are cleared) and *pResult stays NULL.
 * Otherwise the reader is pointed at the new group's tables, its status is
 * reset, and doGroupedTableScan() is run once. For a dynamic task the returned
 * block's groupId is overwritten with its uid.
 *
 * On failure the code is also stored in pTaskInfo->code.
 */
static int32_t startNextGroupScan(SOperatorInfo* pOperator, SSDataBlock** pResult) {
  int32_t         code = TSDB_CODE_SUCCESS;
  int32_t         lino = 0;
  STableScanInfo* pScan = pOperator->info;
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*    pAPI = &pTaskInfo->storageAPI;
  int32_t         numOfTables = 0;

  QRY_PARAM_CHECK(pResult);

  code = tableListGetSize(pScan->base.pTableListInfo, &numOfTables);
  QUERY_CHECK_CODE(code, lino, _end);

  pScan->currentGroupId += 1;
  if (pScan->currentGroupId >= tableListGetOutputGroups(pScan->base.pTableListInfo)) {
    setOperatorCompleted(pOperator);
    if (pOperator->dynamicTask) {
      taosArrayClear(pScan->base.pTableListInfo->pTableList);
      taosHashClear(pScan->base.pTableListInfo->map);
    }
    return code;
  }

  // reset value for the next group data output
  pOperator->status = OP_OPENED;
  resetLimitInfoForNextGroup(&pScan->base.limitInfo);

  int32_t        groupSize = 0;
  STableKeyInfo* pGroupTables = NULL;
  code = initNextGroupScan(pScan, &pGroupTables, &groupSize);
  QUERY_CHECK_CODE(code, lino, _end);

  code = pAPI->tsdReader.tsdSetQueryTableList(pScan->base.dataReader, pGroupTables, groupSize);
  QUERY_CHECK_CODE(code, lino, _end);

  code = pAPI->tsdReader.tsdReaderResetStatus(pScan->base.dataReader, &pScan->base.cond);
  QUERY_CHECK_CODE(code, lino, _end);

  pScan->scanTimes = 0;

  code = doGroupedTableScan(pOperator, pResult);
  QUERY_CHECK_CODE(code, lino, _end);

  if (*pResult != NULL) {
    if (pOperator->dynamicTask) {
      (*pResult)->info.id.groupId = (*pResult)->info.id.uid;
    }
    return code;
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
  }
  return code;
}
/**
 * Scan table groups one after another and return the next available block.
 *
 * On the first call (currentGroupId == -1) the reader is opened for group 0
 * under the task's read latch. After that the current group is scanned; once
 * it yields nothing, following groups are started until a block is produced
 * or the operator reaches OP_EXEC_DONE. For a dynamic task a block returned
 * from the current group gets its groupId overwritten with its uid.
 *
 * On failure the code is also stored in pTaskInfo->code.
 */
static int32_t groupSeqTableScan(SOperatorInfo* pOperator, SSDataBlock** pResBlock) {
  int32_t         code = TSDB_CODE_SUCCESS;
  int32_t         lino = 0;
  STableScanInfo* pScan = pOperator->info;
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*    pAPI = &pTaskInfo->storageAPI;
  int32_t         groupSize = 0;
  STableKeyInfo*  pGroupTables = NULL;
  SSDataBlock*    pOut = NULL;
  const char*     idStr = GET_TASKID(pTaskInfo);

  QRY_PARAM_CHECK(pResBlock);

  if (pScan->currentGroupId == -1) {
    pScan->currentGroupId += 1;
    if (pScan->currentGroupId >= tableListGetOutputGroups(pScan->base.pTableListInfo)) {
      setOperatorCompleted(pOperator);
      return code;
    }

    taosRLockLatch(&pTaskInfo->lock);
    code = doInitReader(pScan, pTaskInfo, pAPI, &groupSize, &pGroupTables);
    taosRUnLockLatch(&pTaskInfo->lock);
    QUERY_CHECK_CODE(code, lino, _end);

    if (pScan->filesetDelimited) {
      pAPI->tsdReader.tsdSetFilesetDelimited(pScan->base.dataReader);
    }

    if (pScan->pResBlock->info.capacity > pOperator->resultInfo.capacity) {
      pOperator->resultInfo.capacity = pScan->pResBlock->info.capacity;
    }
  }

  code = doGroupedTableScan(pOperator, &pOut);
  QUERY_CHECK_CODE(code, lino, _end);

  if (pOut != NULL) {
    if (pOperator->dynamicTask) {
      pOut->info.id.groupId = pOut->info.id.uid;
    }
    *pResBlock = pOut;
    return code;
  }

  // current group is exhausted: keep starting groups until one yields data or all are done
  do {
    code = startNextGroupScan(pOperator, &pOut);
    QUERY_CHECK_CODE(code, lino, _end);
  } while (pOut == NULL && pOperator->status != OP_EXEC_DONE);

  *pResBlock = pOut;
  return code;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s %s failed at line %d since %s", idStr, __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
  }
  return code;
}
feat(stream): add new trigger continuous_window_close (#30125) * opt stream build twa result * opt force window close memory * feat(stream):optimize new interval and scan operator * adj log * opt code * opt code * fill history * fix issue for fill history * add ci * feat(stream): add new stream nonblock interval operator * adjust code * use new scan operator * use new scan operator * add log * fix issue * recover stream scan next function * fix issue * fix issue * fix issue * ignore disorder data * fix issue * fix issue for interval sliding * fix issue * fix ci issue * fix ci issue * fix ci issue * add semi && final nonblock interval operator * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * refactor(stream): track the msgId for each upstream tasks. * fix(stream): fix race condition. * fix(stream): update the task last msgId when putting into input queue succ. * fix issue * fix issue * put recalculate data to rocksdb * fix issue * fix issue * enh(query)[TD-33071]: add support for saving and restoring tsdbReader scan progress - Implement functionality to save scan progress during tsdbReader operations - Enable resuming scans from the last saved position * fix issue * fix issue * fix issue * fix issue * fix issue * add rec interval check * enh(stream):add recalculate tasks. * enh(stream): support the re-calculate the tasks. * fix issue && do refactor * do refactor * fix issue * fix issue * update backend opt * add new interface * add new session operator * support blob * add new session operator * fix issue * add rec state for rec task * fix invalid read * add new session window * enh(stream): update the stream tasks backend. * new session operator * add pull data * fix(stream): fix error in expand stream backend. * fix issue * fix issue * fix issue * merge code * fix issue * fix(stream): check for null ptr. * fix(stream): add more check. 
* fix issue * fix issue * fix issue * add debug code * fix issue * fix issue * fix issue * set rec end flag * fix(stream): opt re-calculate stream tasks. * fix issue * fix issue * add new operator * enh(stream): dispatch recalculate block to agg tasks. * fix issue * fix issue * fix(stream): adjust filter. * fix issue * refactor * refactor(stream): adjust the recalculate end block. * fix issue * fix(stream): set correct create trigger block. * fix issue * fix(stream): fix error in build recalculate end block. * fix(stream): check null ptr. * add stream client && fix issue * fix mem leak * fix(stream): free msg. * add stream client * fix(stream): fix error. * add stream client && fix issue * add stream client * refactor(stream): set the recalculate task complete. * add wend and group_id for session window dest table * feat(stream): refactor and set the recalcul agg task complete. * add cfg for adapter * fix issue * add state && event operator * feat(stream): support fill-history task. * add new fill operator * fix(stream): set correct backend when updating fill-history task to recalculate task. * add new fill operator * fix(stream): s2025-03-06 11:10:31.272 et ops always open in scan tsdb * fix(stream):set the correct taskType for sink task. * new fill operator * adj stream fill operator * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * adj test * fix issue * fix(stream): fix issue * fix(steam): fix issue * fix(steam): fix issue * fix(steam): fix issue * fix(steam): fix issue * fix(stream): fix issue * fix(stream): fix issue * fix(stream): fix issue * fix: ut com error * fix(stream): fix mem leak and adjust operator type check rule * fix(stream): fix mem leak and adjust test case * refactor code * fix(stream): free items. * fix(stream): free fix memory leak. * fix(stream): fix syntax error. 
* fix: ignore unexpect block * fix: adjust op type --------- Co-authored-by: Haojun Liao <hjliao@taosdata.com> Co-authored-by: Jinqing Kuang <kuangjinqingcn@gmail.com> Co-authored-by: yihaoDeng <luomoxyz@126.com>
2025-03-14 12:14:01 +00:00
/*
 * Produce the next result block of a table scan operator.
 *
 * Three paths are handled:
 *   1. A pending operator parameter (dynamic task): the scan info / table list
 *      is rebuilt from the parameter, the parameter is released, and groups
 *      are scanned until a block is produced or the operator is exhausted.
 *   2. TABLE_SCAN__TABLE_ORDER mode: tables are scanned one at a time; when a
 *      table yields nothing the reader is re-targeted at the next table.
 *   3. Any other mode: delegated to groupSeqTableScan().
 *
 * @param pOperator  the table scan operator
 * @param ppRes      receives the produced block, or NULL when there is none
 * @return TSDB_CODE_SUCCESS on the normal paths. Failures that reach the
 *         `_end` label are stored in pTaskInfo->code and raised through
 *         T_LONG_JMP.
 */
int32_t doTableScanNext(SOperatorInfo* pOperator, SSDataBlock** ppRes) {
  int32_t         code = TSDB_CODE_SUCCESS;
  int32_t         lino = 0;
  STableScanInfo* pInfo = pOperator->info;
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*    pAPI = &pTaskInfo->storageAPI;

  QRY_PARAM_CHECK(ppRes);
  qTrace("%s call", __FUNCTION__);

  if (pOperator->pOperatorGetParam != NULL) {
    pOperator->dynamicTask = true;

    bool vtbScan = isDynVtbScan(pOperator);
    if (vtbScan) {
      code = createVTableScanInfoFromParam(pOperator);
    } else {
      code = createTableListInfoFromParam(pOperator);
    }

    // The parameter is released before the status code is inspected, so it is
    // freed on the failure path as well.
    freeOperatorParam(pOperator->pOperatorGetParam, OP_GET_PARAM);
    pOperator->pOperatorGetParam = NULL;
    QUERY_CHECK_CODE(code, lino, _end);

    if (vtbScan) {
      SSDataBlock* pScanned = NULL;
      do {
        code = startNextGroupScan(pOperator, &pScanned);
        QUERY_CHECK_CODE(code, lino, _end);
      } while (pScanned == NULL && pOperator->status != OP_EXEC_DONE);

      SSDataBlock* pMerged = NULL;
      if (pScanned != NULL) {
        // Combine the scanned block with pOrgBlock; the combined block
        // becomes the operator's result block and the scanned one is dropped.
        code = createOneDataBlockWithTwoBlock(pScanned, pInfo->pOrgBlock, &pMerged);
        QUERY_CHECK_CODE(code, lino, _end);
        pInfo->pResBlock = pMerged;
        blockDataDestroy(pScanned);
      }

      (*ppRes) = pMerged;
      return code;
    }

    if (pOperator->status == OP_EXEC_DONE) {
      // The operator had finished: rewind it and scan the new table list.
      pInfo->currentGroupId = -1;
      pOperator->status = OP_OPENED;

      SSDataBlock* pScanned = NULL;
      do {
        code = startNextGroupScan(pOperator, &pScanned);
        QUERY_CHECK_CODE(code, lino, _end);
      } while (pScanned == NULL && pOperator->status != OP_EXEC_DONE);

      (*ppRes) = pScanned;
      return code;
    }
  }

  if (pInfo->scanMode != TABLE_SCAN__TABLE_ORDER) {
    // scan table group by group sequentially
    code = groupSeqTableScan(pOperator, ppRes);
    QUERY_CHECK_CODE(code, lino, _end);
  } else {
    // scan table one by one sequentially
    int32_t       tableCount = 0;
    STableKeyInfo curTable = {0};

    pInfo->countState = TABLE_COUNT_STATE_END;

    for (;;) {
      SSDataBlock* pBlock = NULL;
      code = doGroupedTableScan(pOperator, &pBlock);
      QUERY_CHECK_CODE(code, lino, _end);

      if (pBlock != NULL || pOperator->status == OP_EXEC_DONE || isTaskKilled(pTaskInfo)) {
        (*ppRes) = pBlock;
        return code;
      }

      // if no data, switch to next table and continue scan
      pInfo->currentTable++;

      // The table list is read under the task's read latch; every exit below
      // releases the latch before leaving.
      taosRLockLatch(&pTaskInfo->lock);
      tableCount = 0;
      code = tableListGetSize(pInfo->base.pTableListInfo, &tableCount);
      if (code != TSDB_CODE_SUCCESS) {
        taosRUnLockLatch(&pTaskInfo->lock);
        TSDB_CHECK_CODE(code, lino, _end);
      }

      if (pInfo->currentTable >= tableCount) {
        qDebug("all table checked in table list, total:%d, return NULL, %s", tableCount, GET_TASKID(pTaskInfo));
        taosRUnLockLatch(&pTaskInfo->lock);
        (*ppRes) = NULL;
        return code;
      }

      STableKeyInfo* pKey = (STableKeyInfo*)tableListGetInfo(pInfo->base.pTableListInfo, pInfo->currentTable);
      if (pKey == NULL) {
        taosRUnLockLatch(&pTaskInfo->lock);
        (*ppRes) = NULL;
        QUERY_CHECK_NULL(pKey, code, lino, _end, terrno);
      }

      // Copy the entry while the latch is held, then work on the copy.
      curTable = *pKey;
      taosRUnLockLatch(&pTaskInfo->lock);

      code = pAPI->tsdReader.tsdSetQueryTableList(pInfo->base.dataReader, &curTable, 1);
      QUERY_CHECK_CODE(code, lino, _end);
      qDebug("set uid:%" PRIu64 " into scanner, total tables:%d, index:%d/%d %s", curTable.uid, tableCount,
             pInfo->currentTable, tableCount, GET_TASKID(pTaskInfo));

      code = pAPI->tsdReader.tsdReaderResetStatus(pInfo->base.dataReader, &pInfo->base.cond);
      QUERY_CHECK_CODE(code, lino, _end);
      pInfo->scanTimes = 0;
    }
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s %s failed at line %d since %s", GET_TASKID(pTaskInfo), __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  }

  return code;
}
static int32_t getTableScannerExecInfo(struct SOperatorInfo* pOptr, void** pOptrExplain, uint32_t* len) {
SFileBlockLoadRecorder* pRecorder = taosMemoryCalloc(1, sizeof(SFileBlockLoadRecorder));
2024-08-05 04:22:25 +00:00
if (!pRecorder) {
return terrno;
}
2024-09-11 08:37:06 +00:00
STableScanInfo* pTableScanInfo = pOptr->info;
2022-11-18 01:47:26 +00:00
*pRecorder = pTableScanInfo->base.readRecorder;
*pOptrExplain = pRecorder;
*len = sizeof(SFileBlockLoadRecorder);
return 0;
}
2023-05-23 10:58:54 +00:00
/*
 * Release everything owned by the common part of a table scan:
 * both query conditions, the data reader, the column match list, the table
 * list, the table-meta cache and the pseudo-column expression support.
 *
 * @param pBase  scan base to tear down
 * @param pAPI   reader API table; the reader is only closed when its
 *               tsdReaderClose entry is set
 */
static void destroyTableScanBase(STableScanBase* pBase, TsdReader* pAPI) {
  cleanupQueryTableDataCond(&pBase->cond);
  cleanupQueryTableDataCond(&pBase->orgCond);

  if (pAPI->tsdReaderClose != NULL) {
    pAPI->tsdReaderClose(pBase->dataReader);
  }
  // The reader handle is cleared even when no close callback was available.
  pBase->dataReader = NULL;

  if (NULL != pBase->matchInfo.pList) {
    taosArrayDestroy(pBase->matchInfo.pList);
  }

  tableListDestroy(pBase->pTableListInfo);
  taosLRUCacheCleanup(pBase->metaCache.pTableMetaEntryCache);
  cleanupExprSupp(&pBase->pseudoSup);
}
static void destroyTableScanOperatorInfo(void* param) {
STableScanInfo* pTableScanInfo = (STableScanInfo*)param;
blockDataDestroy(pTableScanInfo->pResBlock);
blockDataDestroy(pTableScanInfo->pOrgBlock);
taosHashCleanup(pTableScanInfo->pIgnoreTables);
2023-05-24 15:49:26 +00:00
destroyTableScanBase(&pTableScanInfo->base, &pTableScanInfo->base.readerAPI);
2022-07-08 06:26:53 +00:00
taosMemoryFreeClear(param);
}
/*
 * Flag every column of pBlock as carrying no data when the scan was asked not
 * to load block data (FUNC_DATA_REQUIRED_NOT_LOAD).
 *
 * A NULL block or any other dataRequireFlag leaves everything untouched.
 */
static void resetClolumnReserve(SSDataBlock* pBlock, int32_t dataRequireFlag) {
  if (pBlock == NULL || dataRequireFlag != FUNC_DATA_REQUIRED_NOT_LOAD) {
    return;
  }

  int32_t total = taosArrayGetSize(pBlock->pDataBlock);
  for (int32_t idx = 0; idx < total; idx++) {
    SColumnInfoData* pColumn = (SColumnInfoData*)taosArrayGet(pBlock->pDataBlock, idx);
    if (pColumn == NULL) {
      continue;
    }
    pColumn->info.noData = true;
  }
}
2024-07-24 09:08:08 +00:00
int32_t createTableScanOperatorInfo(STableScanPhysiNode* pTableScanNode, SReadHandle* readHandle,
2024-07-29 02:35:06 +00:00
STableListInfo* pTableListInfo, SExecTaskInfo* pTaskInfo,
SOperatorInfo** pOptrInfo) {
QRY_PARAM_CHECK(pOptrInfo);
2024-07-24 09:08:08 +00:00
2024-07-19 08:15:37 +00:00
int32_t code = TSDB_CODE_SUCCESS;
int32_t lino = 0;
2022-04-04 06:54:39 +00:00
STableScanInfo* pInfo = taosMemoryCalloc(1, sizeof(STableScanInfo));
SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
if (pInfo == NULL || pOperator == NULL) {
code = terrno;
goto _error;
2022-04-04 06:54:39 +00:00
}
SScanPhysiNode* pScanNode = &pTableScanNode->scan;
2022-11-04 10:46:48 +00:00
SDataBlockDescNode* pDescNode = pScanNode->node.pOutputDataBlockDesc;
int32_t numOfCols = 0;
2023-04-13 06:32:05 +00:00
code =
2022-11-18 01:47:26 +00:00
extractColMatchInfo(pScanNode->pScanCols, pDescNode, &numOfCols, COL_MATCH_FROM_COL_ID, &pInfo->base.matchInfo);
2024-07-19 08:15:37 +00:00
QUERY_CHECK_CODE(code, lino, _error);
2022-11-18 05:40:03 +00:00
initLimitInfo(pScanNode->node.pLimit, pScanNode->node.pSlimit, &pInfo->base.limitInfo);
2023-11-07 11:59:05 +00:00
code = initQueryTableDataCond(&pInfo->base.cond, pTableScanNode, readHandle);
2024-07-19 08:15:37 +00:00
QUERY_CHECK_CODE(code, lino, _error);
2022-11-04 10:46:48 +00:00
if (pScanNode->pScanPseudoCols != NULL) {
2022-11-18 01:47:26 +00:00
SExprSupp* pSup = &pInfo->base.pseudoSup;
2024-08-05 03:57:18 +00:00
pSup->pExprInfo = NULL;
code = createExprInfo(pScanNode->pScanPseudoCols, NULL, &pSup->pExprInfo, &pSup->numOfExprs);
QUERY_CHECK_CODE(code, lino, _error);
2024-07-19 08:15:37 +00:00
pSup->pCtx = createSqlFunctionCtx(pSup->pExprInfo, pSup->numOfExprs, &pSup->rowEntryInfoOffset,
&pTaskInfo->storageAPI.functionStore);
2024-08-05 04:22:25 +00:00
QUERY_CHECK_NULL(pSup->pCtx, code, lino, _error, terrno);
}
pInfo->scanInfo = (SScanInfo){.numOfAsc = pTableScanNode->scanSeq[0], .numOfDesc = pTableScanNode->scanSeq[1]};
2023-02-22 03:09:23 +00:00
pInfo->base.scanFlag = (pInfo->scanInfo.numOfAsc > 1) ? PRE_SCAN : MAIN_SCAN;
2022-11-18 09:27:05 +00:00
2022-11-18 01:47:26 +00:00
pInfo->base.pdInfo.interval = extractIntervalInfo(pTableScanNode);
pInfo->base.readHandle = *readHandle;
2022-12-01 09:24:26 +00:00
pInfo->base.dataBlockLoadFlag = pTableScanNode->dataRequired;
pInfo->sample.sampleRatio = pTableScanNode->ratio;
pInfo->sample.seed = taosGetTimestampSec();
2023-05-24 15:49:26 +00:00
pInfo->base.readerAPI = pTaskInfo->storageAPI.tsdReader;
2022-11-05 17:34:04 +00:00
initResultSizeInfo(&pOperator->resultInfo, 4096);
2022-11-27 16:27:49 +00:00
pInfo->pResBlock = createDataBlockFromDescNode(pDescNode);
resetClolumnReserve(pInfo->pResBlock, pInfo->base.dataBlockLoadFlag);
2024-08-05 03:17:49 +00:00
QUERY_CHECK_NULL(pInfo->pResBlock, code, lino, _error, terrno);
2024-09-11 08:37:06 +00:00
2024-07-19 08:15:37 +00:00
code = prepareDataBlockBuf(pInfo->pResBlock, &pInfo->base.matchInfo);
QUERY_CHECK_CODE(code, lino, _error);
2022-09-20 06:12:39 +00:00
pInfo->virtualStableScan = pScanNode->virtualStableScan;
if (pScanNode->node.dynamicOp && pScanNode->virtualStableScan) {
TSWAP(pInfo->pOrgBlock, pInfo->pResBlock);
pInfo->pResBlock = NULL;
memcpy(&pInfo->base.orgCond, &pInfo->base.cond, sizeof(SQueryTableDataCond));
memset(&pInfo->base.cond, 0, sizeof(SQueryTableDataCond));
}
2025-05-09 10:05:02 +00:00
code = filterInitFromNode((SNode*)pTableScanNode->scan.node.pConditions, &pOperator->exprSupp.pFilterInfo, 0,
&pTaskInfo->pStreamRuntimeInfo);
2024-07-19 08:15:37 +00:00
QUERY_CHECK_CODE(code, lino, _error);
pInfo->currentGroupId = -1;
2022-09-20 06:12:39 +00:00
2023-12-28 17:40:17 +00:00
pInfo->tableEndIndex = -1;
pInfo->assignBlockUid = pTableScanNode->assignBlockUid;
pInfo->hasGroupByTag = pTableScanNode->pGroupTags ? true : false;
2022-11-11 01:12:57 +00:00
setOperatorInfo(pOperator, "TableScanOperator", QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN, false, OP_NOT_OPENED, pInfo,
pTaskInfo);
2022-06-18 04:00:41 +00:00
pOperator->exprSupp.numOfExprs = numOfCols;
2022-05-03 15:23:49 +00:00
2023-12-13 15:25:37 +00:00
pInfo->needCountEmptyTable = tsCountAlwaysReturnValue && pTableScanNode->needCountEmptyTable;
pInfo->ignoreTag = false;
2023-12-13 15:25:37 +00:00
pInfo->base.pTableListInfo = pTableListInfo;
2022-11-18 01:47:26 +00:00
pInfo->base.metaCache.pTableMetaEntryCache = taosLRUCacheInit(1024 * 128, -1, .5);
if (pInfo->base.metaCache.pTableMetaEntryCache == NULL) {
code = terrno;
2024-07-19 08:15:37 +00:00
QUERY_CHECK_CODE(code, lino, _error);
}
pInfo->filesetDelimited = pTableScanNode->filesetDelimited;
2022-11-18 01:47:26 +00:00
taosLRUCacheSetStrictCapacity(pInfo->base.metaCache.pTableMetaEntryCache, false);
2024-08-27 09:04:44 +00:00
pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, doTableScanNext, NULL, destroyTableScanOperatorInfo,
2023-09-01 05:24:47 +00:00
optrDefaultBufFn, getTableScannerExecInfo, optrDefaultGetNextExtFn, NULL);
2022-05-03 15:23:49 +00:00
// for non-blocking operator, the open cost is always 0
pOperator->cost.openCost = 0;
2024-07-24 09:08:08 +00:00
*pOptrInfo = pOperator;
2024-08-29 11:43:59 +00:00
return TSDB_CODE_SUCCESS;
_error:
2022-10-26 05:44:53 +00:00
if (pInfo != NULL) {
2024-09-11 08:37:06 +00:00
pInfo->base.pTableListInfo = NULL; // this attribute will be destroy outside of this function
2022-10-26 05:44:53 +00:00
destroyTableScanOperatorInfo(pInfo);
}
2024-08-07 07:53:23 +00:00
if (pOperator != NULL) {
pOperator->info = NULL;
destroyOperator(pOperator);
}
2022-10-26 05:44:53 +00:00
pTaskInfo->code = code;
2024-07-24 09:08:08 +00:00
return code;
2022-04-04 06:54:39 +00:00
}
2024-07-24 09:08:08 +00:00
/*
 * Build a sequential table scan operator around an existing data reader.
 *
 * @param pReadHandle  stored as the scan's data reader
 * @param pTaskInfo    owning task; receives the error code on failure
 * @param pOptrInfo    receives the new operator on success
 * @return 0 on success; terrno when either allocation fails, in which case
 *         whichever allocation succeeded is freed.
 */
int32_t createTableSeqScanOperatorInfo(void* pReadHandle, SExecTaskInfo* pTaskInfo, SOperatorInfo** pOptrInfo) {
  QRY_PARAM_CHECK(pOptrInfo);

  int32_t         code = 0;
  STableScanInfo* pScan = taosMemoryCalloc(1, sizeof(STableScanInfo));
  SOperatorInfo*  pOptr = taosMemoryCalloc(1, sizeof(SOperatorInfo));

  if (pScan == NULL || pOptr == NULL) {
    code = terrno;

    if (pScan != NULL) {
      taosMemoryFree(pScan);
    }
    if (pOptr != NULL) {
      taosMemoryFree(pOptr);
    }

    pTaskInfo->code = code;
    return code;
  }

  pScan->base.dataReader = pReadHandle;

  setOperatorInfo(pOptr, "TableSeqScanOperator", QUERY_NODE_PHYSICAL_PLAN_TABLE_SEQ_SCAN, false, OP_NOT_OPENED,
                  pScan, pTaskInfo);
  pOptr->fpSet = createOperatorFpSet(optrDummyOpenFn, doTableScanImplNext, NULL, NULL, optrDefaultBufFn, NULL,
                                     optrDefaultGetNextExtFn, NULL);

  *pOptrInfo = pOptr;
  return code;
}
2025-04-24 01:11:54 +00:00
/*
 * Remove from pBlock the rows that lie at or before the position recorded in
 * `offset`.
 *
 * Nothing is done unless the block's window starts at offset->ts and the
 * offset carries a primary key (primaryKey.type != 0). Otherwise a row is
 * kept when its timestamp is greater than offset->ts or its primary key
 * compares greater than the key in the offset. Column 0 is read as the
 * timestamp column and column 1 as the primary key column.
 *
 * @param pBlock  block to filter in place
 * @param offset  position to filter against
 * @return TSDB_CODE_SUCCESS, or an error code when a column is missing, the
 *         key types differ, no comparator exists, or memory runs out.
 */
static int32_t doBlockDataPrimaryKeyFilter(SSDataBlock* pBlock, STqOffsetVal* offset) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;
  bool*   p = NULL;
  void*   pVarKey = NULL;  // offset key in var-data layout, built once for all rows

  if (pBlock->info.window.skey != offset->ts || offset->primaryKey.type == 0) {
    return code;
  }

  p = taosMemoryCalloc(pBlock->info.rows, sizeof(bool));
  QUERY_CHECK_NULL(p, code, lino, _end, terrno);
  bool hasUnqualified = false;

  // Both columns are dereferenced below, so a missing column must fail here
  // instead of crashing.
  SColumnInfoData* pColTs = taosArrayGet(pBlock->pDataBlock, 0);
  QUERY_CHECK_NULL(pColTs, code, lino, _end, terrno);
  SColumnInfoData* pColPk = taosArrayGet(pBlock->pDataBlock, 1);
  QUERY_CHECK_NULL(pColPk, code, lino, _end, terrno);

  qDebug("doBlockDataWindowFilter primary key, ts:%" PRId64 " %" PRId64, offset->ts,
         VALUE_GET_TRIVIAL_DATUM(&offset->primaryKey));
  QUERY_CHECK_CONDITION((pColPk->info.type == offset->primaryKey.type), code, lino, _end,
                        TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);

  __compar_fn_t func = getComparFunc(pColPk->info.type, 0);
  QUERY_CHECK_NULL(func, code, lino, _end, terrno);

  bool isVarKey = IS_VAR_DATA_TYPE(pColPk->info.type);
  if (isVarKey) {
    // The comparison key does not change between rows; build it a single time
    // rather than allocating and freeing it for every row.
    pVarKey = taosMemoryMalloc(offset->primaryKey.nData + VARSTR_HEADER_SIZE);
    QUERY_CHECK_NULL(pVarKey, code, lino, _end, terrno);
    memcpy(varDataVal(pVarKey), offset->primaryKey.pData, offset->primaryKey.nData);
    varDataLen(pVarKey) = offset->primaryKey.nData;
  }

  for (int32_t i = 0; i < pBlock->info.rows; ++i) {
    int64_t* ts = (int64_t*)colDataGetData(pColTs, i);
    void*    data = colDataGetData(pColPk, i);
    if (isVarKey) {
      p[i] = (*ts > offset->ts) || (func(data, pVarKey) > 0);
    } else {
      p[i] = (*ts > offset->ts) || (func(data, VALUE_GET_DATUM(&offset->primaryKey, pColPk->info.type)) > 0);
    }

    if (!p[i]) {
      hasUnqualified = true;
    }
  }

  // Only rewrite the block when at least one row has to go.
  if (hasUnqualified) {
    code = trimDataBlock(pBlock, pBlock->info.rows, p);
    QUERY_CHECK_CODE(code, lino, _end);
  }

_end:
  taosMemoryFree(pVarKey);
  taosMemoryFree(p);
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2025-04-24 01:11:54 +00:00
/*
 * Filter a snapshot block against the current offset and then advance the
 * offset to the end of the block.
 *
 * With hasPrimaryKey set, rows already covered by `offset` are removed via
 * doBlockDataPrimaryKeyFilter() and the primary key of the last remaining row
 * (column 1) is captured. If no row remains, the offset is left unchanged.
 * Finally the offset is reset to (block uid, window.ekey, captured key); the
 * key stays zero-initialised when hasPrimaryKey is false.
 *
 * @param pBlock         block to process, filtered in place
 * @param hasPrimaryKey  whether the table has a primary key column
 * @param offset         offset to filter against and to update
 * @return TSDB_CODE_SUCCESS or the error code of the failing step.
 */
static int32_t processPrimaryKey(SSDataBlock* pBlock, bool hasPrimaryKey, STqOffsetVal* offset) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;
  SValue  val = {0};

  if (hasPrimaryKey) {
    code = doBlockDataPrimaryKeyFilter(pBlock, offset);
    if (code != TSDB_CODE_SUCCESS) {
      qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(code));
      return code;
    }

    if (pBlock->info.rows < 1) {
      return code;
    }

    // The column is dereferenced below; fail cleanly when it is absent.
    SColumnInfoData* pColPk = taosArrayGet(pBlock->pDataBlock, 1);
    QUERY_CHECK_NULL(pColPk, code, lino, _end, terrno);

    void* tmp = colDataGetData(pColPk, pBlock->info.rows - 1);
    val.type = pColPk->info.type;
    if (IS_VAR_DATA_TYPE(pColPk->info.type)) {
      // Copy the payload only (without the var-data header) into val.
      val.pData = taosMemoryMalloc(varDataLen(tmp));
      QUERY_CHECK_NULL(val.pData, code, lino, _end, terrno);
      val.nData = varDataLen(tmp);
      memcpy(val.pData, varDataVal(tmp), varDataLen(tmp));
    } else {
      valueSetDatum(&val, pColPk->info.type, tmp, pColPk->info.bytes);
    }
  }

  tqOffsetResetToData(offset, pBlock->info.id.uid, pBlock->info.window.ekey, val);

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2025-05-06 10:05:47 +00:00
/*
 * Produce the next block for a queue scan, driven by the task's current
 * offset (pTaskInfo->streamInfo.currentOffset).
 *
 *  - TMQ_OFFSET__SNAPSHOT_DATA: blocks are pulled from the inner table scan
 *    operator and passed through processPrimaryKey(). When the table scan
 *    yields nothing more, its data reader is closed, the tq reader is seeked
 *    to snapshotVer + 1 and the offset is switched to the log, after which
 *    the log branch below runs in the same call.
 *  - TMQ_OFFSET__LOG: blocks are read from the WAL through the tq reader.
 *  - any other offset type: an error is logged and NULL is returned.
 *
 * @param pOperator  the queue (stream) scan operator
 * @param ppRes      receives the produced block, or NULL
 * @return TSDB_CODE_SUCCESS on the normal paths, pTaskInfo->code when the
 *         task has been killed. Failures that reach `_end` are stored in
 *         pTaskInfo->code and raised through T_LONG_JMP.
 */
static int32_t doQueueScanNext(SOperatorInfo* pOperator, SSDataBlock** ppRes) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI* pAPI = &pTaskInfo->storageAPI;
  SStreamScanInfo* pInfo = pOperator->info;
  const char* id = GET_TASKID(pTaskInfo);
  qDebug("start to exec queue scan, %s", id);
  if (isTaskKilled(pTaskInfo)) {
    (*ppRes) = NULL;
    return pTaskInfo->code;
  }
  if (pTaskInfo->streamInfo.currentOffset.type == TMQ_OFFSET__SNAPSHOT_DATA) {
    while (1) {
      SSDataBlock* pResult = NULL;
      code = doTableScanNext(pInfo->pTableScanOp, &pResult);
      QUERY_CHECK_CODE(code, lino, _end);
      if (pResult && pResult->info.rows > 0) {
        bool hasPrimaryKey = pAPI->tqReaderFn.tqGetTablePrimaryKey(pInfo->tqReader);
        code = processPrimaryKey(pResult, hasPrimaryKey, &pTaskInfo->streamInfo.currentOffset);
        QUERY_CHECK_CODE(code, lino, _end);
        qDebug("tmqsnap doQueueScan get data utid:%" PRId64, pResult->info.id.uid);
        // processPrimaryKey() may have filtered out every row; in that case
        // keep pulling from the table scan.
        if (pResult->info.rows > 0) {
          (*ppRes) = pResult;
          return code;
        }
      } else {
        // no block, or an empty one: the table scan is finished
        break;
      }
    }
    // Table scan done: close its reader and continue from the WAL, starting
    // right after the snapshot version.
    STableScanInfo* pTSInfo = pInfo->pTableScanOp->info;
    pAPI->tsdReader.tsdReaderClose(pTSInfo->base.dataReader);
    pTSInfo->base.dataReader = NULL;
    int64_t validVer = pTaskInfo->streamInfo.snapshotVer + 1;
    qDebug("queue scan tsdb over, switch to wal ver %" PRId64, validVer);
    // A failed seek ends this call with no block and without switching the
    // offset to the log; `code` is still TSDB_CODE_SUCCESS here.
    if (pAPI->tqReaderFn.tqReaderSeek(pInfo->tqReader, validVer, pTaskInfo->id.str) < 0) {
      (*ppRes) = NULL;
      return code;
    }
    tqOffsetResetToLog(&pTaskInfo->streamInfo.currentOffset, validVer);
  }
  if (pTaskInfo->streamInfo.currentOffset.type == TMQ_OFFSET__LOG) {
    while (1) {
      bool hasResult =
          pAPI->tqReaderFn.tqReaderNextBlockInWal(pInfo->tqReader, id, pTaskInfo->streamInfo.sourceExcluded);
      SSDataBlock* pRes = pAPI->tqReaderFn.tqGetResultBlock(pInfo->tqReader);
      struct SWalReader* pWalReader = pAPI->tqReaderFn.tqReaderGetWalReader(pInfo->tqReader);
      // curVersion move to next
      tqOffsetResetToLog(&pTaskInfo->streamInfo.currentOffset, pWalReader->curVersion);
      // use ts to pass time when replay, because ts not used if type is log
      pTaskInfo->streamInfo.currentOffset.ts = pAPI->tqReaderFn.tqGetResultBlockTime(pInfo->tqReader);
      if (hasResult) {
        qDebug("doQueueScan get data from log %" PRId64 " rows, version:%" PRId64, pRes->info.rows,
               pTaskInfo->streamInfo.currentOffset.version);
        blockDataCleanup(pInfo->pRes);
        STimeWindow defaultWindow = {.skey = INT64_MIN, .ekey = INT64_MAX};
        // NOTE(review): the call below, which presumably copied pRes into
        // pInfo->pRes, is disabled. As written nothing in this function fills
        // pInfo->pRes after the cleanup above, `defaultWindow` is unused, and
        // the following QUERY_CHECK_CODE re-checks an unchanged `code`.
        // Confirm whether the rows > 0 test below can still succeed.
        // code = setBlockIntoRes(pInfo, pRes, &defaultWindow, true);
        QUERY_CHECK_CODE(code, lino, _end);
        qDebug("doQueueScan after filter get data from log %" PRId64 " rows, version:%" PRId64, pInfo->pRes->info.rows,
               pTaskInfo->streamInfo.currentOffset.version);
        if (pInfo->pRes->info.rows > 0) {
          (*ppRes) = pInfo->pRes;
          return code;
        }
      } else {
        qDebug("doQueueScan get none from log, return, version:%" PRId64, pTaskInfo->streamInfo.currentOffset.version);
        (*ppRes) = NULL;
        return code;
      }
    }
  } else {
    qError("unexpected streamInfo prepare type: %d", pTaskInfo->streamInfo.currentOffset.type);
    (*ppRes) = NULL;
    return code;
  }
_end:
  // Only reached through the QUERY_CHECK_CODE jumps above.
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  }
  (*ppRes) = NULL;
  return code;
}
/*
 * Pointer-returning wrapper around doQueueScanNext().
 *
 * @param pOperator  the queue scan operator
 * @return the next block, or NULL when there is none or when
 *         doQueueScanNext() reports a non-zero status code.
 */
static SSDataBlock* doQueueScan(SOperatorInfo* pOperator) {
  SSDataBlock* pRes = NULL;
  int32_t      code = doQueueScanNext(pOperator, &pRes);

  // Do not silently drop the status: a failed call never hands out a block.
  // 0 is the success code.
  return (code == 0) ? pRes : NULL;
}
feat(stream): add new trigger continuous_window_close (#30125) * opt stream build twa result * opt force window close memory * feat(stream):optimize new interval and scan operator * adj log * opt code * opt code * fill history * fix issue for fill history * add ci * feat(stream): add new stream nonblock interval operator * adjust code * use new scan operator * use new scan operator * add log * fix issue * recover stream scan next function * fix issue * fix issue * fix issue * ignore disorder data * fix issue * fix issue for interval sliding * fix issue * fix ci issue * fix ci issue * fix ci issue * add semi && final nonblock interval operator * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * refactor(stream): track the msgId for each upstream tasks. * fix(stream): fix race condition. * fix(stream): update the task last msgId when putting into input queue succ. * fix issue * fix issue * put recalculate data to rocksdb * fix issue * fix issue * enh(query)[TD-33071]: add support for saving and restoring tsdbReader scan progress - Implement functionality to save scan progress during tsdbReader operations - Enable resuming scans from the last saved position * fix issue * fix issue * fix issue * fix issue * fix issue * add rec interval check * enh(stream):add recalculate tasks. * enh(stream): support the re-calculate the tasks. * fix issue && do refactor * do refactor * fix issue * fix issue * update backend opt * add new interface * add new session operator * support blob * add new session operator * fix issue * add rec state for rec task * fix invalid read * add new session window * enh(stream): update the stream tasks backend. * new session operator * add pull data * fix(stream): fix error in expand stream backend. * fix issue * fix issue * fix issue * merge code * fix issue * fix(stream): check for null ptr. * fix(stream): add more check. 
* fix issue * fix issue * fix issue * add debug code * fix issue * fix issue * fix issue * set rec end flag * fix(stream): opt re-calculate stream tasks. * fix issue * fix issue * add new operator * enh(stream): dispatch recalculate block to agg tasks. * fix issue * fix issue * fix(stream): adjust filter. * fix issue * refactor * refactor(stream): adjust the recalculate end block. * fix issue * fix(stream): set correct create trigger block. * fix issue * fix(stream): fix error in build recalculate end block. * fix(stream): check null ptr. * add stream client && fix issue * fix mem leak * fix(stream): free msg. * add stream client * fix(stream): fix error. * add stream client && fix issue * add stream client * refactor(stream): set the recalculate task complete. * add wend and group_id for session window dest table * feat(stream): refactor and set the recalcul agg task complete. * add cfg for adapter * fix issue * add state && event operator * feat(stream): support fill-history task. * add new fill operator * fix(stream): set correct backend when updating fill-history task to recalculate task. * add new fill operator * fix(stream): s2025-03-06 11:10:31.272 et ops always open in scan tsdb * fix(stream):set the correct taskType for sink task. * new fill operator * adj stream fill operator * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * fix issue * adj test * fix issue * fix(stream): fix issue * fix(steam): fix issue * fix(steam): fix issue * fix(steam): fix issue * fix(steam): fix issue * fix(stream): fix issue * fix(stream): fix issue * fix(stream): fix issue * fix: ut com error * fix(stream): fix mem leak and adjust operator type check rule * fix(stream): fix mem leak and adjust test case * refactor code * fix(stream): free items. * fix(stream): free fix memory leak. * fix(stream): fix syntax error. 
* fix: ignore unexpect block * fix: adjust op type --------- Co-authored-by: Haojun Liao <hjliao@taosdata.com> Co-authored-by: Jinqing Kuang <kuangjinqingcn@gmail.com> Co-authored-by: yihaoDeng <luomoxyz@126.com>
2025-03-14 12:14:01 +00:00
/*
 * Build an array holding the uid of every table in pTableListInfo.
 *
 * @param pTableListInfo  table list to read
 * @param ppArrayRes      receives a newly created array of uint64_t uids on
 *                        success; left untouched on failure
 * @return TSDB_CODE_SUCCESS, or the error code of the failing step. The
 *         partially built array is destroyed on failure, so nothing leaks.
 */
int32_t extractTableIdList(const STableListInfo* pTableListInfo, SArray** ppArrayRes) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;
  int32_t size = 0;

  SArray* tableIdList = taosArrayInit(4, sizeof(uint64_t));
  QUERY_CHECK_NULL(tableIdList, code, lino, _end, terrno);

  // Transfer the Array of STableKeyInfo into uid list.
  code = tableListGetSize(pTableListInfo, &size);
  QUERY_CHECK_CODE(code, lino, _end);

  for (int32_t i = 0; i < size; ++i) {
    STableKeyInfo* pkeyInfo = tableListGetInfo(pTableListInfo, i);
    QUERY_CHECK_NULL(pkeyInfo, code, lino, _end, terrno);

    void* tmp = taosArrayPush(tableIdList, &pkeyInfo->uid);
    QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
  }

  // Ownership moves to the caller; clear the local so the cleanup below
  // leaves the returned array alone.
  (*ppArrayRes) = tableIdList;
  tableIdList = NULL;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  // Still set only when the array was not handed to the caller.
  if (tableIdList != NULL) {
    taosArrayDestroy(tableIdList);
  }
  return code;
}
2024-07-24 08:17:28 +00:00
// Produce the next result of the raw snapshot scan (log prefix "tmqsnap").
//
// The behaviour depends on pTaskInfo->streamInfo.currentOffset.type:
//  - TMQ_OFFSET__SNAPSHOT_DATA: when the data reader has another non-empty block, that block is
//    handed back through ppRes. Otherwise the next table is requested from the snapshot context
//    and the scan is re-prepared for it (or for the WAL when no table is left or only meta is
//    wanted); ppRes is NULL in that case.
//  - TMQ_OFFSET__SNAPSHOT_META: up to tmqRowSize meta entries are encoded and appended to
//    streamInfo.btMetaRsp.batchMetaReq / batchMetaLen; ppRes is NULL.
//
// Returns TSDB_CODE_SUCCESS on the regular paths. When a checked call fails, the code is stored
// in pTaskInfo->code and T_LONG_JMP(pTaskInfo->env, code) is invoked.
static int32_t doRawScanNext(SOperatorInfo* pOperator, SSDataBlock** ppRes) {
  int32_t             code = TSDB_CODE_SUCCESS;
  int32_t             lino = 0;
  SExecTaskInfo*      pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*        pAPI = &pTaskInfo->storageAPI;
  SStreamRawScanInfo* pInfo = pOperator->info;

  pTaskInfo->streamInfo.btMetaRsp.batchMetaReq = NULL;  // use batchMetaReq != NULL to judge if data is meta
  pTaskInfo->streamInfo.btMetaRsp.batchMetaLen = NULL;

  qDebug("tmqsnap doRawScan called");
  if (pTaskInfo->streamInfo.currentOffset.type == TMQ_OFFSET__SNAPSHOT_DATA) {
    bool hasNext = false;
    if (pInfo->dataReader && pInfo->sContext->withMeta != ONLY_META) {
      code = pAPI->tsdReader.tsdNextDataBlock(pInfo->dataReader, &hasNext);
      if (code != TSDB_CODE_SUCCESS) {
        pAPI->tsdReader.tsdReaderReleaseDataBlock(pInfo->dataReader);
        QUERY_CHECK_CODE(code, lino, _end);
      }
    }

    if (pInfo->dataReader && hasNext) {
      if (isTaskKilled(pTaskInfo)) {
        pAPI->tsdReader.tsdReaderReleaseDataBlock(pInfo->dataReader);
        // make the "no block" outcome explicit, like every other exit of this function
        (*ppRes) = NULL;
        return code;
      }

      SSDataBlock* pBlock = NULL;
      code = pAPI->tsdReader.tsdReaderRetrieveDataBlock(pInfo->dataReader, &pBlock, NULL);
      QUERY_CHECK_CODE(code, lino, _end);

      if (pBlock && pBlock->info.rows > 0) {
        bool hasPrimaryKey = pAPI->snapshotFn.taosXGetTablePrimaryKey(pInfo->sContext);
        code = processPrimaryKey(pBlock, hasPrimaryKey, &pTaskInfo->streamInfo.currentOffset);
        QUERY_CHECK_CODE(code, lino, _end);
        qDebug("tmqsnap doRawScan get data uid:%" PRId64, pBlock->info.id.uid);
        (*ppRes) = pBlock;
        return code;
      }
    }

    // current table exhausted (or no reader): ask the snapshot for the next table
    SMetaTableInfo mtInfo = {0};
    code = pAPI->snapshotFn.getMetaTableInfoFromSnapshot(pInfo->sContext, &mtInfo);
    if (code != TSDB_CODE_SUCCESS) {
      // release mtInfo before jumping; checking the code first would skip this cleanup
      destroyMetaTableInfo(&mtInfo);
      QUERY_CHECK_CODE(code, lino, _end);
    }

    STqOffsetVal offset = {0};
    if (mtInfo.uid == 0 || pInfo->sContext->withMeta == ONLY_META) {  // read snapshot done, change to get data from wal
      qDebug("tmqsnap read snapshot done, change to get data from wal");
      tqOffsetResetToLog(&offset, pInfo->sContext->snapVersion + 1);
    } else {
      SValue val = {0};
      tqOffsetResetToData(&offset, mtInfo.uid, INT64_MIN, val);
      qDebug("tmqsnap change get data uid:%" PRId64, mtInfo.uid);
    }
    destroyMetaTableInfo(&mtInfo);

    code = qStreamPrepareScan(pTaskInfo, &offset, pInfo->sContext->subType);
    QUERY_CHECK_CODE(code, lino, _end);
    (*ppRes) = NULL;
    return code;
  } else if (pTaskInfo->streamInfo.currentOffset.type == TMQ_OFFSET__SNAPSHOT_META) {
    SSnapContext* sContext = pInfo->sContext;
    for (int32_t i = 0; i < tmqRowSize; i++) {
      void*   data = NULL;
      int32_t dataLen = 0;
      int16_t type = 0;
      int64_t uid = 0;
      if (pAPI->snapshotFn.getTableInfoFromSnapshot(sContext, &data, &dataLen, &type, &uid) < 0) {
        qError("tmqsnap getTableInfoFromSnapshot error");
        taosMemoryFreeClear(data);
        break;
      }

      if (!sContext->queryMeta) {  // change to get data next poll request
        STqOffsetVal offset = {0};
        SValue       val = {0};
        tqOffsetResetToData(&offset, 0, INT64_MIN, val);
        code = qStreamPrepareScan(pTaskInfo, &offset, pInfo->sContext->subType);
        QUERY_CHECK_CODE(code, lino, _end);
        break;
      } else {
        tqOffsetResetToMeta(&pTaskInfo->streamInfo.currentOffset, uid);
        SMqMetaRsp tmpMetaRsp = {0};
        tmpMetaRsp.resMsgType = type;
        tmpMetaRsp.metaRspLen = dataLen;
        tmpMetaRsp.metaRsp = data;

        // the batch arrays are created lazily, on the first meta entry of this call
        if (!pTaskInfo->streamInfo.btMetaRsp.batchMetaReq) {
          pTaskInfo->streamInfo.btMetaRsp.batchMetaReq = taosArrayInit(4, POINTER_BYTES);
          if (pTaskInfo->streamInfo.btMetaRsp.batchMetaReq == NULL) {
            taosMemoryFreeClear(data);  // do not leak the entry on the error jump
            QUERY_CHECK_NULL(pTaskInfo->streamInfo.btMetaRsp.batchMetaReq, code, lino, _end, terrno);
          }

          pTaskInfo->streamInfo.btMetaRsp.batchMetaLen = taosArrayInit(4, sizeof(int32_t));
          if (pTaskInfo->streamInfo.btMetaRsp.batchMetaLen == NULL) {
            taosMemoryFreeClear(data);
            QUERY_CHECK_NULL(pTaskInfo->streamInfo.btMetaRsp.batchMetaLen, code, lino, _end, terrno);
          }
        }

        int32_t  tempRes = TSDB_CODE_SUCCESS;
        uint32_t len = 0;
        tEncodeSize(tEncodeMqMetaRsp, &tmpMetaRsp, len, tempRes);
        if (TSDB_CODE_SUCCESS != tempRes) {
          qError("tmqsnap tEncodeMqMetaRsp error");
          taosMemoryFreeClear(data);
          break;
        }

        // output buffer layout: [SMqRspHead][encoded SMqMetaRsp]
        int32_t tLen = sizeof(SMqRspHead) + len;
        void*   tBuf = taosMemoryCalloc(1, tLen);
        if (tBuf == NULL) {
          taosMemoryFreeClear(data);
          QUERY_CHECK_NULL(tBuf, code, lino, _end, terrno);
        }

        void*    metaBuff = POINTER_SHIFT(tBuf, sizeof(SMqRspHead));
        SEncoder encoder = {0};
        tEncoderInit(&encoder, metaBuff, len);
        int32_t tempLen = tEncodeMqMetaRsp(&encoder, &tmpMetaRsp);
        if (tempLen < 0) {
          qError("tmqsnap tEncodeMqMetaRsp error");
          tEncoderClear(&encoder);
          taosMemoryFreeClear(tBuf);
          taosMemoryFreeClear(data);
          break;
        }
        taosMemoryFreeClear(data);

        void* tmp = taosArrayPush(pTaskInfo->streamInfo.btMetaRsp.batchMetaReq, &tBuf);
        if (tmp == NULL) {
          taosMemoryFreeClear(tBuf);  // the array did not take the buffer, release it here
          QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
        }

        tmp = taosArrayPush(pTaskInfo->streamInfo.btMetaRsp.batchMetaLen, &tLen);
        QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
      }
    }

    (*ppRes) = NULL;
    return code;
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  }

  (*ppRes) = NULL;
  return code;
}
2022-08-25 09:36:00 +00:00
static void destroyRawScanOperatorInfo(void* param) {
2022-08-05 13:12:18 +00:00
SStreamRawScanInfo* pRawScan = (SStreamRawScanInfo*)param;
2023-05-23 10:58:54 +00:00
pRawScan->pAPI->tsdReader.tsdReaderClose(pRawScan->dataReader);
pRawScan->pAPI->snapshotFn.destroySnapshot(pRawScan->sContext);
2024-07-24 09:08:08 +00:00
tableListDestroy(pRawScan->pTableListInfo);
2022-08-05 13:12:18 +00:00
taosMemoryFree(pRawScan);
}
2022-07-10 12:48:02 +00:00
// Used when subscribing to a db or stb (not including column subscriptions).
// When this scan is used, metadata can be returned as well,
// and schemas are decided while scanning.
2024-07-24 09:08:08 +00:00
// Build a "RawScanOperator" and hand it back through pOptrInfo.
//
// The operator's private info keeps the vnode and snapshot context taken from pHandle, a pointer
// to the task's storage API and a freshly created table list. On failure both allocations are
// freed, the error is logged and mirrored into pTaskInfo->code, and the error code is returned.
int32_t createRawScanOperatorInfo(SReadHandle* pHandle, SExecTaskInfo* pTaskInfo, SOperatorInfo** pOptrInfo) {
  QRY_PARAM_CHECK(pOptrInfo);

  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;

  SStreamRawScanInfo* pInfo = taosMemoryCalloc(1, sizeof(SStreamRawScanInfo));
  SOperatorInfo*      pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (NULL == pInfo || NULL == pOperator) {
    code = terrno;
    lino = __LINE__;
    goto _end;
  }

  // plain pointer copies first; nothing here can fail
  pInfo->vnode = pHandle->vnode;
  pInfo->sContext = pHandle->sContext;
  pInfo->pAPI = &pTaskInfo->storageAPI;

  pInfo->pTableListInfo = tableListCreate();
  QUERY_CHECK_NULL(pInfo->pTableListInfo, code, lino, _end, terrno);

  setOperatorInfo(pOperator, "RawScanOperator", QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN, false, OP_NOT_OPENED, pInfo,
                  pTaskInfo);
  pOperator->fpSet = createOperatorFpSet(NULL, doRawScanNext, NULL, destroyRawScanOperatorInfo, optrDefaultBufFn, NULL,
                                         optrDefaultGetNextExtFn, NULL);

  *pOptrInfo = pOperator;
  return TSDB_CODE_SUCCESS;

_end:
  // only reached through an error jump
  if (TSDB_CODE_SUCCESS != code) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  taosMemoryFree(pInfo);
  taosMemoryFree(pOperator);
  pTaskInfo->code = code;
  return code;
}
void destroyStreamScanOperatorInfo(void* param) {
2024-08-14 03:12:50 +00:00
if (param == NULL) {
return;
}
2024-09-14 05:39:23 +00:00
SStreamScanInfo* pStreamScan = (SStreamScanInfo*)param;
2022-07-14 07:32:21 +00:00
if (pStreamScan->pTableScanOp && pStreamScan->pTableScanOp->info) {
2023-04-27 16:23:38 +00:00
destroyOperator(pStreamScan->pTableScanOp);
2022-07-14 07:32:21 +00:00
}
2024-08-07 07:33:09 +00:00
if (pStreamScan->tqReader != NULL && pStreamScan->readerFn.tqReaderClose != NULL) {
pStreamScan->readerFn.tqReaderClose(pStreamScan->tqReader);
2022-07-14 07:32:21 +00:00
}
if (pStreamScan->pVtableMergeHandles) {
taosHashCleanup(pStreamScan->pVtableMergeHandles);
pStreamScan->pVtableMergeHandles = NULL;
}
if (pStreamScan->pVtableMergeBuf) {
destroyDiskbasedBuf(pStreamScan->pVtableMergeBuf);
pStreamScan->pVtableMergeBuf = NULL;
}
if (pStreamScan->pVtableReadyHandles) {
taosArrayDestroy(pStreamScan->pVtableReadyHandles);
pStreamScan->pVtableReadyHandles = NULL;
}
if (pStreamScan->pTableListInfo) {
tableListDestroy(pStreamScan->pTableListInfo);
pStreamScan->pTableListInfo = NULL;
}
2022-10-24 08:44:44 +00:00
if (pStreamScan->matchInfo.pList) {
taosArrayDestroy(pStreamScan->matchInfo.pList);
2022-07-14 07:32:21 +00:00
}
2022-08-04 13:31:13 +00:00
if (pStreamScan->pPseudoExpr) {
destroyExprInfo(pStreamScan->pPseudoExpr, pStreamScan->numOfPseudoExpr);
2022-08-31 03:35:25 +00:00
taosMemoryFree(pStreamScan->pPseudoExpr);
2022-08-04 13:31:13 +00:00
}
2022-08-04 13:27:01 +00:00
2022-11-15 10:32:08 +00:00
cleanupExprSupp(&pStreamScan->tbnameCalSup);
2023-01-10 02:13:56 +00:00
cleanupExprSupp(&pStreamScan->tagCalSup);
2022-11-15 10:32:08 +00:00
2022-07-14 07:32:21 +00:00
blockDataDestroy(pStreamScan->pRes);
blockDataDestroy(pStreamScan->pUpdateRes);
blockDataDestroy(pStreamScan->pDeleteDataRes);
2022-07-22 11:20:22 +00:00
blockDataDestroy(pStreamScan->pUpdateDataRes);
2023-01-10 02:13:56 +00:00
blockDataDestroy(pStreamScan->pCreateTbRes);
2022-07-14 07:32:21 +00:00
taosArrayDestroy(pStreamScan->pBlockLists);
2023-09-01 05:24:47 +00:00
blockDataDestroy(pStreamScan->pCheckpointRes);
2022-07-14 07:32:21 +00:00
taosMemoryFree(pStreamScan);
}
2024-07-19 08:15:37 +00:00
// Append one column description (type/bytes, everything else zeroed) to pBlock->pDataBlock
// and grow pBlock->info.rowSize by `bytes`.
//
// Returns TSDB_CODE_SUCCESS, or terrno when the array push fails. On failure the block is
// left untouched: rowSize is only increased after the column has actually been added.
int32_t addPrimaryKeyCol(SSDataBlock* pBlock, uint8_t type, int32_t bytes) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;

  SColumnInfoData infoData = {0};
  infoData.info.type = type;
  infoData.info.bytes = bytes;

  void* tmp = taosArrayPush(pBlock->pDataBlock, &infoData);
  QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);

  // account for the new column only once it is really part of the block
  pBlock->info.rowSize += bytes;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
// Create a data block with one column per entry of pMatchInfo->pList that has needOutput set;
// each column takes its type, byte width and column id from the match item.
//
// Returns the new block, or NULL on failure. On failure the partially built block is
// destroyed, the error is logged together with idstr and also stored in terrno.
static SSDataBlock* createStreamVtableBlock(SColMatchInfo *pMatchInfo, const char *idstr) {
  int32_t      code = TSDB_CODE_SUCCESS;
  int32_t      lino = 0;
  int32_t      numOfOutput = 0;
  SSDataBlock *pRes = NULL;

  QUERY_CHECK_NULL(pMatchInfo, code, lino, _end, TSDB_CODE_INVALID_PARA);

  code = createDataBlock(&pRes);
  QUERY_CHECK_CODE(code, lino, _end);

  numOfOutput = taosArrayGetSize(pMatchInfo->pList);
  for (int32_t i = 0; i < numOfOutput; ++i) {
    SColMatchItem* pItem = taosArrayGet(pMatchInfo->pList, i);
    // guard the lookup before dereferencing, as done for other taosArrayGet calls in this file
    QUERY_CHECK_NULL(pItem, code, lino, _end, terrno);
    if (!pItem->needOutput) {
      continue;
    }
    SColumnInfoData colInfo = createColumnInfoData(pItem->dataType.type, pItem->dataType.bytes, pItem->colId);
    code = blockDataAppendColInfo(pRes, &colInfo);
    QUERY_CHECK_CODE(code, lino, _end);
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s, id: %s", __func__, lino, tstrerror(code), idstr);
    if (pRes != NULL) {
      blockDataDestroy(pRes);
    }
    pRes = NULL;
    terrno = code;
  }
  return pRes;
}
// Fill one output row of pRes (at index pRes->info.rows) for the table at pInfo->curPos.
//
// The table entry is loaded through mr via getTableEntryByUid; each output expression is then
// evaluated as tbname, table uid, vgroup id, or a tag value extracted from the entry's tags.
// On success pRes->info.rows is incremented. On failure the error code is returned and stored
// in pTaskInfo->code, and the row count is left unchanged.
static int32_t doTagScanOneTable(SOperatorInfo* pOperator, SSDataBlock* pRes, SMetaReader* mr, SStorageAPI* pAPI) {
  int32_t        code = TSDB_CODE_SUCCESS;
  int32_t        lino = 0;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  STagScanInfo*  pInfo = pOperator->info;
  SExprInfo*     pExprInfo = &pOperator->exprSupp.pExprInfo[0];
  int32_t        count = pRes->info.rows;

  STableKeyInfo* item = tableListGetInfo(pInfo->pTableListInfo, pInfo->curPos);
  if (!item) {
    // item is NULL here, so it must not be dereferenced for the log message; also report a real
    // error so the caller does not count a row that was never written
    code = (terrno != TSDB_CODE_SUCCESS) ? terrno : TSDB_CODE_INVALID_PARA;
    lino = __LINE__;
    qError("failed to get table info, pos:%d, code:%s, %s", (int32_t)pInfo->curPos, tstrerror(code),
           GET_TASKID(pTaskInfo));
    tDecoderClear(&(*mr).coder);
    goto _end;
  }

  code = pAPI->metaReaderFn.getTableEntryByUid(mr, item->uid);
  tDecoderClear(&(*mr).coder);
  if (code != TSDB_CODE_SUCCESS) {
    lino = __LINE__;
    qError("failed to get table meta, uid:0x%" PRIx64 ", code:%s, %s", item->uid, tstrerror(terrno),
           GET_TASKID(pTaskInfo));
    goto _end;
  }

  char str[512];
  for (int32_t j = 0; j < pOperator->exprSupp.numOfExprs; ++j) {
    SColumnInfoData* pDst = taosArrayGet(pRes->pDataBlock, pExprInfo[j].base.resSchema.slotId);
    QUERY_CHECK_NULL(pDst, code, lino, _end, terrno);

    // refactor later
    if (FUNCTION_TYPE_TBNAME == pExprInfo[j].pExpr->_function.functionType) {
      STR_TO_VARSTR(str, (*mr).me.name);
      code = colDataSetVal(pDst, (count), str, false);
      QUERY_CHECK_CODE(code, lino, _end);
    } else if (FUNCTION_TYPE_TBUID == pExprInfo[j].pExpr->_function.functionType) {
      code = colDataSetVal(pDst, (count), (char*)&(*mr).me.uid, false);
      QUERY_CHECK_CODE(code, lino, _end);
    } else if (FUNCTION_TYPE_VGID == pExprInfo[j].pExpr->_function.functionType) {
      code = colDataSetVal(pDst, (count), (char*)&pTaskInfo->id.vgId, false);
      QUERY_CHECK_CODE(code, lino, _end);
    } else {  // it is a tag value
      STagVal val = {0};
      val.cid = pExprInfo[j].base.pParam[0].pCol->colId;
      const char* p = pAPI->metaFn.extractTagVal((*mr).me.ctbEntry.pTags, pDst->info.type, &val);

      char* data = NULL;
      if (pDst->info.type != TSDB_DATA_TYPE_JSON && p != NULL) {
        data = tTagValToData((const STagVal*)p, false);
      } else {
        data = (char*)p;
      }

      code = colDataSetVal(pDst, (count), data,
                           (data == NULL) || (pDst->info.type == TSDB_DATA_TYPE_JSON && tTagIsJsonNull(data)));

      // release the temporary buffer before checking the result so it cannot leak on failure
      if ((pDst->info.type != TSDB_DATA_TYPE_JSON) && (p != NULL) && IS_VAR_DATA_TYPE(((const STagVal*)p)->type) &&
          (data != NULL)) {
        taosMemoryFree(data);
      }
      QUERY_CHECK_CODE(code, lino, _end);
    }
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
  } else {
    pRes->info.rows++;
  }

  return code;
}
2023-09-01 05:24:47 +00:00
static void tagScanFreeUidTag(void* p) {
STUidTagInfo* pInfo = p;
if (pInfo->pTagVal != NULL) {
taosMemoryFree(pInfo->pTagVal);
}
}
// Allocate a column of the given type with capacity for numOfRows rows and attach it to pParam
// (columnData is set and colAlloced becomes true).
// Returns TSDB_CODE_SUCCESS, or terrno when either the allocation or the capacity request fails;
// in the latter case the column structure is freed and terrno is set to the failing code.
static int32_t tagScanCreateResultData(SDataType* pType, int32_t numOfRows, SScalarParam* pParam) {
  SColumnInfoData* pCol = taosMemoryCalloc(1, sizeof(SColumnInfoData));
  if (NULL == pCol) {
    return terrno;
  }

  // copy the type description into the new column
  pCol->info.type = pType->type;
  pCol->info.bytes = pType->bytes;
  pCol->info.scale = pType->scale;
  pCol->info.precision = pType->precision;

  int32_t rc = colInfoDataEnsureCapacity(pCol, numOfRows, true);
  if (TSDB_CODE_SUCCESS == rc) {
    pParam->columnData = pCol;
    pParam->colAlloced = true;
    return TSDB_CODE_SUCCESS;
  }

  terrno = rc;
  taosMemoryFree(pCol);
  return terrno;
}
// Node-rewrite callback used on the tag condition (pContext is a STagScanFilterContext).
//
// Column nodes are used as they are; a tbname function node is replaced by a new column node
// (colId -1, COLUMN_TYPE_TBNAME, varchar). Every other node is skipped with DEAL_RES_CONTINUE.
// The first time a column id is seen it is registered in pCtx->colHash, given the next slot id
// (pCtx->index) and described in pCtx->cInfoList; later occurrences reuse the recorded slot id.
//
// Returns DEAL_RES_ERROR on failure, with the error code stored in pCtx->code.
static EDealRes tagScanRewriteTagColumn(SNode** pNode, void* pContext) {
  int32_t                code = TSDB_CODE_SUCCESS;
  int32_t                lino = 0;
  STagScanFilterContext* pCtx = (STagScanFilterContext*)pContext;
  SColumnNode*           pSColumnNode = NULL;

  if (QUERY_NODE_COLUMN == nodeType((*pNode))) {
    pSColumnNode = *(SColumnNode**)pNode;
  } else if (QUERY_NODE_FUNCTION == nodeType((*pNode))) {
    SFunctionNode* pFuncNode = *(SFunctionNode**)(pNode);
    if (pFuncNode->funcType == FUNCTION_TYPE_TBNAME) {
      pSColumnNode = NULL;
      pCtx->code = nodesMakeNode(QUERY_NODE_COLUMN, (SNode**)&pSColumnNode);
      if (NULL == pSColumnNode) {
        return DEAL_RES_ERROR;
      }
      pSColumnNode->colId = -1;
      pSColumnNode->colType = COLUMN_TYPE_TBNAME;
      pSColumnNode->node.resType.type = TSDB_DATA_TYPE_VARCHAR;
      pSColumnNode->node.resType.bytes = TSDB_TABLE_FNAME_LEN - 1 + VARSTR_HEADER_SIZE;
      nodesDestroyNode(*pNode);
      *pNode = (SNode*)pSColumnNode;
    } else {
      return DEAL_RES_CONTINUE;
    }
  } else {
    return DEAL_RES_CONTINUE;
  }

  void* data = taosHashGet(pCtx->colHash, &pSColumnNode->colId, sizeof(pSColumnNode->colId));
  if (!data) {
    code = taosHashPut(pCtx->colHash, &pSColumnNode->colId, sizeof(pSColumnNode->colId), pNode, sizeof((*pNode)));
    if (code == TSDB_CODE_DUP_KEY) {
      code = TSDB_CODE_SUCCESS;
    }
    QUERY_CHECK_CODE(code, lino, _end);

    pSColumnNode->slotId = pCtx->index++;
    SColumnInfo cInfo = {.colId = pSColumnNode->colId,
                         .type = pSColumnNode->node.resType.type,
                         .bytes = pSColumnNode->node.resType.bytes};
    void*       tmp = taosArrayPush(pCtx->cInfoList, &cInfo);
    QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
  } else {
    SColumnNode* col = *(SColumnNode**)data;
    pSColumnNode->slotId = col->slotId;
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    // record the reason in the context, as the node-creation failure path does
    pCtx->code = code;
    return DEAL_RES_ERROR;
  }
  return DEAL_RES_CONTINUE;
}
2024-07-19 08:15:37 +00:00
// Evaluate pTagCond against the tag values of every entry in aUidTags and append to aFilterIdxs
// the indexes (int32_t positions in aUidTags) of the entries for which the condition is true.
//
// A temporary tag-value block and a boolean result column are built for the evaluation; both
// are released on every exit path. Returns TSDB_CODE_SUCCESS or the first error encountered.
static int32_t tagScanFilterByTagCond(SArray* aUidTags, SNode* pTagCond, SArray* aFilterIdxs, void* pVnode,
                                      SStorageAPI* pAPI, STagScanInfo* pInfo) {
  int32_t   code = TSDB_CODE_SUCCESS;
  int32_t   lino = 0;
  int32_t   numOfTables = taosArrayGetSize(aUidTags);
  SArray*   pBlockList = NULL;
  SDataType type = {.type = TSDB_DATA_TYPE_BOOL, .bytes = sizeof(bool)};
  // declared before the first error jump so the cleanup at _end always sees an initialized value
  SScalarParam output = {0};

  SSDataBlock* pResBlock = createTagValBlockForFilter(pInfo->filterCtx.cInfoList, numOfTables, aUidTags, pVnode, pAPI);
  QUERY_CHECK_NULL(pResBlock, code, lino, _end, terrno);

  pBlockList = taosArrayInit(1, POINTER_BYTES);
  QUERY_CHECK_NULL(pBlockList, code, lino, _end, terrno);

  void* tmp = taosArrayPush(pBlockList, &pResBlock);
  QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);

  code = tagScanCreateResultData(&type, numOfTables, &output);
  QUERY_CHECK_CODE(code, lino, _end);

  code = scalarCalculate(pTagCond, pBlockList, &output, NULL, NULL);
  QUERY_CHECK_CODE(code, lino, _end);

  bool* result = (bool*)output.columnData->pData;
  for (int32_t i = 0; i < numOfTables; ++i) {
    if (result[i]) {
      tmp = taosArrayPush(aFilterIdxs, &i);
      QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
    }
  }

_end:
  // the result column is released here so that failures after its creation do not leak it
  if (output.columnData != NULL) {
    colDataDestroy(output.columnData);
    taosMemoryFreeClear(output.columnData);
  }
  blockDataDestroy(pResBlock);
  taosArrayDestroy(pBlockList);

  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-07-19 08:15:37 +00:00
// Write one cell (row rowIndex of pColInfo) for the table described by pUidTagInfo.
//
// Function expressions: tbname writes the literal "ctbidx", tbuid writes the table uid, vgid
// writes the task's vgroup id; any other function type leaves the cell untouched.
// Other expressions are treated as a tag column: the tag is extracted from pUidTagInfo->pTagVal
// and stored, or the cell is set to NULL when there is no tag data, the tag is absent, or a JSON
// tag has no entries.
//
// Returns TSDB_CODE_SUCCESS or the error of the failing step.
static int32_t tagScanFillOneCellWithTag(SOperatorInfo* pOperator, const STUidTagInfo* pUidTagInfo,
                                         SExprInfo* pExprInfo, SColumnInfoData* pColInfo, int rowIndex,
                                         const SStorageAPI* pAPI, void* pVnode) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;

  if (QUERY_NODE_FUNCTION != pExprInfo->pExpr->nodeType) {
    // tag column
    STagVal tagVal = {0};
    tagVal.cid = pExprInfo->base.pParam[0].pCol->colId;

    if (NULL == pUidTagInfo->pTagVal) {
      colDataSetNULL(pColInfo, rowIndex);
      goto _end;
    }

    const char* pTag = pAPI->metaFn.extractTagVal(pUidTagInfo->pTagVal, pColInfo->info.type, &tagVal);
    const bool  isJson = (TSDB_DATA_TYPE_JSON == pColInfo->info.type);
    if (NULL == pTag || (isJson && 0 == ((STag*)pTag)->nTag)) {
      colDataSetNULL(pColInfo, rowIndex);
      goto _end;
    }

    if (isJson) {
      code = colDataSetVal(pColInfo, rowIndex, pTag, false);
      QUERY_CHECK_CODE(code, lino, _end);
    } else if (IS_VAR_DATA_TYPE(pColInfo->info.type)) {
      // build a temporary var-string (length header + payload) from the extracted tag bytes
      char* pVar = taosMemoryMalloc(tagVal.nData + VARSTR_HEADER_SIZE + 1);
      QUERY_CHECK_NULL(pVar, code, lino, _end, terrno);

      varDataSetLen(pVar, tagVal.nData);
      memcpy(pVar + VARSTR_HEADER_SIZE, tagVal.pData, tagVal.nData);
      code = colDataSetVal(pColInfo, rowIndex, pVar, false);
      taosMemoryFree(pVar);
      QUERY_CHECK_CODE(code, lino, _end);
    } else {
      code = colDataSetVal(pColInfo, rowIndex, (const char*)&tagVal.i64, false);
      QUERY_CHECK_CODE(code, lino, _end);
    }
    goto _end;
  }

  // pseudo column produced by a function
  switch (pExprInfo->pExpr->_function.functionType) {
    case FUNCTION_TYPE_TBNAME: {  // tbname
      char str[TSDB_TABLE_FNAME_LEN + VARSTR_HEADER_SIZE] = {0};
      STR_TO_VARSTR(str, "ctbidx");
      code = colDataSetVal(pColInfo, rowIndex, str, false);
      QUERY_CHECK_CODE(code, lino, _end);
      break;
    }
    case FUNCTION_TYPE_TBUID:
      code = colDataSetVal(pColInfo, rowIndex, (char*)&pUidTagInfo->uid, false);
      QUERY_CHECK_CODE(code, lino, _end);
      break;
    case FUNCTION_TYPE_VGID:
      code = colDataSetVal(pColInfo, rowIndex, (char*)&pOperator->pTaskInfo->id.vgId, false);
      QUERY_CHECK_CODE(code, lino, _end);
      break;
    default:
      break;
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-07-19 08:15:37 +00:00
// Fill pRes with one row per selected table.
//
// When ignoreFilterIdx is true every entry of aUidTags produces a row; otherwise only the
// entries whose positions are listed in aFilterIdxs do. Output row i always corresponds to
// the i-th selected entry. Each output expression is written by tagScanFillOneCellWithTag.
//
// Returns TSDB_CODE_SUCCESS or the first error encountered.
static int32_t tagScanFillResultBlock(SOperatorInfo* pOperator, SSDataBlock* pRes, SArray* aUidTags,
                                      SArray* aFilterIdxs, bool ignoreFilterIdx, SStorageAPI* pAPI) {
  int32_t       code = TSDB_CODE_SUCCESS;
  int32_t       lino = 0;
  STagScanInfo* pInfo = pOperator->info;
  SExprInfo*    pExprInfo = &pOperator->exprSupp.pExprInfo[0];

  size_t numRows = ignoreFilterIdx ? taosArrayGetSize(aUidTags) : taosArrayGetSize(aFilterIdxs);
  for (int i = 0; i < numRows; ++i) {
    // position of the source entry in aUidTags
    int32_t tagIdx = i;
    if (!ignoreFilterIdx) {
      int32_t* pIdx = taosArrayGet(aFilterIdxs, i);
      QUERY_CHECK_NULL(pIdx, code, lino, _end, terrno);
      tagIdx = *pIdx;
    }

    STUidTagInfo* pUidTagInfo = taosArrayGet(aUidTags, tagIdx);
    QUERY_CHECK_NULL(pUidTagInfo, code, lino, _end, terrno);

    for (int32_t j = 0; j < pOperator->exprSupp.numOfExprs; ++j) {
      SColumnInfoData* pDst = taosArrayGet(pRes->pDataBlock, pExprInfo[j].base.resSchema.slotId);
      QUERY_CHECK_NULL(pDst, code, lino, _end, terrno);

      code = tagScanFillOneCellWithTag(pOperator, pUidTagInfo, &pExprInfo[j], pDst, i, pAPI, pInfo->readHandle.vnode);
      QUERY_CHECK_CODE(code, lino, _end);
    }
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-07-24 08:17:28 +00:00
// Produce the next block of the tag scan by walking the child-table cursor of pInfo->suid.
//
// Each round reads up to resultInfo.capacity (uid, tag value) pairs from the cursor, applies
// pInfo->pTagCond when present, and fills pInfo->pRes with the surviving tables. Rounds repeat
// until at least one table survives or the cursor is exhausted. The cursor is paused when rows
// were produced, and closed (marking the operator completed) when nothing was produced or the
// cursor reached its end. Limit/offset is applied to the block before it is returned.
//
// *ppRes receives pInfo->pRes when it holds rows, NULL otherwise. When a checked call fails,
// the code is stored in pTaskInfo->code and T_LONG_JMP(pTaskInfo->env, code) is invoked.
static int32_t doTagScanFromCtbIdxNext(SOperatorInfo* pOperator, SSDataBlock** ppRes) {
  int32_t        code = TSDB_CODE_SUCCESS;
  int32_t        lino = 0;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*   pAPI = &pTaskInfo->storageAPI;
  STagScanInfo*  pInfo = pOperator->info;
  SSDataBlock*   pRes = pInfo->pRes;

  QRY_PARAM_CHECK(ppRes);

  if (pOperator->status == OP_EXEC_DONE) {
    return TSDB_CODE_SUCCESS;
  }
  blockDataCleanup(pRes);

  if (pInfo->pCtbCursor == NULL) {
    pInfo->pCtbCursor = pAPI->metaFn.openCtbCursor(pInfo->readHandle.vnode, pInfo->suid, 1);
    QUERY_CHECK_NULL(pInfo->pCtbCursor, code, lino, _end, terrno);
  } else {
    code = pAPI->metaFn.resumeCtbCursor(pInfo->pCtbCursor, 0);
    QUERY_CHECK_CODE(code, lino, _end);
  }

  SArray* aUidTags = pInfo->aUidTags;
  SArray* aFilterIdxs = pInfo->aFilterIdxs;
  int32_t count = 0;
  bool    ctbCursorFinished = false;
  while (1) {
    taosArrayClearEx(aUidTags, tagScanFreeUidTag);
    taosArrayClear(aFilterIdxs);

    int32_t numTables = 0;
    while (numTables < pOperator->resultInfo.capacity) {
      SMCtbCursor* pCur = pInfo->pCtbCursor;
      tb_uid_t     uid = pAPI->metaFn.ctbCursorNext(pInfo->pCtbCursor);
      if (uid == 0) {
        ctbCursorFinished = true;
        break;
      }

      // keep a private copy of the tag value held by the cursor
      STUidTagInfo info = {.uid = uid};
      info.pTagVal = taosMemoryMalloc(pCur->vLen);
      QUERY_CHECK_NULL(info.pTagVal, code, lino, _end, terrno);
      memcpy(info.pTagVal, pCur->pVal, pCur->vLen);

      void* tmp = taosArrayPush(aUidTags, &info);
      if (tmp == NULL) {
        // the array did not take the copy, so it has to be released here
        taosMemoryFree(info.pTagVal);
        QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
      }
      ++numTables;
    }

    if (numTables == 0) {
      break;
    }

    bool ignoreFilterIdx = true;
    if (pInfo->pTagCond != NULL) {
      ignoreFilterIdx = false;
      code = tagScanFilterByTagCond(aUidTags, pInfo->pTagCond, aFilterIdxs, pInfo->readHandle.vnode, pAPI, pInfo);
      QUERY_CHECK_CODE(code, lino, _end);
    } else {
      ignoreFilterIdx = true;
    }

    code = tagScanFillResultBlock(pOperator, pRes, aUidTags, aFilterIdxs, ignoreFilterIdx, pAPI);
    QUERY_CHECK_CODE(code, lino, _end);

    count = ignoreFilterIdx ? taosArrayGetSize(aUidTags) : taosArrayGetSize(aFilterIdxs);
    if (count != 0) {
      break;
    }
  }

  if (count > 0) {
    pAPI->metaFn.pauseCtbCursor(pInfo->pCtbCursor);
  }
  if (count == 0 || ctbCursorFinished) {
    pAPI->metaFn.closeCtbCursor(pInfo->pCtbCursor);
    pInfo->pCtbCursor = NULL;
    setOperatorCompleted(pOperator);
  }

  pRes->info.rows = count;
  bool bLimitReached = applyLimitOffset(&pInfo->limitInfo, pRes, pTaskInfo);
  if (bLimitReached) {
    setOperatorCompleted(pOperator);
  }

  pOperator->resultInfo.totalRows += pRes->info.rows;
  (*ppRes) = (pRes->info.rows == 0) ? NULL : pInfo->pRes;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  }
  return code;
}
// Produces the next tag-scan result block by visiting the tables of pInfo->pTableListInfo
// one at a time, starting at pInfo->curPos, until the result block reaches
// resultInfo.capacity rows or the list is exhausted.
//
// pOperator: tag scan operator; pOperator->info must be a STagScanInfo.
// ppRes:     receives pInfo->pRes when it holds rows, NULL otherwise.
//
// Per-table failures are ignored except for the three memory-related codes checked in
// the loop. On such a failure the code is stored in pTaskInfo->code and control leaves
// through T_LONG_JMP (presumably non-returning).
static int32_t doTagScanFromMetaEntryNext(SOperatorInfo* pOperator, SSDataBlock** ppRes) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;

  if (pOperator->status == OP_EXEC_DONE) {
    (*ppRes) = NULL;
    return code;
  }

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*   pAPI = &pTaskInfo->storageAPI;
  STagScanInfo*  pInfo = pOperator->info;
  SSDataBlock*   pRes = pInfo->pRes;
  blockDataCleanup(pRes);

  int32_t size = 0;
  code = tableListGetSize(pInfo->pTableListInfo, &size);
  QUERY_CHECK_CODE(code, lino, _end);

  if (size == 0) {
    setTaskStatus(pTaskInfo, TASK_COMPLETED);
    (*ppRes) = NULL;
    return code;
  }

  SMetaReader mr = {0};
  pAPI->metaReaderFn.initReader(&mr, pInfo->readHandle.vnode, META_READER_LOCK, &pAPI->metaFn);
  pRes->info.rows = 0;

  while (pInfo->curPos < size && pRes->info.rows < pOperator->resultInfo.capacity) {
    code = doTagScanOneTable(pOperator, pRes, &mr, &pTaskInfo->storageAPI);
    if (code != TSDB_CODE_OUT_OF_MEMORY && code != TSDB_CODE_QRY_REACH_QMEM_THRESHOLD &&
        code != TSDB_CODE_QRY_QUERY_MEM_EXHAUSTED) {
      // ignore other error
      code = TSDB_CODE_SUCCESS;
    }
    if (code != TSDB_CODE_SUCCESS) {
      // The error path below long-jumps out of this frame, so the reader has to be
      // cleared here; otherwise whatever initReader acquired is never given back.
      pAPI->metaReaderFn.clearReader(&mr);
      lino = __LINE__;
      goto _end;
    }

    if (++pInfo->curPos >= size) {
      setOperatorCompleted(pOperator);
    }
  }

  pAPI->metaReaderFn.clearReader(&mr);

  bool bLimitReached = applyLimitOffset(&pInfo->limitInfo, pRes, pTaskInfo);
  if (bLimitReached) {
    setOperatorCompleted(pOperator);
  }

  if (pOperator->status == OP_EXEC_DONE) {
    setTaskStatus(pTaskInfo, TASK_COMPLETED);
  }

  pOperator->resultInfo.totalRows += pRes->info.rows;
  (*ppRes) = (pRes->info.rows == 0) ? NULL : pInfo->pRes;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  }
  return code;
}
// Block-returning wrapper around doTagScanFromMetaEntryNext: hands back the result
// block (NULL when there is none) and discards the status code.
static SSDataBlock* doTagScanFromMetaEntry(SOperatorInfo* pOperator) {
  SSDataBlock* pBlock = NULL;
  (void)doTagScanFromMetaEntryNext(pOperator, &pBlock);
  return pBlock;
}
static void destroyTagScanOperatorInfo(void* param) {
2022-04-25 01:44:39 +00:00
STagScanInfo* pInfo = (STagScanInfo*)param;
2024-08-07 07:33:09 +00:00
if (pInfo->pCtbCursor != NULL && pInfo->pStorageAPI != NULL) {
2023-09-01 05:24:47 +00:00
pInfo->pStorageAPI->metaFn.closeCtbCursor(pInfo->pCtbCursor);
}
taosHashCleanup(pInfo->filterCtx.colHash);
taosArrayDestroy(pInfo->filterCtx.cInfoList);
taosArrayDestroy(pInfo->aFilterIdxs);
taosArrayDestroyEx(pInfo->aUidTags, tagScanFreeUidTag);
2024-07-18 16:09:28 +00:00
blockDataDestroy(pInfo->pRes);
2022-10-24 08:44:44 +00:00
taosArrayDestroy(pInfo->matchInfo.pList);
2024-07-24 09:08:08 +00:00
tableListDestroy(pInfo->pTableListInfo);
pInfo->pRes = NULL;
pInfo->pTableListInfo = NULL;
2022-07-08 06:26:53 +00:00
taosMemoryFreeClear(param);
2022-04-25 01:44:39 +00:00
}
2024-07-24 09:08:08 +00:00
int32_t createTagScanOperatorInfo(SReadHandle* pReadHandle, STagScanPhysiNode* pTagScanNode,
2024-07-29 02:35:06 +00:00
STableListInfo* pTableListInfo, SNode* pTagCond, SNode* pTagIndexCond,
SExecTaskInfo* pTaskInfo, SOperatorInfo** pOptrInfo) {
QRY_PARAM_CHECK(pOptrInfo);
2024-07-24 09:08:08 +00:00
2024-07-19 08:15:37 +00:00
int32_t code = TSDB_CODE_SUCCESS;
int32_t lino = 0;
2023-09-01 05:24:47 +00:00
SScanPhysiNode* pPhyNode = (SScanPhysiNode*)pTagScanNode;
2024-07-19 08:15:37 +00:00
STagScanInfo* pInfo = taosMemoryCalloc(1, sizeof(STagScanInfo));
SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
2022-04-25 01:44:39 +00:00
if (pInfo == NULL || pOperator == NULL) {
code = terrno;
2022-04-25 01:44:39 +00:00
goto _error;
}
2022-06-05 06:48:15 +00:00
SDataBlockDescNode* pDescNode = pPhyNode->node.pOutputDataBlockDesc;
int32_t numOfExprs = 0;
2024-08-05 03:57:18 +00:00
SExprInfo* pExprInfo = NULL;
code = createExprInfo(pPhyNode->pScanPseudoCols, NULL, &pExprInfo, &numOfExprs);
QUERY_CHECK_CODE(code, lino, _error);
2024-07-19 08:15:37 +00:00
code = initExprSupp(&pOperator->exprSupp, pExprInfo, numOfExprs, &pTaskInfo->storageAPI.functionStore);
QUERY_CHECK_CODE(code, lino, _error);
2022-06-05 06:48:15 +00:00
2022-11-04 10:46:48 +00:00
int32_t num = 0;
code = extractColMatchInfo(pPhyNode->pScanPseudoCols, pDescNode, &num, COL_MATCH_FROM_COL_ID, &pInfo->matchInfo);
2024-07-19 08:15:37 +00:00
QUERY_CHECK_CODE(code, lino, _error);
2023-09-01 05:24:47 +00:00
pInfo->pTagCond = pTagCond;
pInfo->pTagIndexCond = pTagIndexCond;
pInfo->suid = pPhyNode->suid;
pInfo->pStorageAPI = &pTaskInfo->storageAPI;
pInfo->pTableListInfo = pTableListInfo;
2022-11-27 16:27:49 +00:00
pInfo->pRes = createDataBlockFromDescNode(pDescNode);
2024-07-25 11:11:32 +00:00
QUERY_CHECK_NULL(pInfo->pRes, code, lino, _error, terrno);
2024-07-19 08:15:37 +00:00
pInfo->readHandle = *pReadHandle;
pInfo->curPos = 0;
2022-06-05 06:48:15 +00:00
initLimitInfo(pPhyNode->node.pLimit, pPhyNode->node.pSlimit, &pInfo->limitInfo);
2022-11-11 01:12:57 +00:00
setOperatorInfo(pOperator, "TagScanOperator", QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN, false, OP_NOT_OPENED, pInfo,
pTaskInfo);
initResultSizeInfo(&pOperator->resultInfo, 4096);
2024-07-19 08:15:37 +00:00
code = blockDataEnsureCapacity(pInfo->pRes, pOperator->resultInfo.capacity);
QUERY_CHECK_CODE(code, lino, _error);
2023-09-01 05:24:47 +00:00
if (pTagScanNode->onlyMetaCtbIdx) {
pInfo->aUidTags = taosArrayInit(pOperator->resultInfo.capacity, sizeof(STUidTagInfo));
2024-07-25 11:11:32 +00:00
QUERY_CHECK_NULL(pInfo->aUidTags, code, lino, _error, terrno);
2024-07-19 08:15:37 +00:00
2023-09-01 05:24:47 +00:00
pInfo->aFilterIdxs = taosArrayInit(pOperator->resultInfo.capacity, sizeof(int32_t));
2024-07-25 11:11:32 +00:00
QUERY_CHECK_NULL(pInfo->aFilterIdxs, code, lino, _error, terrno);
2024-07-19 08:15:37 +00:00
pInfo->filterCtx.colHash =
taosHashInit(4, taosGetDefaultHashFunction(TSDB_DATA_TYPE_SMALLINT), false, HASH_NO_LOCK);
2024-07-25 11:11:32 +00:00
QUERY_CHECK_NULL(pInfo->filterCtx.colHash, code, lino, _error, terrno);
2024-07-19 08:15:37 +00:00
2023-09-01 05:24:47 +00:00
pInfo->filterCtx.cInfoList = taosArrayInit(4, sizeof(SColumnInfo));
2024-08-26 07:16:07 +00:00
QUERY_CHECK_NULL(pInfo->filterCtx.cInfoList, code, lino, _error, terrno);
2024-07-19 08:15:37 +00:00
2023-09-01 05:24:47 +00:00
if (pInfo->pTagCond != NULL) {
nodesRewriteExprPostOrder(&pTagCond, tagScanRewriteTagColumn, (void*)&pInfo->filterCtx);
}
}
2024-08-27 09:04:44 +00:00
__optr_fn_t tagScanNextFn = (pTagScanNode->onlyMetaCtbIdx) ? doTagScanFromCtbIdxNext : doTagScanFromMetaEntryNext;
2024-07-19 08:15:37 +00:00
pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, tagScanNextFn, NULL, destroyTagScanOperatorInfo,
optrDefaultBufFn, NULL, optrDefaultGetNextExtFn, NULL);
2024-07-24 09:08:08 +00:00
*pOptrInfo = pOperator;
return code;
2022-05-03 15:23:49 +00:00
_error:
2024-08-06 02:19:22 +00:00
if (pInfo) {
pInfo->pTableListInfo = NULL;
}
2024-08-06 11:36:39 +00:00
if (pInfo != NULL) destroyTagScanOperatorInfo(pInfo);
2024-08-07 07:53:23 +00:00
if (pOperator != NULL) {
pOperator->info = NULL;
destroyOperator(pOperator);
}
2024-07-24 09:08:08 +00:00
return code;
2022-04-25 01:44:39 +00:00
}
2022-06-14 10:17:18 +00:00
// table merge scan operator
static int32_t subTblRowCompareTsFn(const void* pLeft, const void* pRight, void* param) {
2024-07-19 08:15:37 +00:00
int32_t left = *(int32_t*)pLeft;
int32_t right = *(int32_t*)pRight;
STmsSubTablesMergeInfo* pInfo = (STmsSubTablesMergeInfo*)param;
int32_t leftIdx = pInfo->aInputs[left].rowIdx;
int32_t rightIdx = pInfo->aInputs[right].rowIdx;
if (leftIdx == -1) {
return 1;
} else if (rightIdx == -1) {
return -1;
}
int64_t leftTs = pInfo->aInputs[left].aTs[leftIdx];
int64_t rightTs = pInfo->aInputs[right].aTs[rightIdx];
2024-07-19 08:15:37 +00:00
int32_t ret = leftTs > rightTs ? 1 : ((leftTs < rightTs) ? -1 : 0);
if (pInfo->pTsOrderInfo->order == TSDB_ORDER_DESC) {
ret = -1 * ret;
}
return ret;
}
static int32_t subTblRowCompareTsPkFn(const void* pLeft, const void* pRight, void* param) {
2024-07-19 08:15:37 +00:00
int32_t left = *(int32_t*)pLeft;
int32_t right = *(int32_t*)pRight;
STmsSubTablesMergeInfo* pInfo = (STmsSubTablesMergeInfo*)param;
int32_t leftIdx = pInfo->aInputs[left].rowIdx;
int32_t rightIdx = pInfo->aInputs[right].rowIdx;
if (leftIdx == -1) {
return 1;
} else if (rightIdx == -1) {
return -1;
}
int64_t leftTs = pInfo->aInputs[left].aTs[leftIdx];
int64_t rightTs = pInfo->aInputs[right].aTs[rightIdx];
2024-07-19 08:15:37 +00:00
int32_t ret = leftTs > rightTs ? 1 : ((leftTs < rightTs) ? -1 : 0);
if (pInfo->pTsOrderInfo->order == TSDB_ORDER_DESC) {
ret = -1 * ret;
}
2024-07-19 08:15:37 +00:00
if (ret == 0 && pInfo->pPkOrderInfo) {
ret = tsortComparBlockCell(pInfo->aInputs[left].pInputBlock, pInfo->aInputs[right].pInputBlock, leftIdx, rightIdx,
pInfo->pPkOrderInfo);
}
return ret;
}
2024-01-26 06:10:02 +00:00
// Copies *src into *dst, giving dst its own freshly allocated colList array.
// All other members are copied bytewise, so any further pointers stay shared with src.
//
// Returns TSDB_CODE_SUCCESS, or terrno when the column list cannot be allocated
// (dst->colList is NULL in that case).
int32_t dumpQueryTableCond(const SQueryTableDataCond* src, SQueryTableDataCond* dst) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;

  memcpy(dst, src, sizeof(SQueryTableDataCond));

  dst->colList = taosMemoryCalloc(src->numOfCols, sizeof(SColumnInfo));
  QUERY_CHECK_NULL(dst->colList, code, lino, _end, terrno);

  int col = 0;
  while (col < src->numOfCols) {
    dst->colList[col] = src->colList[col];
    ++col;
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-07-19 08:15:37 +00:00
// Loads the next usable data block of one sub table into pInput->pReaderBlock.
//
// pOperator:         table merge scan operator; pOperator->info must be a STableMergeScanInfo.
// pInput:            the sub-table input to advance. When pInput->bInMemReader is false a
//                    reader is opened here and closed again before a successful return.
// pSubTableHasBlock: set to true when a block was loaded, false when the sub table has
//                    no further block. Left untouched on error returns.
//
// Returns TSDB_CODE_SUCCESS, a reader/load error code, or pTaskInfo->code when the task
// has been killed while fetching.
static int32_t fetchNextSubTableBlockFromReader(SOperatorInfo* pOperator, STmsSubTableInput* pInput,
                                                bool* pSubTableHasBlock) {
  int32_t              code = 0;
  STableMergeScanInfo* pInfo = pOperator->info;
  SReadHandle*         pHandle = &pInfo->base.readHandle;
  SExecTaskInfo*       pTaskInfo = pOperator->pTaskInfo;
  const SStorageAPI*   pAPI = &pTaskInfo->storageAPI;

  blockDataCleanup(pInput->pReaderBlock);

  if (!pInput->bInMemReader) {
    code = pAPI->tsdReader.tsdReaderOpen(pHandle->vnode, &pInput->tblCond, pInput->pKeyInfo, 1, pInput->pReaderBlock,
                                         (void**)&pInput->pReader, GET_TASKID(pTaskInfo), NULL);
    if (code != 0) {
      return code;
    }
  }

  // loadDataBlock reads through pInfo->base, so point it at this input's reader for the call.
  pInfo->base.dataReader = pInput->pReader;

  while (true) {
    bool hasNext = false;
    code = pAPI->tsdReader.tsdNextDataBlock(pInfo->base.dataReader, &hasNext);
    if (code != 0) {
      pAPI->tsdReader.tsdReaderReleaseDataBlock(pInfo->base.dataReader);
      pInfo->base.dataReader = NULL;
      return code;
    }

    if (isTaskKilled(pTaskInfo)) {
      pAPI->tsdReader.tsdReaderReleaseDataBlock(pInfo->base.dataReader);
      pInfo->base.dataReader = NULL;
      // `code` is 0 at this point; returning it would make callers treat the cleaned
      // block as valid data. Report the task's own code instead, the same way
      // getSubTablesSortedBlock does.
      return pTaskInfo->code;
    }

    if (!hasNext) {
      *pSubTableHasBlock = false;
      break;
    }

    // Narrow the time window past the block just seen so a reader reopened later
    // continues after it.
    if (pInput->tblCond.order == TSDB_ORDER_ASC) {
      pInput->tblCond.twindows.skey = pInput->pReaderBlock->info.window.ekey + 1;
    } else {
      pInput->tblCond.twindows.ekey = pInput->pReaderBlock->info.window.skey - 1;
    }

    uint32_t status = 0;
    code = loadDataBlock(pOperator, &pInfo->base, pInput->pReaderBlock, &status);
    if (code != 0) {
      pInfo->base.dataReader = NULL;
      return code;
    }

    if (status == FUNC_DATA_REQUIRED_ALL_FILTEROUT) {
      *pSubTableHasBlock = false;
      break;
    }
    if (status == FUNC_DATA_REQUIRED_FILTEROUT || pInput->pReaderBlock->info.rows == 0) {
      continue;
    }

    *pSubTableHasBlock = true;
    break;
  }

  if (*pSubTableHasBlock) {
    pInput->pReaderBlock->info.id.groupId =
        tableListGetTableGroupId(pInfo->base.pTableListInfo, pInput->pReaderBlock->info.id.uid);
    pOperator->resultInfo.totalRows += pInput->pReaderBlock->info.rows;
  }

  // A per-call reader is always closed; a long-lived one only once its table is drained.
  if (!pInput->bInMemReader || !*pSubTableHasBlock) {
    pAPI->tsdReader.tsdReaderClose(pInput->pReader);
    pInput->pReader = NULL;
  }

  pInfo->base.dataReader = NULL;
  return TSDB_CODE_SUCCESS;
}
2024-08-06 01:24:31 +00:00
// Finds the last table of the group that starts at pInfo->tableStartIndex: walks the
// table list until a table with a groupId other than pInfo->groupId is met and stores
// the index before it in pInfo->tableEndIndex. Also resets pInfo->bGroupProcessed.
//
// Returns TSDB_CODE_SUCCESS, the tableListGetSize error, or terrno when a list entry
// cannot be fetched.
static int32_t setGroupStartEndIndex(STableMergeScanInfo* pInfo) {
  pInfo->bGroupProcessed = false;

  int32_t numOfTables = 0;
  int32_t code = tableListGetSize(pInfo->base.pTableListInfo, &numOfTables);
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(code));
    return code;
  }

  int32_t next = pInfo->tableStartIndex + 1;
  while (next < numOfTables) {
    STableKeyInfo* pKey = tableListGetInfo(pInfo->base.pTableListInfo, next);
    if (!pKey) {
      qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(terrno));
      return terrno;
    }
    if (pKey->groupId != pInfo->groupId) {
      break;
    }
    ++next;
  }

  pInfo->tableEndIndex = next - 1;
  return TSDB_CODE_SUCCESS;
}
// Prepares every sub-table input that still has data (rowIdx != -1) for merging:
// selects its input block, caches the timestamp column of that block in aTs, and then
// builds the merge tree over all inputs.
//
// Returns the tMergeTreeCreate result, or terrno when the timestamp column is missing.
static int32_t openSubTablesMergeSort(STmsSubTablesMergeInfo* pSubTblsInfo) {
  for (int32_t idx = 0; idx < pSubTblsInfo->numSubTables; ++idx) {
    STmsSubTableInput* pIn = &pSubTblsInfo->aInputs[idx];
    if (pIn->rowIdx == -1) {
      continue;
    }

    if (pIn->type == SUB_TABLE_MEM_BLOCK) {
      pIn->rowIdx = 0;
      pIn->pageIdx = -1;
      pIn->pInputBlock = pIn->pReaderBlock;
    } else {
      pIn->pInputBlock = pIn->pPageBlock;
    }

    SColumnInfoData* pTsCol = taosArrayGet(pIn->pInputBlock->pDataBlock, pSubTblsInfo->pTsOrderInfo->slotId);
    if (!pTsCol) {
      qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(terrno));
      return terrno;
    }
    pIn->aTs = (int64_t*)pTsCol->pData;
  }

  // The timestamp+key comparator is only needed when a second sort key exists.
  __merge_compare_fn_t mergeCompareFn = subTblRowCompareTsPkFn;
  if (!pSubTblsInfo->pPkOrderInfo) {
    mergeCompareFn = subTblRowCompareTsFn;
  }

  return tMergeTreeCreate(&pSubTblsInfo->pTree, pSubTblsInfo->numSubTables, pSubTblsInfo, mergeCompareFn);
}
2024-01-24 01:12:27 +00:00
// Allocates and initializes the sub-tables merge state for the table group starting at
// pInfo->tableStartIndex, and stores it in pInfo->pSubTablesMergeInfo on success.
//
// The first entry of pInfo->pSortInfo becomes the timestamp order; when the array holds
// exactly two entries the second becomes the key order used for tie-breaking.
//
// Returns TSDB_CODE_SUCCESS or an error code. On failure everything allocated here is
// released and pInfo->pSubTablesMergeInfo is left untouched.
static int32_t initSubTablesMergeInfo(STableMergeScanInfo* pInfo) {
  int32_t code = setGroupStartEndIndex(pInfo);
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(code));
    return code;
  }

  STmsSubTablesMergeInfo* pSubTblsInfo = taosMemoryCalloc(1, sizeof(STmsSubTablesMergeInfo));
  if (pSubTblsInfo == NULL) {
    return terrno;
  }

  pSubTblsInfo->pTsOrderInfo = taosArrayGet(pInfo->pSortInfo, 0);
  if (!pSubTblsInfo->pTsOrderInfo) {
    code = terrno;
    qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(code));
    goto _error;
  }

  if (taosArrayGetSize(pInfo->pSortInfo) == 2) {
    pSubTblsInfo->pPkOrderInfo = taosArrayGet(pInfo->pSortInfo, 1);
    if (!pSubTblsInfo->pPkOrderInfo) {
      code = terrno;
      qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(code));
      goto _error;
    }
  } else {
    pSubTblsInfo->pPkOrderInfo = NULL;
  }

  pSubTblsInfo->numSubTables = pInfo->tableEndIndex - pInfo->tableStartIndex + 1;
  pSubTblsInfo->aInputs = taosMemoryCalloc(pSubTblsInfo->numSubTables, sizeof(STmsSubTableInput));
  if (pSubTblsInfo->aInputs == NULL) {
    // Capture terrno before any cleanup call has a chance to touch it.
    code = terrno;
    goto _error;
  }

  int32_t bufPageSize = pInfo->bufPageSize;
  // numTableBlocksInMem is still 0 here (fresh calloc), so this is numSubTables pages.
  int32_t inMemSize = (pSubTblsInfo->numSubTables - pSubTblsInfo->numTableBlocksInMem) * bufPageSize;
  code = createDiskbasedBuf(&pSubTblsInfo->pBlocksBuf, pInfo->bufPageSize, inMemSize, "blocksExternalBuf", tsTempDir);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  pSubTblsInfo->numTableBlocksInMem = pSubTblsInfo->numSubTables;
  pSubTblsInfo->numInMemReaders = pSubTblsInfo->numSubTables;

  pInfo->pSubTablesMergeInfo = pSubTblsInfo;
  return TSDB_CODE_SUCCESS;

_error:
  // Nothing has been published to pInfo yet, so the partial state is released here.
  if (pSubTblsInfo->aInputs != NULL) {
    taosMemoryFree(pSubTblsInfo->aInputs);
  }
  taosMemoryFree(pSubTblsInfo);
  return code;
}
2024-01-24 01:12:27 +00:00
// Initializes one STmsSubTableInput per table of the current group and loads the first
// block of each table.
//
// For every input: clones the query condition, creates the reader and page blocks from
// pInfo->pResBlock, binds the table key info, opens a long-lived reader for all but the
// last in-memory reader slot, and fetches the first block. Inputs without any block get
// rowIdx = -1 and are counted in numSubTablesCompleted.
//
// Returns TSDB_CODE_SUCCESS or the failing step's code. If the task is found killed
// between tables, control leaves through T_LONG_JMP with pTaskInfo->code.
static int32_t initSubTableInputs(SOperatorInfo* pOperator, STableMergeScanInfo* pInfo) {
  int32_t        code = TSDB_CODE_SUCCESS;
  int32_t        lino = 0;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  SReadHandle*   pHandle = &pInfo->base.readHandle;
  SStorageAPI*   pAPI = &pTaskInfo->storageAPI;

  STmsSubTablesMergeInfo* pSubTblsInfo = pInfo->pSubTablesMergeInfo;

  for (int32_t i = 0; i < pSubTblsInfo->numSubTables; ++i) {
    STmsSubTableInput* pInput = pSubTblsInfo->aInputs + i;
    pInput->type = SUB_TABLE_MEM_BLOCK;

    code = dumpQueryTableCond(&pInfo->base.cond, &pInput->tblCond);
    QUERY_CHECK_CODE(code, lino, _end);

    code = createOneDataBlock(pInfo->pResBlock, false, &pInput->pReaderBlock);
    QUERY_CHECK_CODE(code, lino, _end);

    code = createOneDataBlock(pInfo->pResBlock, false, &pInput->pPageBlock);
    QUERY_CHECK_CODE(code, lino, _end);

    // The lookup can fail (other call sites check it as well); never hand a NULL key
    // to the reader.
    STableKeyInfo* keyInfo = tableListGetInfo(pInfo->base.pTableListInfo, i + pInfo->tableStartIndex);
    QUERY_CHECK_NULL(keyInfo, code, lino, _end, terrno);
    pInput->pKeyInfo = keyInfo;

    if (isTaskKilled(pTaskInfo)) {
      T_LONG_JMP(pTaskInfo->env, pTaskInfo->code);
    }

    if (i + 1 < pSubTblsInfo->numInMemReaders) {
      code = pAPI->tsdReader.tsdReaderOpen(pHandle->vnode, &pInput->tblCond, keyInfo, 1, pInput->pReaderBlock,
                                           (void**)&pInput->pReader, GET_TASKID(pTaskInfo), NULL);
      QUERY_CHECK_CODE(code, lino, _end);
      pInput->bInMemReader = true;
    } else {
      // This input opens and closes a reader on every fetch instead.
      pInput->pReader = NULL;
      pInput->bInMemReader = false;
    }

    bool hasNext = true;
    code = fetchNextSubTableBlockFromReader(pOperator, pInput, &hasNext);
    QUERY_CHECK_CODE(code, lino, _end);

    if (!hasNext) {
      pInput->rowIdx = -1;
      ++pSubTblsInfo->numSubTablesCompleted;
      continue;
    } else {
      pInput->rowIdx = 0;
      pInput->pageIdx = -1;
    }
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-07-19 08:15:37 +00:00
// Refills the input currently chosen by the merge tree with its next block.
// When the sub table has no further block the input is marked finished (rowIdx = -1)
// and counted as completed; otherwise its row index restarts at 0.
//
// On a fetch failure the code is stored in pTaskInfo->code and control leaves through
// T_LONG_JMP.
static void adjustSubTableFromMemBlock(SOperatorInfo* pOperatorInfo, STmsSubTablesMergeInfo* pSubTblsInfo) {
  int32_t            code = TSDB_CODE_SUCCESS;
  int32_t            lino = 0;
  SExecTaskInfo*     pTask = pOperatorInfo->pTaskInfo;
  STmsSubTableInput* pChosen = pSubTblsInfo->aInputs + tMergeTreeGetChosenIndex(pSubTblsInfo->pTree);

  bool gotBlock = true;
  code = fetchNextSubTableBlockFromReader(pOperatorInfo, pChosen, &gotBlock);
  QUERY_CHECK_CODE(code, lino, _end);

  if (gotBlock) {
    pChosen->rowIdx = 0;
  } else {
    pChosen->rowIdx = -1;
    ++pSubTblsInfo->numSubTablesCompleted;
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTask->code = code;
    T_LONG_JMP(pTask->env, code);
  }
}
2024-01-24 02:21:17 +00:00
// Advances the input chosen by the merge tree to its next row and re-adjusts the tree.
//
// Inside a block the row index is simply incremented. On the last row of a
// SUB_TABLE_MEM_BLOCK input the next block is fetched first; if the input still has data
// afterwards its pInputBlock and cached timestamp array are refreshed.
//
// Returns the tMergeTreeAdjust result, or terrno when the timestamp column is missing.
static int32_t adjustSubTableForNextRow(SOperatorInfo* pOperatorInfo, STmsSubTablesMergeInfo* pSubTblsInfo) {
  STmsSubTableInput* pChosen = pSubTblsInfo->aInputs + tMergeTreeGetChosenIndex(pSubTblsInfo->pTree);

  SSDataBlock* pCurBlock = pChosen->pPageBlock;
  if (pChosen->type == SUB_TABLE_MEM_BLOCK) {
    pCurBlock = pChosen->pReaderBlock;
  }

  if (pChosen->rowIdx < pCurBlock->info.rows - 1) {
    // Still inside the current block.
    ++pChosen->rowIdx;
    return tMergeTreeAdjust(pSubTblsInfo->pTree, tMergeTreeGetAdjustIndex(pSubTblsInfo->pTree));
  }

  if (pChosen->rowIdx == pCurBlock->info.rows - 1) {
    if (pChosen->type == SUB_TABLE_MEM_BLOCK) {
      adjustSubTableFromMemBlock(pOperatorInfo, pSubTblsInfo);
    }

    if (pChosen->rowIdx != -1) {
      SColumnInfoData* pTsCol = taosArrayGet(pCurBlock->pDataBlock, pSubTblsInfo->pTsOrderInfo->slotId);
      if (!pTsCol) {
        qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(terrno));
        return terrno;
      }
      pChosen->pInputBlock = pCurBlock;
      pChosen->aTs = (int64_t*)pTsCol->pData;
    }
  }

  return tMergeTreeAdjust(pSubTblsInfo->pTree, tMergeTreeGetAdjustIndex(pSubTblsInfo->pTree));
}
// Appends the current row of the input chosen by the merge tree to pBlock, column by
// column, and bumps pBlock->info.rows. Also copies the input block's scanFlag and marks
// pBlock as loaded.
//
// Returns TSDB_CODE_SUCCESS or the first column lookup / set error.
static int32_t appendChosenRowToDataBlock(STmsSubTablesMergeInfo* pSubTblsInfo, SSDataBlock* pBlock) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;

  STmsSubTableInput* pChosen = pSubTblsInfo->aInputs + tMergeTreeGetChosenIndex(pSubTblsInfo->pTree);
  SSDataBlock*       pSrcBlock = pChosen->pPageBlock;
  if (pChosen->type == SUB_TABLE_MEM_BLOCK) {
    pSrcBlock = pChosen->pReaderBlock;
  }

  for (int32_t col = 0; col < taosArrayGetSize(pBlock->pDataBlock); ++col) {
    SColumnInfoData* pDstCol = taosArrayGet(pBlock->pDataBlock, col);
    QUERY_CHECK_NULL(pDstCol, code, lino, _end, terrno);

    SColumnInfoData* pSrcCol = taosArrayGet(pSrcBlock->pDataBlock, col);
    QUERY_CHECK_NULL(pSrcCol, code, lino, _end, terrno);

    if (colDataIsNull(pSrcCol, pSrcBlock->info.rows, pChosen->rowIdx, NULL)) {
      code = colDataSetVal(pDstCol, pBlock->info.rows, NULL, true);
      QUERY_CHECK_CODE(code, lino, _end);
    } else if (pSrcCol->pData != NULL) {
      // A non-null cell is only copied when the source column actually carries data.
      char* pCell = colDataGetData(pSrcCol, pChosen->rowIdx);
      code = colDataSetVal(pDstCol, pBlock->info.rows, pCell, false);
      QUERY_CHECK_CODE(code, lino, _end);
    }
  }

  pBlock->info.dataLoad = 1;
  pBlock->info.scanFlag = pSrcBlock->info.scanFlag;
  pBlock->info.rows += 1;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-09-11 08:37:06 +00:00
// Fills pBlock with up to `capacity` merged rows from the current group's sub tables,
// then applies limit/offset. The fill is repeated while the batch ends up empty, the
// limit has not been reached and some sub table still has data.
//
// pResBlock: receives pBlock when it holds rows after limit/offset; otherwise it keeps
//            whatever QRY_PARAM_CHECK left in it.
//
// Returns TSDB_CODE_SUCCESS, pTaskInfo->code when the task was killed, or the first
// append/adjust error (also recorded in pTaskInfo->code).
static int32_t getSubTablesSortedBlock(SOperatorInfo* pOperator, SSDataBlock* pBlock, int32_t capacity,
                                       SSDataBlock** pResBlock) {
  int32_t                 code = TSDB_CODE_SUCCESS;
  int32_t                 lino = 0;
  STableMergeScanInfo*    pInfo = pOperator->info;
  SExecTaskInfo*          pTaskInfo = pOperator->pTaskInfo;
  STmsSubTablesMergeInfo* pMerge = pInfo->pSubTablesMergeInfo;
  bool                    finished = false;
  bool                    limitReached = false;

  QRY_PARAM_CHECK(pResBlock);

  blockDataCleanup(pBlock);

  do {
    // Pull rows one at a time in merge order until the batch is full or all inputs are drained.
    for (;;) {
      finished = (pMerge->numSubTablesCompleted >= pMerge->numSubTables);
      if (finished) {
        break;
      }

      code = appendChosenRowToDataBlock(pMerge, pBlock);
      QUERY_CHECK_CODE(code, lino, _end);

      code = adjustSubTableForNextRow(pOperator, pMerge);
      QUERY_CHECK_CODE(code, lino, _end);

      if (pBlock->info.rows >= capacity) {
        break;
      }
    }

    if (isTaskKilled(pTaskInfo)) {
      return pTaskInfo->code;
    }

    limitReached = applyLimitOffset(&pInfo->limitInfo, pBlock, pTaskInfo);
  } while (!finished && !limitReached && !(pBlock->info.rows > 0));

  if (pBlock->info.rows > 0) {
    *pResBlock = pBlock;
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
  }
  return code;
}
// Starts the sub-tables merge for the current group in three steps: build the merge
// state, load the first block of every sub table, then open the merge tree.
// Returns the code of the first step that fails, or TSDB_CODE_SUCCESS.
static int32_t startSubTablesTableMergeScan(SOperatorInfo* pOperator) {
  int32_t              lino = 0;
  STableMergeScanInfo* pScan = pOperator->info;

  int32_t code = initSubTablesMergeInfo(pScan);
  QUERY_CHECK_CODE(code, lino, _end);

  code = initSubTableInputs(pOperator, pScan);
  QUERY_CHECK_CODE(code, lino, _end);

  code = openSubTablesMergeSort(pScan->pSubTablesMergeInfo);
  QUERY_CHECK_CODE(code, lino, _end);

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-07-19 08:15:37 +00:00
// Tears down the sub-tables merge state of the current group, if any: the merge tree,
// every input's column list, blocks, page array and reader, the disk-based buffer, and
// finally the state object itself. pInfo->pSubTablesMergeInfo is NULL afterwards.
static void stopSubTablesTableMergeScan(STableMergeScanInfo* pInfo) {
  STmsSubTablesMergeInfo* pMerge = pInfo->pSubTablesMergeInfo;
  if (pMerge == NULL) {
    return;
  }

  tMergeTreeDestroy(&pMerge->pTree);

  int32_t idx = 0;
  while (idx < pMerge->numSubTables) {
    STmsSubTableInput* pIn = &pMerge->aInputs[idx];

    taosMemoryFree(pIn->tblCond.colList);
    blockDataDestroy(pIn->pReaderBlock);
    blockDataDestroy(pIn->pPageBlock);
    taosArrayDestroy(pIn->aBlockPages);
    pInfo->base.readerAPI.tsdReaderClose(pIn->pReader);
    pIn->pReader = NULL;

    ++idx;
  }

  destroyDiskbasedBuf(pMerge->pBlocksBuf);
  taosMemoryFree(pMerge->aInputs);
  taosMemoryFree(pMerge);
  pInfo->pSubTablesMergeInfo = NULL;
}
2024-07-24 08:17:28 +00:00
// Returns the next merged block of a table merge scan that merges the sub tables of one
// group at a time.
//
// On the first call the first group is set up. Each call then asks the current group for
// a sorted block; when a group is drained its merge state is torn down and the next
// group is started, until the table list is exhausted.
//
// pOperator: table merge scan operator; pOperator->info must be a STableMergeScanInfo.
// ppRes:     receives the block produced, or NULL when there is none.
//
// Returns TSDB_CODE_SUCCESS. On failure the code is stored in pTaskInfo->code and
// control leaves through T_LONG_JMP (presumably non-returning).
int32_t doTableMergeScanParaSubTablesNext(SOperatorInfo* pOperator, SSDataBlock** ppRes) {
  QRY_PARAM_CHECK(ppRes);

  int32_t lino = 0;
  int32_t tableListSize = 0;
  int64_t st = taosGetTimestampUs();
  // Declared before the first `goto _end`: the _end block reads it on the success
  // branch, so no jump may bypass its initialization.
  SSDataBlock* pBlock = NULL;

  SExecTaskInfo*       pTaskInfo = pOperator->pTaskInfo;
  STableMergeScanInfo* pInfo = pOperator->info;

  if (pOperator->status == OP_EXEC_DONE) {
    return TSDB_CODE_SUCCESS;
  }

  int32_t code = pOperator->fpSet._openFn(pOperator);
  QUERY_CHECK_CODE(code, lino, _end);

  code = tableListGetSize(pInfo->base.pTableListInfo, &tableListSize);
  QUERY_CHECK_CODE(code, lino, _end);

  if (!pInfo->hasGroupId) {
    pInfo->hasGroupId = true;

    if (tableListSize == 0) {
      setOperatorCompleted(pOperator);
      (*ppRes) = NULL;
      return code;
    }

    pInfo->tableStartIndex = 0;
    STableKeyInfo* pTmpGpId = (STableKeyInfo*)tableListGetInfo(pInfo->base.pTableListInfo, pInfo->tableStartIndex);
    QUERY_CHECK_NULL(pTmpGpId, code, lino, _end, terrno);
    pInfo->groupId = pTmpGpId->groupId;

    code = startSubTablesTableMergeScan(pOperator);
    QUERY_CHECK_CODE(code, lino, _end);
  }

  while (pInfo->tableStartIndex < tableListSize) {
    if (isTaskKilled(pTaskInfo)) {
      break;
    }

    code = getSubTablesSortedBlock(pOperator, pInfo->pResBlock, pOperator->resultInfo.capacity, &pBlock);
    QUERY_CHECK_CODE(code, lino, _end);

    // A group that produced nothing at all may still need one placeholder row.
    if (pBlock == NULL && !pInfo->bGroupProcessed && pInfo->needCountEmptyTable) {
      STableKeyInfo* tbInfo = tableListGetInfo(pInfo->base.pTableListInfo, pInfo->tableStartIndex);
      QUERY_CHECK_NULL(tbInfo, code, lino, _end, terrno);

      pBlock = getOneRowResultBlock(pTaskInfo, &pInfo->base, pInfo->pResBlock, tbInfo);
    }

    if (pBlock != NULL) {
      pBlock->info.id.groupId = pInfo->groupId;
      pOperator->resultInfo.totalRows += pBlock->info.rows;
      pInfo->bGroupProcessed = true;
      break;
    } else {
      // Data of this group are all dumped, let's try the next group
      stopSubTablesTableMergeScan(pInfo);
      if (pInfo->tableEndIndex >= tableListSize - 1) {
        setOperatorCompleted(pOperator);
        break;
      }

      pInfo->tableStartIndex = pInfo->tableEndIndex + 1;
      STableKeyInfo* pTmpGpId = tableListGetInfo(pInfo->base.pTableListInfo, pInfo->tableStartIndex);
      QUERY_CHECK_NULL(pTmpGpId, code, lino, _end, terrno);
      pInfo->groupId = pTmpGpId->groupId;

      code = startSubTablesTableMergeScan(pOperator);
      QUERY_CHECK_CODE(code, lino, _end);

      resetLimitInfoForNextGroup(&pInfo->limitInfo);
    }
  }

  pOperator->cost.totalCost += (taosGetTimestampUs() - st) / 1000.0;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  } else {
    (*ppRes) = pBlock;
  }
  return code;
}
2024-07-19 08:15:37 +00:00
/*
 * Callback handed to the sort handle (see tsortSetMergeLimitReachedFp): records
 * `uid` in the operator's skip-table hash, creating the hash on first use.
 *
 * uid                - table uid to remember
 * pTableMergeOpInfo  - the SOperatorInfo of the table merge scan operator
 *
 * A duplicate key is not treated as an error. Any other failure is stored in
 * the task and reported through T_LONG_JMP, so this function does not return
 * normally on error.
 */
static void tableMergeScanDoSkipTable(uint64_t uid, void* pTableMergeOpInfo) {
  SOperatorInfo*       pOptr = (SOperatorInfo*)pTableMergeOpInfo;
  STableMergeScanInfo* pScan = pOptr->info;
  SExecTaskInfo*       pTask = pOptr->pTaskInfo;
  int32_t              code = TSDB_CODE_SUCCESS;
  int32_t              lino = 0;
  int                  skipMark = 1;

  // lazily create the hash, sized by the number of tables in the current group
  if (NULL == pScan->mSkipTables) {
    pScan->mSkipTables = taosHashInit(pScan->tableEndIndex - pScan->tableStartIndex + 1,
                                      taosGetDefaultHashFunction(TSDB_DATA_TYPE_UBIGINT), false, HASH_NO_LOCK);
    QUERY_CHECK_NULL(pScan->mSkipTables, code, lino, _end, terrno);
  }

  // the hash is guaranteed to exist here: the check above jumps to _end otherwise
  code = taosHashPut(pScan->mSkipTables, &uid, sizeof(uid), &skipMark, sizeof(skipMark));
  if (TSDB_CODE_DUP_KEY == code) {
    code = TSDB_CODE_SUCCESS;  // table was already marked
  }
  QUERY_CHECK_CODE(code, lino, _end);

_end:
  if (TSDB_CODE_SUCCESS != code) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTask->code = code;
    T_LONG_JMP(pTask->env, code);
  }
}
/*
 * Advance the tsdb reader by one block and load it into pInfo->pReaderBlock.
 *
 * pOperator - the table merge scan operator
 * pFinished - set to true when there is no further block, the task was killed,
 *             or the load status is FUNC_DATA_REQUIRED_ALL_FILTEROUT
 * pSkipped  - set to true when the loaded block was filtered out or is empty
 *
 * Neither flag is ever cleared here; callers initialise both to false.
 * Returns 0 on success, otherwise the error code (also stored in the task).
 */
static int32_t doGetBlockForTableMergeScan(SOperatorInfo* pOperator, bool* pFinished, bool* pSkipped) {
  STableMergeScanInfo* pScan = pOperator->info;
  SExecTaskInfo*       pTask = pOperator->pTaskInfo;
  SStorageAPI*         pStore = &pTask->storageAPI;
  STsdbReader*         pReader = pScan->base.dataReader;
  SSDataBlock*         pDst = pScan->pReaderBlock;
  bool                 more = false;
  uint32_t             loadStatus = 0;

  int32_t code = pStore->tsdReader.tsdNextDataBlock(pReader, &more);
  if (0 != code) {
    pStore->tsdReader.tsdReaderReleaseDataBlock(pReader);
    qError("table merge scan fetch next data block error code: %d, %s", code, GET_TASKID(pTask));
    pTask->code = code;
    return code;
  }

  if (!more || isTaskKilled(pTask)) {
    if (isTaskKilled(pTask)) {
      qInfo("table merge scan fetch next data block found task killed. %s", GET_TASKID(pTask));
      pStore->tsdReader.tsdReaderReleaseDataBlock(pReader);
    }
    *pFinished = true;
    return code;
  }

  code = loadDataBlock(pOperator, &pScan->base, pDst, &loadStatus);
  if (TSDB_CODE_SUCCESS != code) {
    qInfo("table merge scan load datablock code %d, %s", code, GET_TASKID(pTask));
    pTask->code = code;
    return code;
  }

  if (FUNC_DATA_REQUIRED_ALL_FILTEROUT == loadStatus) {
    *pFinished = true;
  } else if (FUNC_DATA_REQUIRED_FILTEROUT == loadStatus || 0 == pDst->info.rows) {
    // this block was dropped by the filter condition; the caller moves on to the next one
    *pSkipped = true;
  }

  return code;
}
2024-08-22 05:49:38 +00:00
/*
 * Raw-data fetch callback for the sort handle: yields the next input block of
 * the table merge scan.
 *
 * param   - STableMergeScanSortSourceParam carrying the operator
 * ppBlock - receives the block to sort, or NULL when the current input is
 *           exhausted (end of data, or a new fileset has started)
 *
 * Two modes, selected by pInfo->rtnNextDurationBlocks:
 *  - replay: hand out the blocks stashed in pInfo->nextDurationBlocks one by
 *    one, then destroy them and fall back to reading;
 *  - read: pull blocks from the reader. While a "next duration block" or
 *    "new fileset" event is pending, non-skipped blocks are copied into
 *    nextDurationBlocks instead of being returned.
 *
 * Returns the status code; when doGetBlockForTableMergeScan fails the code is
 * returned without touching *ppBlock.
 */
static int32_t getBlockForTableMergeScan(void* param, SSDataBlock** ppBlock) {
  STableMergeScanSortSourceParam* pSrc = param;
  SOperatorInfo*                  pOperator = pSrc->pOperator;
  STableMergeScanInfo*            pScan = pOperator->info;
  SExecTaskInfo*                  pTask = pOperator->pTaskInfo;
  SSDataBlock*                    pOut = NULL;
  int64_t                         beginUs = taosGetTimestampUs();
  int32_t                         code = TSDB_CODE_SUCCESS;

  for (;;) {
    if (pScan->rtnNextDurationBlocks) {
      qDebug("%s table merge scan return already fetched new duration blocks. index %d num of blocks %d",
             GET_TASKID(pTask), pScan->nextDurationBlocksIdx, pScan->numNextDurationBlocks);

      if (pScan->nextDurationBlocksIdx >= pScan->numNextDurationBlocks) {
        // every stashed block has been handed out: release them and resume reading
        for (int32_t k = 0; k < pScan->numNextDurationBlocks; ++k) {
          blockDataDestroy(pScan->nextDurationBlocks[k]);
          pScan->nextDurationBlocks[k] = NULL;
        }

        pScan->rtnNextDurationBlocks = false;
        pScan->nextDurationBlocksIdx = 0;
        pScan->numNextDurationBlocks = 0;
        continue;
      }

      pOut = pScan->nextDurationBlocks[pScan->nextDurationBlocksIdx];
      ++pScan->nextDurationBlocksIdx;
    } else {
      bool finished = false;
      bool skipped = false;

      code = doGetBlockForTableMergeScan(pOperator, &finished, &skipped);
      if (0 != code) {
        return code;
      }

      pOut = pScan->pReaderBlock;
      qDebug("%s table merge scan fetch block. finished %d skipped %d next-duration-block %d new-fileset %d",
             GET_TASKID(pTask), finished, skipped, pScan->bNextDurationBlockEvent, pScan->bNewFilesetEvent);

      if (finished) {
        pScan->bNewFilesetEvent = false;
        break;
      }

      if (pScan->bNextDurationBlockEvent || pScan->bNewFilesetEvent) {
        if (!skipped) {
          // NOTE(review): the slot is written before the "> 2" check below; confirm that
          // nextDurationBlocks has room for the index used here.
          code = createOneDataBlock(pOut, true, &pScan->nextDurationBlocks[pScan->numNextDurationBlocks]);
          if (code) {
            *ppBlock = NULL;
            return code;
          }

          ++pScan->numNextDurationBlocks;
          if (pScan->numNextDurationBlocks > 2) {
            qError("%s table merge scan prefetch %d next duration blocks. end early.", GET_TASKID(pTask),
                   pScan->numNextDurationBlocks);
            pScan->bNewFilesetEvent = false;
            break;
          }
        }

        if (pScan->bNewFilesetEvent) {
          // end the current input; the stashed blocks are replayed on the next call
          pScan->rtnNextDurationBlocks = true;
          *ppBlock = NULL;
          return code;
        }

        if (pScan->bNextDurationBlockEvent) {
          pScan->bNextDurationBlockEvent = false;
          continue;
        }
      }

      if (skipped) {
        continue;
      }
    }

    // a block is ready: tag it with its group and account for it
    pOut->info.id.groupId = tableListGetTableGroupId(pScan->base.pTableListInfo, pOut->info.id.uid);
    pOperator->resultInfo.totalRows += pOut->info.rows;
    pScan->base.readRecorder.elapsedTime += (taosGetTimestampUs() - beginUs) / 1000.0;

    *ppBlock = pOut;
    return code;
  }

  *ppBlock = NULL;
  return code;
}
2024-07-19 08:15:37 +00:00
/*
 * Build the sort-order description used by the merge scan: always one entry
 * for the timestamp column and, when a column flagged isPk is present, a second
 * entry for that column.
 *
 * colMatchInfo - array of SColMatchItem describing the scanned columns
 * order        - TSDB_ORDER_ASC / TSDB_ORDER_DESC, applied to both entries
 * ppSortArray  - on success receives a newly allocated SArray of
 *                SBlockOrderInfo owned by the caller; left untouched on failure
 *
 * Returns TSDB_CODE_SUCCESS or an error code. On failure the partially built
 * array is released here instead of being leaked.
 */
int32_t generateSortByTsPkInfo(SArray* colMatchInfo, int32_t order, SArray** ppSortArray) {
  int32_t         code = TSDB_CODE_SUCCESS;
  int32_t         lino = 0;
  SBlockOrderInfo biTs = {0};
  SBlockOrderInfo biPk = {0};
  int32_t         tsTargetSlotId = 0;
  int32_t         pkTargetSlotId = -1;  // -1: no primary-key column seen
  void*           tmp = NULL;

  SArray* pSortInfo = taosArrayInit(1, sizeof(SBlockOrderInfo));
  QUERY_CHECK_NULL(pSortInfo, code, lino, _end, terrno);

  for (int32_t i = 0; i < taosArrayGetSize(colMatchInfo); ++i) {
    SColMatchItem* colInfo = taosArrayGet(colMatchInfo, i);
    QUERY_CHECK_NULL(colInfo, code, lino, _end, terrno);

    if (colInfo->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
      tsTargetSlotId = colInfo->dstSlotId;
      biTs.order = order;
      biTs.slotId = tsTargetSlotId;
      biTs.nullFirst = (order == TSDB_ORDER_ASC);
      biTs.compFn = getKeyComparFunc(TSDB_DATA_TYPE_TIMESTAMP, order);
    }

    // TODO: order by just ts
    if (colInfo->isPk) {
      pkTargetSlotId = colInfo->dstSlotId;
      biPk.order = order;
      biPk.slotId = pkTargetSlotId;
      biPk.nullFirst = (order == TSDB_ORDER_ASC);
      biPk.compFn = getKeyComparFunc(colInfo->dataType.type, order);
    }
  }

  tmp = taosArrayPush(pSortInfo, &biTs);
  QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);

  if (pkTargetSlotId != -1) {
    tmp = taosArrayPush(pSortInfo, &biPk);
    QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
  }

  // success: hand the array over to the caller
  (*ppSortArray) = pSortInfo;
  pSortInfo = NULL;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  // non-NULL only when a failure path was taken before the hand-over above
  if (pSortInfo != NULL) {
    taosArrayDestroy(pSortInfo);
  }
  return code;
}
/*
 * Reader notification callback registered via tsdSetSetNotifyCb. Translates
 * the notification type into the matching event flag on the merge scan info.
 *
 * type  - notification kind reported by the reader
 * info  - notification payload; only duration.filesetId is read, for logging
 * param - the STableMergeScanInfo registered together with the callback
 */
void tableMergeScanTsdbNotifyCb(ETsdReaderNotifyType type, STsdReaderNotifyInfo* info, void* param) {
  STableMergeScanInfo* pScan = param;

  switch (type) {
    case TSD_READER_NOTIFY_DURATION_START:
      pScan->bNewFilesetEvent = true;
      break;
    case TSD_READER_NOTIFY_NEXT_DURATION_BLOCK:
      pScan->bNextDurationBlockEvent = true;
      break;
    default:
      // other notification types only get logged
      break;
  }

  qDebug("table merge scan receive notification. type %d, fileset %d", type, info->duration.filesetId);
}
/*
 * Create and configure a fresh sort handle for the tables
 * [tableStartIndex, tableEndIndex] of the current group, clearing the
 * fileset/duration event flags first.
 *
 * The handle is stored in pInfo->pSortHandle. With exactly one table the
 * handle is switched to single-table merge and not opened here; otherwise it
 * is opened before returning.
 *
 * Returns TSDB_CODE_SUCCESS or the first error encountered. Every failure,
 * including a failed handle creation, is logged through the common _end path.
 */
int32_t startDurationForGroupTableMergeScan(SOperatorInfo* pOperator) {
  STableMergeScanInfo*            pInfo = pOperator->info;
  SExecTaskInfo*                  pTaskInfo = pOperator->pTaskInfo;
  int32_t                         code = TSDB_CODE_SUCCESS;
  int32_t                         lino = 0;
  int32_t                         numOfTable = pInfo->tableEndIndex - pInfo->tableStartIndex + 1;
  int32_t                         numOfBufPage = 0;
  STableMergeScanSortSourceParam* param = NULL;
  SSortSource*                    ps = NULL;

  qDebug("%s table merge scan start duration ", GET_TASKID(pTaskInfo));
  pInfo->bNewFilesetEvent = false;
  pInfo->bNextDurationBlockEvent = false;

  pInfo->sortBufSize = 2048 * pInfo->bufPageSize;
  numOfBufPage = pInfo->sortBufSize / pInfo->bufPageSize;

  pInfo->pSortHandle = NULL;
  code = tsortCreateSortHandle(pInfo->pSortInfo, SORT_BLOCK_TS_MERGE, pInfo->bufPageSize, numOfBufPage,
                               pInfo->pSortInputBlock, pTaskInfo->id.str, 0, 0, 0, &pInfo->pSortHandle);
  QUERY_CHECK_CODE(code, lino, _end);

  // sorting by row id is only enabled when more than one table is merged
  if (pInfo->bSortRowId && numOfTable != 1) {
    int32_t memSize = 512 * 1024 * 1024;
    code = tsortSetSortByRowId(pInfo->pSortHandle, memSize);
    QUERY_CHECK_CODE(code, lino, _end);
  }

  tsortSetMergeLimit(pInfo->pSortHandle, pInfo->mergeLimit);
  tsortSetMergeLimitReachedFp(pInfo->pSortHandle, tableMergeScanDoSkipTable, pOperator);
  tsortSetAbortCheckFn(pInfo->pSortHandle, isTaskKilled, pOperator->pTaskInfo);

  // The result of this call was never captured, so the status check that used to
  // follow it could not fire and has been removed.
  tsortSetFetchRawDataFp(pInfo->pSortHandle, getBlockForTableMergeScan, NULL, NULL);

  param = taosMemoryCalloc(1, sizeof(STableMergeScanSortSourceParam));
  QUERY_CHECK_NULL(param, code, lino, _end, terrno);
  param->pOperator = pOperator;

  ps = taosMemoryCalloc(1, sizeof(SSortSource));
  if (ps == NULL) {
    taosMemoryFree(param);
    QUERY_CHECK_NULL(ps, code, lino, _end, terrno);
  }

  ps->param = param;
  ps->onlyRef = false;

  // NOTE(review): if tsortAddSource fails, ps/param are not released here; whether the
  // sort handle takes ownership on failure is not visible from this file - confirm.
  code = tsortAddSource(pInfo->pSortHandle, ps);
  QUERY_CHECK_CODE(code, lino, _end);

  if (numOfTable == 1) {
    tsortSetSingleTableMerge(pInfo->pSortHandle);
  } else {
    code = tsortOpen(pInfo->pSortHandle);
    QUERY_CHECK_CODE(code, lino, _end);
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
/*
 * Tear down the sort handle of the current duration. Before destroying it,
 * its execution statistics are folded into pInfo->sortExecInfo: method and
 * buffer size are overwritten, loops / read bytes / written bytes accumulate.
 */
void stopDurationForGroupTableMergeScan(SOperatorInfo* pOperator) {
  SExecTaskInfo*       pTask = pOperator->pTaskInfo;
  STableMergeScanInfo* pScan = pOperator->info;

  qDebug("%s table merge scan stop duration ", GET_TASKID(pTask));

  SSortExecInfo  latest = tsortGetSortExecInfo(pScan->pSortHandle);
  SSortExecInfo* pTotal = &pScan->sortExecInfo;

  pTotal->sortMethod = latest.sortMethod;
  pTotal->sortBuffer = latest.sortBuffer;
  pTotal->loops += latest.loops;
  pTotal->readBytes += latest.readBytes;
  pTotal->writeBytes += latest.writeBytes;

  tsortDestroySortHandle(pScan->pSortHandle);
  pScan->pSortHandle = NULL;
}
2024-07-19 08:15:37 +00:00
/*
 * Begin scanning the group identified by pInfo->groupId, starting at
 * pInfo->tableStartIndex.
 *
 * Steps:
 *  1. extend tableEndIndex over the consecutive tables sharing the group id;
 *  2. open a tsdb reader over that table range and register the notify callback;
 *  3. start the first sort duration for the group.
 *
 * Errors are stored in the task and reported through T_LONG_JMP, so this
 * function does not return normally on failure.
 */
void startGroupTableMergeScan(SOperatorInfo* pOperator) {
  int32_t              code = TSDB_CODE_SUCCESS;
  int32_t              lino = 0;
  STableMergeScanInfo* pInfo = pOperator->info;
  SExecTaskInfo*       pTaskInfo = pOperator->pTaskInfo;
  SReadHandle*         pHandle = &pInfo->base.readHandle;
  SStorageAPI*         pAPI = &pTaskInfo->storageAPI;
  STableKeyInfo*       startKeyInfo = NULL;
  int32_t              numOfTable = 0;

  qDebug("%s table merge scan start group %" PRIu64, GET_TASKID(pTaskInfo), pInfo->groupId);

  {
    int32_t numOfTables = 0;
    code = tableListGetSize(pInfo->base.pTableListInfo, &numOfTables);
    QUERY_CHECK_CODE(code, lino, _end);

    // find the first table that belongs to another group
    int32_t i = pInfo->tableStartIndex + 1;
    for (; i < numOfTables; ++i) {
      STableKeyInfo* tableKeyInfo = tableListGetInfo(pInfo->base.pTableListInfo, i);
      QUERY_CHECK_NULL(tableKeyInfo, code, lino, _end, terrno);
      if (tableKeyInfo->groupId != pInfo->groupId) {
        break;
      }
    }
    pInfo->tableEndIndex = i - 1;
  }

  pInfo->bGroupProcessed = false;

  numOfTable = pInfo->tableEndIndex - pInfo->tableStartIndex + 1;

  // checked like every other tableListGetInfo() result in this file, so a NULL
  // entry is reported as an error instead of being handed to the reader
  startKeyInfo = tableListGetInfo(pInfo->base.pTableListInfo, pInfo->tableStartIndex);
  QUERY_CHECK_NULL(startKeyInfo, code, lino, _end, terrno);

  code = pAPI->tsdReader.tsdReaderOpen(pHandle->vnode, &pInfo->base.cond, startKeyInfo, numOfTable, pInfo->pReaderBlock,
                                       (void**)&pInfo->base.dataReader, GET_TASKID(pTaskInfo), &pInfo->mSkipTables);
  QUERY_CHECK_CODE(code, lino, _end);

  if (pInfo->filesetDelimited) {
    pAPI->tsdReader.tsdSetFilesetDelimited(pInfo->base.dataReader);
  }
  pAPI->tsdReader.tsdSetSetNotifyCb(pInfo->base.dataReader, tableMergeScanTsdbNotifyCb, pInfo);

  code = startDurationForGroupTableMergeScan(pOperator);
  QUERY_CHECK_CODE(code, lino, _end);

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  }
}
2024-07-19 08:15:37 +00:00
/*
 * Finish the current group: stop the active sort duration, close the tsdb
 * reader, release every prefetched next-duration block, reset the per-group
 * limit state and drop the skip-table hash.
 */
void stopGroupTableMergeScan(SOperatorInfo* pOperator) {
  STableMergeScanInfo* pInfo = pOperator->info;
  SExecTaskInfo*       pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*         pAPI = &pTaskInfo->storageAPI;

  stopDurationForGroupTableMergeScan(pOperator);

  if (pInfo->base.dataReader != NULL) {
    pAPI->tsdReader.tsdReaderClose(pInfo->base.dataReader);
    pInfo->base.dataReader = NULL;
  }

  for (int32_t i = 0; i < pInfo->numNextDurationBlocks; ++i) {
    if (pInfo->nextDurationBlocks[i]) {
      blockDataDestroy(pInfo->nextDurationBlocks[i]);
      pInfo->nextDurationBlocks[i] = NULL;
    }
  }
  // Reset the counters only after ALL blocks were visited. Doing it inside the
  // loop zeroed the loop bound after the first iteration and leaked the rest.
  pInfo->numNextDurationBlocks = 0;
  pInfo->nextDurationBlocksIdx = 0;

  resetLimitInfoForNextGroup(&pInfo->limitInfo);
  taosHashCleanup(pInfo->mSkipTables);
  pInfo->mSkipTables = NULL;

  qDebug("%s table merge scan stop group %" PRIu64, GET_TASKID(pTaskInfo), pInfo->groupId);
}
// all data produced by this function only belongs to one group
// slimit/soffset does not need to be concerned here, since this function only deal with data within one group.
2022-07-27 02:52:25 +00:00
SSDataBlock* getSortedTableMergeScanBlockData(SSortHandle* pHandle, SSDataBlock* pResBlock, int32_t capacity,
SOperatorInfo* pOperator) {
2022-06-14 10:17:18 +00:00
STableMergeScanInfo* pInfo = pOperator->info;
SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2024-09-24 10:19:47 +00:00
STupleHandle* pTupleHandle = NULL;
2022-06-14 10:17:18 +00:00
2022-07-25 08:41:32 +00:00
blockDataCleanup(pResBlock);
2024-09-24 10:19:47 +00:00
2022-06-14 10:17:18 +00:00
while (1) {
2023-07-20 04:29:34 +00:00
while (1) {
pTupleHandle = NULL;
int32_t code = tsortNextTuple(pHandle, &pTupleHandle);
2024-08-26 06:58:12 +00:00
if (code != TSDB_CODE_SUCCESS) {
qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(code));
T_LONG_JMP(pOperator->pTaskInfo->env, code);
}
if (pTupleHandle == NULL) {
2023-07-20 04:29:34 +00:00
break;
}
2024-07-26 12:48:06 +00:00
code = tsortAppendTupleToBlock(pInfo->pSortHandle, pResBlock, pTupleHandle);
if (code != TSDB_CODE_SUCCESS) {
qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(code));
T_LONG_JMP(pOperator->pTaskInfo->env, terrno);
}
2023-07-20 04:29:34 +00:00
if (pResBlock->info.rows >= capacity) {
break;
}
2022-06-14 10:17:18 +00:00
}
2023-07-20 04:29:34 +00:00
if (tsortIsClosed(pHandle)) {
terrno = TSDB_CODE_TSC_QUERY_CANCELLED;
T_LONG_JMP(pOperator->pTaskInfo->env, terrno);
2022-06-14 10:17:18 +00:00
}
2024-07-19 08:15:37 +00:00
2023-07-20 04:29:34 +00:00
bool limitReached = applyLimitOffset(&pInfo->limitInfo, pResBlock, pTaskInfo);
qDebug("%s get sorted row block, rows:%" PRId64 ", limit:%" PRId64, GET_TASKID(pTaskInfo), pResBlock->info.rows,
2024-07-19 08:15:37 +00:00
pInfo->limitInfo.numOfOutputRows);
2023-07-20 04:29:34 +00:00
if (pTupleHandle == NULL || limitReached || pResBlock->info.rows > 0) {
break;
2024-07-19 08:15:37 +00:00
}
2023-06-26 10:43:00 +00:00
}
2022-07-25 08:41:32 +00:00
return (pResBlock->info.rows > 0) ? pResBlock : NULL;
2022-06-14 10:17:18 +00:00
}
2024-07-24 08:17:28 +00:00
/*
 * Produce the next result block of the table merge scan operator.
 *
 * pOperator - the operator
 * ppRes     - receives the next block, or NULL when nothing is produced
 *             (operator done, task killed, or all groups consumed)
 *
 * Groups are processed one after another. Within a group, a pending
 * new-fileset event restarts the sort duration; otherwise an empty result
 * moves the scan on to the next group. When needCountEmptyTable is set, a
 * group that produced no data yields a single one-row block.
 *
 * Returns TSDB_CODE_SUCCESS; failures are stored in the task and reported
 * through T_LONG_JMP.
 */
int32_t doTableMergeScanNext(SOperatorInfo* pOperator, SSDataBlock** ppRes) {
  if (OP_EXEC_DONE == pOperator->status) {
    (*ppRes) = NULL;
    return TSDB_CODE_SUCCESS;
  }

  SExecTaskInfo*       pTaskInfo = pOperator->pTaskInfo;
  STableMergeScanInfo* pInfo = pOperator->info;
  SSDataBlock*         pBlock = NULL;
  int32_t              code = TSDB_CODE_SUCCESS;
  int32_t              lino = 0;
  int32_t              tableListSize = 0;
  int64_t              st = 0;

  code = pOperator->fpSet._openFn(pOperator);
  QUERY_CHECK_CODE(code, lino, _end);

  st = taosGetTimestampUs();

  code = tableListGetSize(pInfo->base.pTableListInfo, &tableListSize);
  QUERY_CHECK_CODE(code, lino, _end);

  // first call: position on the first group
  if (!pInfo->hasGroupId) {
    pInfo->hasGroupId = true;

    if (0 == tableListSize) {
      setOperatorCompleted(pOperator);
      (*ppRes) = NULL;
      return code;
    }

    pInfo->tableStartIndex = 0;
    STableKeyInfo* pFirst = (STableKeyInfo*)tableListGetInfo(pInfo->base.pTableListInfo, pInfo->tableStartIndex);
    QUERY_CHECK_NULL(pFirst, code, lino, _end, terrno);
    pInfo->groupId = pFirst->groupId;
    startGroupTableMergeScan(pOperator);
  }

  while (pInfo->tableStartIndex < tableListSize) {
    if (isTaskKilled(pTaskInfo)) {
      goto _end;
    }

    pBlock = getSortedTableMergeScanBlockData(pInfo->pSortHandle, pInfo->pResBlock, pOperator->resultInfo.capacity,
                                              pOperator);

    if (NULL == pBlock && !pInfo->bGroupProcessed && pInfo->needCountEmptyTable) {
      STableKeyInfo* tbInfo = tableListGetInfo(pInfo->base.pTableListInfo, pInfo->tableStartIndex);
      QUERY_CHECK_NULL(tbInfo, code, lino, _end, terrno);
      pBlock = getOneRowResultBlock(pTaskInfo, &pInfo->base, pInfo->pResBlock, tbInfo);
    }

    if (NULL != pBlock) {
      pBlock->info.id.groupId = pInfo->groupId;
      pOperator->resultInfo.totalRows += pBlock->info.rows;
      pInfo->bGroupProcessed = true;
      break;
    }

    if (pInfo->bNewFilesetEvent) {
      // same group, next fileset: restart the sort duration
      stopDurationForGroupTableMergeScan(pOperator);
      code = startDurationForGroupTableMergeScan(pOperator);
      QUERY_CHECK_CODE(code, lino, _end);
      continue;
    }

    // Data of this group are all dumped, let's try the next group
    stopGroupTableMergeScan(pOperator);
    if (pInfo->tableEndIndex >= tableListSize - 1) {
      setOperatorCompleted(pOperator);
      break;
    }

    pInfo->tableStartIndex = pInfo->tableEndIndex + 1;
    STableKeyInfo* pNext = tableListGetInfo(pInfo->base.pTableListInfo, pInfo->tableStartIndex);
    QUERY_CHECK_NULL(pNext, code, lino, _end, terrno);
    pInfo->groupId = pNext->groupId;
    startGroupTableMergeScan(pOperator);
    resetLimitInfoForNextGroup(&pInfo->limitInfo);
  }

  pOperator->cost.totalCost += (taosGetTimestampUs() - st) / 1000.0;

_end:
  if (TSDB_CODE_SUCCESS != code) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  } else {
    (*ppRes) = pBlock;
  }

  return code;
}
/*
 * Pointer-returning wrapper around doTableMergeScanNext(): returns the block
 * it produced (possibly NULL) and discards the status code.
 */
static SSDataBlock* doTableMergeScan(SOperatorInfo* pOperator) {
  SSDataBlock* pNextBlock = NULL;
  (void)doTableMergeScanNext(pOperator, &pNextBlock);
  return pNextBlock;
}
void destroyTableMergeScanOperatorInfo(void* param) {
2022-06-14 10:17:18 +00:00
STableMergeScanInfo* pTableScanInfo = (STableMergeScanInfo*)param;
2022-10-28 15:23:53 +00:00
// start one reader variable
2024-08-07 07:33:09 +00:00
if (pTableScanInfo->base.readerAPI.tsdReaderClose != NULL) {
pTableScanInfo->base.readerAPI.tsdReaderClose(pTableScanInfo->base.dataReader);
pTableScanInfo->base.dataReader = NULL;
}
2023-03-22 08:08:16 +00:00
2023-12-15 13:55:25 +00:00
for (int32_t i = 0; i < pTableScanInfo->numNextDurationBlocks; ++i) {
if (pTableScanInfo->nextDurationBlocks[i] != NULL) {
blockDataDestroy(pTableScanInfo->nextDurationBlocks[i]);
pTableScanInfo->nextDurationBlocks[i] = NULL;
}
}
2022-11-18 10:21:22 +00:00
tsortDestroySortHandle(pTableScanInfo->pSortHandle);
pTableScanInfo->pSortHandle = NULL;
2023-11-17 07:32:14 +00:00
taosHashCleanup(pTableScanInfo->mSkipTables);
2023-11-17 08:18:58 +00:00
pTableScanInfo->mSkipTables = NULL;
2024-07-18 16:09:28 +00:00
blockDataDestroy(pTableScanInfo->pSortInputBlock);
pTableScanInfo->pSortInputBlock = NULL;
// end one reader variable
cleanupQueryTableDataCond(&pTableScanInfo->base.cond);
destroyTableScanBase(&pTableScanInfo->base, &pTableScanInfo->base.readerAPI);
2022-06-14 10:17:18 +00:00
2024-07-19 03:49:05 +00:00
blockDataDestroy(pTableScanInfo->pResBlock);
2024-07-18 16:09:28 +00:00
pTableScanInfo->pResBlock = NULL;
2024-07-19 03:49:05 +00:00
// remove it from the task->result list
2024-07-18 16:09:28 +00:00
blockDataDestroy(pTableScanInfo->pReaderBlock);
pTableScanInfo->pReaderBlock = NULL;
2022-06-14 10:17:18 +00:00
taosArrayDestroy(pTableScanInfo->pSortInfo);
stopSubTablesTableMergeScan(pTableScanInfo);
2022-07-08 06:26:53 +00:00
taosMemoryFreeClear(param);
2022-06-14 10:17:18 +00:00
}
/*
 * Build the EXPLAIN execution info of a table merge scan operator.
 *
 * pOptr        - the operator; NULL yields TSDB_CODE_INVALID_PARA
 * pOptrExplain - receives a newly allocated STableMergeScanExecInfo holding a
 *                copy of the block read recorder and the sort statistics
 * len          - receives sizeof(STableMergeScanExecInfo)
 *
 * Returns TSDB_CODE_SUCCESS, TSDB_CODE_INVALID_PARA, or terrno when the
 * allocation fails.
 */
int32_t getTableMergeScanExplainExecInfo(SOperatorInfo* pOptr, void** pOptrExplain, uint32_t* len) {
  if (NULL == pOptr) {
    qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(TSDB_CODE_INVALID_PARA));
    return TSDB_CODE_INVALID_PARA;
  }

  // TODO: merge these two info into one struct
  STableMergeScanExecInfo* pExplain = taosMemoryCalloc(1, sizeof(STableMergeScanExecInfo));
  if (NULL == pExplain) {
    return terrno;
  }

  STableMergeScanInfo* pScan = pOptr->info;
  pExplain->blockRecorder = pScan->base.readRecorder;
  pExplain->sortExecInfo = pScan->sortExecInfo;

  *len = sizeof(STableMergeScanExecInfo);
  *pOptrExplain = pExplain;

  return TSDB_CODE_SUCCESS;
}
2024-07-24 09:08:08 +00:00
int32_t createTableMergeScanOperatorInfo(STableScanPhysiNode* pTableScanNode, SReadHandle* readHandle,
2024-07-29 02:35:06 +00:00
STableListInfo* pTableListInfo, SExecTaskInfo* pTaskInfo,
SOperatorInfo** pOptrInfo) {
QRY_PARAM_CHECK(pOptrInfo);
2024-07-24 09:08:08 +00:00
2024-08-08 03:23:50 +00:00
int32_t code = TSDB_CODE_SUCCESS;
int32_t lino = 0;
2022-06-14 10:17:18 +00:00
STableMergeScanInfo* pInfo = taosMemoryCalloc(1, sizeof(STableMergeScanInfo));
SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
if (pInfo == NULL || pOperator == NULL) {
code = terrno;
2022-06-14 10:17:18 +00:00
goto _error;
}
2022-06-14 10:17:18 +00:00
SDataBlockDescNode* pDescNode = pTableScanNode->scan.node.pOutputDataBlockDesc;
int32_t numOfCols = 0;
2024-07-24 09:08:08 +00:00
code = extractColMatchInfo(pTableScanNode->scan.pScanCols, pDescNode, &numOfCols, COL_MATCH_FROM_COL_ID,
2024-07-29 02:35:06 +00:00
&pInfo->base.matchInfo);
2024-08-08 03:23:50 +00:00
QUERY_CHECK_CODE(code, lino, _error);
2022-06-14 10:17:18 +00:00
2023-11-07 11:59:05 +00:00
code = initQueryTableDataCond(&pInfo->base.cond, pTableScanNode, readHandle);
2024-08-08 03:23:50 +00:00
QUERY_CHECK_CODE(code, lino, _error);
2022-06-14 10:17:18 +00:00
if (pTableScanNode->scan.pScanPseudoCols != NULL) {
2022-11-18 01:47:26 +00:00
SExprSupp* pSup = &pInfo->base.pseudoSup;
2024-08-05 03:57:18 +00:00
code = createExprInfo(pTableScanNode->scan.pScanPseudoCols, NULL, &pSup->pExprInfo, &pSup->numOfExprs);
QUERY_CHECK_CODE(code, lino, _error);
2024-07-19 08:15:37 +00:00
pSup->pCtx = createSqlFunctionCtx(pSup->pExprInfo, pSup->numOfExprs, &pSup->rowEntryInfoOffset,
&pTaskInfo->storageAPI.functionStore);
2024-08-05 04:22:25 +00:00
QUERY_CHECK_NULL(pSup->pCtx, code, lino, _error, terrno);
2022-06-14 10:17:18 +00:00
}
pInfo->scanInfo = (SScanInfo){.numOfAsc = pTableScanNode->scanSeq[0], .numOfDesc = pTableScanNode->scanSeq[1]};
2022-11-18 09:07:09 +00:00
pInfo->base.metaCache.pTableMetaEntryCache = taosLRUCacheInit(1024 * 128, -1, .5);
2024-08-08 03:23:50 +00:00
QUERY_CHECK_NULL(pInfo->base.metaCache.pTableMetaEntryCache, code, lino, _error, terrno);
2022-11-18 09:07:09 +00:00
2023-05-24 15:49:26 +00:00
pInfo->base.readerAPI = pTaskInfo->storageAPI.tsdReader;
2022-11-18 05:40:03 +00:00
pInfo->base.dataBlockLoadFlag = FUNC_DATA_REQUIRED_DATA_LOAD;
pInfo->base.scanFlag = MAIN_SCAN;
2022-11-18 01:47:26 +00:00
pInfo->base.readHandle = *readHandle;
pInfo->readIdx = -1;
pInfo->base.limitInfo.limit.limit = -1;
pInfo->base.limitInfo.slimit.limit = -1;
pInfo->base.pTableListInfo = pTableListInfo;
2022-11-18 05:40:03 +00:00
2022-06-14 10:17:18 +00:00
pInfo->sample.sampleRatio = pTableScanNode->ratio;
2022-06-20 06:29:18 +00:00
pInfo->sample.seed = taosGetTimestampSec();
2022-11-04 14:13:40 +00:00
2025-05-09 10:05:02 +00:00
code = filterInitFromNode((SNode*)pTableScanNode->scan.node.pConditions, &pOperator->exprSupp.pFilterInfo, 0,
&pTaskInfo->pStreamRuntimeInfo);
2024-08-08 03:23:50 +00:00
QUERY_CHECK_CODE(code, lino, _error);
2022-11-04 14:13:40 +00:00
initLimitInfo(pTableScanNode->scan.node.pLimit, pTableScanNode->scan.node.pSlimit, &pInfo->limitInfo);
2023-11-17 07:32:14 +00:00
pInfo->mergeLimit = -1;
bool hasLimit = pInfo->limitInfo.limit.limit != -1 || pInfo->limitInfo.limit.offset != -1;
if (hasLimit) {
pInfo->mergeLimit = pInfo->limitInfo.limit.offset != -1 ? pInfo->limitInfo.limit.limit + pInfo->limitInfo.limit.offset : pInfo->limitInfo.limit.limit;
2023-11-17 07:32:14 +00:00
pInfo->mSkipTables = NULL;
}
2023-07-16 12:28:54 +00:00
initResultSizeInfo(&pOperator->resultInfo, 1024);
pInfo->pResBlock = createDataBlockFromDescNode(pDescNode);
2024-07-25 11:11:32 +00:00
QUERY_CHECK_NULL(pInfo->pResBlock, code, lino, _error, terrno);
2024-07-19 08:15:37 +00:00
code = blockDataEnsureCapacity(pInfo->pResBlock, pOperator->resultInfo.capacity);
QUERY_CHECK_CODE(code, lino, _error);
if (!hasLimit && blockDataGetRowSize(pInfo->pResBlock) >= 256 && !pTableScanNode->smallDataTsSort) {
pInfo->bSortRowId = true;
} else {
pInfo->bSortRowId = false;
}
2024-07-19 08:15:37 +00:00
code = prepareDataBlockBuf(pInfo->pResBlock, &pInfo->base.matchInfo);
QUERY_CHECK_CODE(code, lino, _error);
2024-04-08 10:04:06 +00:00
2024-07-19 08:15:37 +00:00
code = generateSortByTsPkInfo(pInfo->base.matchInfo.pList, pInfo->base.cond.order, &pInfo->pSortInfo);
QUERY_CHECK_CODE(code, lino, _error);
2024-07-27 10:55:34 +00:00
code = createOneDataBlock(pInfo->pResBlock, false, &pInfo->pReaderBlock);
QUERY_CHECK_CODE(code, lino, _error);
2023-07-16 12:28:54 +00:00
pInfo->needCountEmptyTable = tsCountAlwaysReturnValue && pTableScanNode->needCountEmptyTable;
2022-11-18 10:21:22 +00:00
int32_t rowSize = pInfo->pResBlock->info.rowSize;
2022-11-16 08:10:22 +00:00
uint32_t nCols = taosArrayGetSize(pInfo->pResBlock->pDataBlock);
2024-07-19 08:15:37 +00:00
2022-11-16 08:10:22 +00:00
pInfo->bufPageSize = getProperSortPageSize(rowSize, nCols);
2024-07-19 08:15:37 +00:00
// start one reader variable
2024-07-27 10:55:34 +00:00
code = createOneDataBlock(pInfo->pResBlock, false, &pInfo->pSortInputBlock);
QUERY_CHECK_CODE(code, lino, _error);
2023-12-15 02:40:54 +00:00
if (!tsExperimental) {
pInfo->filesetDelimited = false;
} else {
pInfo->filesetDelimited = pTableScanNode->filesetDelimited;
}
// end one reader variable
2022-11-11 01:12:57 +00:00
setOperatorInfo(pOperator, "TableMergeScanOperator", QUERY_NODE_PHYSICAL_PLAN_TABLE_MERGE_SCAN, false, OP_NOT_OPENED,
pInfo, pTaskInfo);
2022-06-20 06:40:13 +00:00
pOperator->exprSupp.numOfExprs = numOfCols;
2022-06-14 10:17:18 +00:00
2024-02-02 07:00:09 +00:00
pOperator->fpSet = createOperatorFpSet(
2024-08-27 09:04:44 +00:00
optrDummyOpenFn, pTableScanNode->paraTablesSort ? doTableMergeScanParaSubTablesNext : doTableMergeScanNext, NULL,
2024-02-02 07:00:09 +00:00
destroyTableMergeScanOperatorInfo, optrDefaultBufFn, getTableMergeScanExplainExecInfo, optrDefaultGetNextExtFn,
NULL);
2022-06-14 10:17:18 +00:00
pOperator->cost.openCost = 0;
2024-07-24 09:08:08 +00:00
*pOptrInfo = pOperator;
return code;
2022-06-14 10:17:18 +00:00
_error:
2024-08-08 03:23:50 +00:00
if (code != TSDB_CODE_SUCCESS) {
qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
}
2024-08-06 02:19:22 +00:00
pTaskInfo->code = code;
2024-08-08 08:24:18 +00:00
if (pInfo != NULL) {
pInfo->base.pTableListInfo = NULL;
destroyTableMergeScanOperatorInfo(pInfo);
}
2024-08-07 07:53:23 +00:00
if (pOperator != NULL) {
pOperator->info = NULL;
destroyOperator(pOperator);
}
2024-07-24 09:08:08 +00:00
return code;
2022-06-14 10:17:18 +00:00
}
2022-11-18 03:53:33 +00:00
// ====================================================================================================================
// TableCountScanOperator
2024-09-11 08:37:06 +00:00
/* Forward declarations of the file-local helpers of the table-count scan operator. */

/* Destructor callback; NOTE(review): "destory" is a misspelling kept because the name is referenced elsewhere. */
static void destoryTableCountScanOperator(void* param);
/* The buildVnode* helpers report a status code; presumably they fill pRes with table counts - confirm against their definitions. */
static int32_t buildVnodeGroupedStbTableCount(STableCountScanOperatorInfo* pInfo, STableCountScanSupp* pSupp,
SSDataBlock* pRes, char* dbName, tb_uid_t stbUid, SStorageAPI* pAPI);
static int32_t buildVnodeGroupedNtbTableCount(STableCountScanOperatorInfo* pInfo, STableCountScanSupp* pSupp,
SSDataBlock* pRes, char* dbName, SStorageAPI* pAPI);
static int32_t buildVnodeFilteredTbCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
STableCountScanSupp* pSupp, SSDataBlock* pRes, char* dbName);
static int32_t buildVnodeGroupedTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
STableCountScanSupp* pSupp, SSDataBlock* pRes, int32_t vgId, char* dbName);
static int32_t buildVnodeDbTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
STableCountScanSupp* pSupp, SSDataBlock* pRes);
/* The buildSysDb* helpers return nothing and take the table counts of two system databases as arguments. */
static void buildSysDbGroupedTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
STableCountScanSupp* pSupp, SSDataBlock* pRes, size_t infodbTableNum,
size_t perfdbTableNum);
static void buildSysDbFilterTableCount(SOperatorInfo* pOperator, STableCountScanSupp* pSupp, SSDataBlock* pRes,
size_t infodbTableNum, size_t perfdbTableNum);
/* Column names compared against scan-column names in tblCountScanGetGroupTagsSlotId(). */
static const char* GROUP_TAG_DB_NAME = "db_name";
static const char* GROUP_TAG_STABLE_NAME = "stable_name";
2022-11-25 15:00:14 +00:00
/**
 * Record the output slot ids of the `db_name` and `stable_name` scan columns.
 *
 * Every entry of scanCols must be a target node whose expression is a column node.
 * Columns with any other name are accepted but ignored.
 *
 * @param scanCols list of scan column targets; NULL is accepted and leaves supp untouched
 * @param supp     receives dbNameSlotId / stbNameSlotId for the matching columns
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_SYS_ERROR when an unexpected node type is found
 */
int32_t tblCountScanGetGroupTagsSlotId(const SNodeList* scanCols, STableCountScanSupp* supp) {
  if (scanCols == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  SNode* pItem = NULL;
  FOREACH(pItem, scanCols) {
    if (QUERY_NODE_TARGET != nodeType(pItem)) {
      return TSDB_CODE_QRY_SYS_ERROR;
    }

    STargetNode* pTarget = (STargetNode*)pItem;
    if (QUERY_NODE_COLUMN != nodeType(pTarget->pExpr)) {
      return TSDB_CODE_QRY_SYS_ERROR;
    }

    const char* name = ((SColumnNode*)(pTarget->pExpr))->colName;
    if (0 == strcmp(name, GROUP_TAG_DB_NAME)) {
      supp->dbNameSlotId = pTarget->slotId;
    } else if (0 == strcmp(name, GROUP_TAG_STABLE_NAME)) {
      supp->stbNameSlotId = pTarget->slotId;
    }
  }

  return TSDB_CODE_SUCCESS;
}
/**
 * Record the output slot id of the table-count pseudo column.
 *
 * Every entry of pseudoCols must be a target node whose expression is a function node.
 * Only functions of type FUNCTION_TYPE_TABLE_COUNT are recorded; others are ignored.
 *
 * @param pseudoCols list of pseudo column targets; NULL is accepted and leaves supp untouched
 * @param supp       receives tbCountSlotId for the table-count function
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_SYS_ERROR when an unexpected node type is found
 */
int32_t tblCountScanGetCountSlotId(const SNodeList* pseudoCols, STableCountScanSupp* supp) {
  if (pseudoCols == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  SNode* pItem = NULL;
  FOREACH(pItem, pseudoCols) {
    if (QUERY_NODE_TARGET != nodeType(pItem)) {
      return TSDB_CODE_QRY_SYS_ERROR;
    }

    STargetNode* pTarget = (STargetNode*)pItem;
    if (QUERY_NODE_FUNCTION != nodeType(pTarget->pExpr)) {
      return TSDB_CODE_QRY_SYS_ERROR;
    }

    SFunctionNode* pFunc = (SFunctionNode*)(pTarget->pExpr);
    if (FUNCTION_TYPE_TABLE_COUNT == pFunc->funcType) {
      supp->tbCountSlotId = pTarget->slotId;
    }
  }

  return TSDB_CODE_SUCCESS;
}
/**
 * Derive the grouping flags or the name filters of a table-count scan.
 *
 * With group tags present, each tag must be a column node; `db_name` and `stable_name`
 * switch on groupByDbName / groupByStbName respectively. Without group tags, the db and
 * table parts of tableName are copied into the dbNameFilter / stbNameFilter buffers.
 *
 * @param groupTags group-by tag columns, or NULL when the scan is not grouped
 * @param tableName name whose db/table parts become the filters in the non-grouped case
 * @param supp      scan support structure to update
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_SYS_ERROR when a group tag is not a column node
 */
int32_t tblCountScanGetInputs(SNodeList* groupTags, SName* tableName, STableCountScanSupp* supp) {
  if (groupTags == NULL) {
    // no grouping requested: the scan is filtered by the names carried in tableName instead
    tstrncpy(supp->dbNameFilter, tNameGetDbNameP(tableName), TSDB_DB_NAME_LEN);
    tstrncpy(supp->stbNameFilter, tNameGetTableName(tableName), TSDB_TABLE_NAME_LEN);
    return TSDB_CODE_SUCCESS;
  }

  SNode* pTag = NULL;
  FOREACH(pTag, groupTags) {
    if (QUERY_NODE_COLUMN != nodeType(pTag)) {
      return TSDB_CODE_QRY_SYS_ERROR;
    }

    const char* tagName = ((SColumnNode*)pTag)->colName;
    if (0 == strcmp(tagName, GROUP_TAG_DB_NAME)) {
      supp->groupByDbName = true;
    }
    if (0 == strcmp(tagName, GROUP_TAG_STABLE_NAME)) {
      supp->groupByStbName = true;
    }
  }

  return TSDB_CODE_SUCCESS;
}
/**
 * Populate a STableCountScanSupp from the physical plan pieces of a table-count scan.
 *
 * Runs three steps in order and stops at the first failure: grouping flags / name filters,
 * slot ids of the group tag columns, and the slot id of the count pseudo column. The three
 * slot ids are reset to -1 before they are resolved, so -1 means "column not requested".
 *
 * @param groupTags  group-by tag columns, may be NULL
 * @param tableName  table name used for the filters when groupTags is NULL
 * @param scanCols   scan column targets, may be NULL
 * @param pseudoCols pseudo column targets, may be NULL
 * @param supp       structure to fill in
 * @param taskInfo   task the scan belongs to; used for the log prefix only
 * @return TSDB_CODE_SUCCESS or the error code of the failing step
 */
int32_t getTableCountScanSupp(SNodeList* groupTags, SName* tableName, SNodeList* scanCols, SNodeList* pseudoCols,
                              STableCountScanSupp* supp, SExecTaskInfo* taskInfo) {
  int32_t rc = tblCountScanGetInputs(groupTags, tableName, supp);
  if (TSDB_CODE_SUCCESS != rc) {
    qError("%s get table count scan supp. get inputs error", GET_TASKID(taskInfo));
    return rc;
  }

  supp->dbNameSlotId = -1;
  supp->stbNameSlotId = -1;
  supp->tbCountSlotId = -1;

  rc = tblCountScanGetGroupTagsSlotId(scanCols, supp);
  if (TSDB_CODE_SUCCESS != rc) {
    qError("%s get table count scan supp. get group tags slot id error", GET_TASKID(taskInfo));
    return rc;
  }

  rc = tblCountScanGetCountSlotId(pseudoCols, supp);
  if (TSDB_CODE_SUCCESS != rc) {
    qError("%s get table count scan supp. get count error", GET_TASKID(taskInfo));
  }
  return rc;
}
2022-11-18 03:53:33 +00:00
2024-07-24 09:08:08 +00:00
int32_t createTableCountScanOperatorInfo(SReadHandle* readHandle, STableCountScanPhysiNode* pTblCountScanNode,
2024-07-29 02:35:06 +00:00
SExecTaskInfo* pTaskInfo, SOperatorInfo** pOptrInfo) {
QRY_PARAM_CHECK(pOptrInfo);
2022-11-18 03:53:33 +00:00
2024-07-24 09:08:08 +00:00
int32_t code = TSDB_CODE_SUCCESS;
int32_t lino = 0;
2022-11-25 15:00:14 +00:00
SScanPhysiNode* pScanNode = &pTblCountScanNode->scan;
STableCountScanOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(STableCountScanOperatorInfo));
2022-11-25 15:00:14 +00:00
SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
2022-11-18 03:53:33 +00:00
if (!pInfo || !pOperator) {
code = terrno;
2022-11-18 03:53:33 +00:00
goto _error;
}
pInfo->readHandle = *readHandle;
SDataBlockDescNode* pDescNode = pScanNode->node.pOutputDataBlockDesc;
initResultSizeInfo(&pOperator->resultInfo, 1);
pInfo->pRes = createDataBlockFromDescNode(pDescNode);
2024-07-25 11:11:32 +00:00
QUERY_CHECK_NULL(pInfo->pRes, code, lino, _error, terrno);
2022-11-18 03:53:33 +00:00
2024-07-19 08:15:37 +00:00
code = blockDataEnsureCapacity(pInfo->pRes, pOperator->resultInfo.capacity);
QUERY_CHECK_CODE(code, lino, _error);
code = getTableCountScanSupp(pTblCountScanNode->pGroupTags, &pTblCountScanNode->scan.tableName,
pTblCountScanNode->scan.pScanCols, pTblCountScanNode->scan.pScanPseudoCols, &pInfo->supp,
pTaskInfo);
QUERY_CHECK_CODE(code, lino, _error);
2022-11-18 03:53:33 +00:00
setOperatorInfo(pOperator, "TableCountScanOperator", QUERY_NODE_PHYSICAL_PLAN_TABLE_COUNT_SCAN, false, OP_NOT_OPENED,
pInfo, pTaskInfo);
2024-08-27 09:04:44 +00:00
pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, doTableCountScanNext, NULL, destoryTableCountScanOperator,
2023-09-01 05:24:47 +00:00
optrDefaultBufFn, NULL, optrDefaultGetNextExtFn, NULL);
2024-07-24 09:08:08 +00:00
*pOptrInfo = pOperator;
return code;
2022-11-18 03:53:33 +00:00
_error:
if (pInfo != NULL) {
destoryTableCountScanOperator(pInfo);
}
2024-08-07 07:53:23 +00:00
if (pOperator != NULL) {
pOperator->info = NULL;
destroyOperator(pOperator);
}
2022-11-18 03:53:33 +00:00
pTaskInfo->code = code;
2024-07-24 09:08:08 +00:00
return code;
2022-11-18 03:53:33 +00:00
}
2024-07-19 08:15:37 +00:00
/**
 * Write one result row (row 0) of a table-count scan into pRes.
 *
 * Only the columns whose slot id in pSupp is not -1 are written:
 *  - db name:     stored as a var-string; an empty or NULL dbName is rejected
 *  - stable name: stored as a var-string, or set to NULL when stbName is empty or NULL
 *  - count:       stored from the int64_t value
 *
 * The var-string length header is taken from the bytes actually copied, so a name that does
 * not fit the fixed-size buffer is truncated consistently instead of advertising a length
 * beyond the buffer.
 *
 * @param pSupp   slot ids of the output columns
 * @param dbName  database name for the row
 * @param stbName super table name for the row; "" yields a NULL cell
 * @param count   number of tables for the row
 * @param pRes    result block; pRes->info.rows is set to 1 on success
 * @return TSDB_CODE_SUCCESS or the error code of the failing step
 */
int32_t fillTableCountScanDataBlock(STableCountScanSupp* pSupp, char* dbName, char* stbName, int64_t count,
                                    SSDataBlock* pRes) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;

  if (pSupp->dbNameSlotId != -1) {
    QUERY_CHECK_CONDITION((dbName != NULL && strlen(dbName) > 0), code, lino, _end,
                          TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);

    SColumnInfoData* colInfoData = taosArrayGet(pRes->pDataBlock, pSupp->dbNameSlotId);
    QUERY_CHECK_NULL(colInfoData, code, lino, _end, terrno);

    char varDbName[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
    tstrncpy(varDataVal(varDbName), dbName, TSDB_DB_NAME_LEN);
    // length of the (possibly truncated) copy, never the length of the unbounded source
    varDataSetLen(varDbName, strlen(varDataVal(varDbName)));

    code = colDataSetVal(colInfoData, 0, varDbName, false);
    QUERY_CHECK_CODE(code, lino, _end);
  }

  if (pSupp->stbNameSlotId != -1) {
    SColumnInfoData* colInfoData = taosArrayGet(pRes->pDataBlock, pSupp->stbNameSlotId);
    QUERY_CHECK_NULL(colInfoData, code, lino, _end, terrno);

    if (stbName != NULL && stbName[0] != '\0') {
      char varStbName[TSDB_TABLE_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
      tstrncpy(varDataVal(varStbName), stbName, TSDB_TABLE_NAME_LEN);
      varDataSetLen(varStbName, strlen(varDataVal(varStbName)));

      code = colDataSetVal(colInfoData, 0, varStbName, false);
      QUERY_CHECK_CODE(code, lino, _end);
    } else {
      colDataSetNULL(colInfoData, 0);
    }
  }

  if (pSupp->tbCountSlotId != -1) {
    SColumnInfoData* colInfoData = taosArrayGet(pRes->pDataBlock, pSupp->tbCountSlotId);
    QUERY_CHECK_NULL(colInfoData, code, lino, _end, terrno);

    code = colDataSetVal(colInfoData, 0, (char*)&count, false);
    QUERY_CHECK_CODE(code, lino, _end);
  }

  pRes->info.rows = 1;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
/**
 * Produce the next table-count row for the system databases.
 *
 * Fetches the table counts of the information-schema and performance-schema metadata and
 * hands them to the grouped or the filtered builder, depending on the group-by flags.
 *
 * @param pOperator the table-count scan operator
 * @param pInfo     operator info holding the scan support data and the result block
 * @return pInfo->pRes when it holds at least one row, otherwise NULL
 */
static SSDataBlock* buildSysDbTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo) {
  STableCountScanSupp* pSupp = &pInfo->supp;
  SSDataBlock*         pBlock = pInfo->pRes;

  size_t numOfInfoTables;
  getInfosDbMeta(NULL, &numOfInfoTables);
  // NOTE(review): one information_schema entry is excluded from the count; the reason is not visible here
  numOfInfoTables -= 1;

  size_t numOfPerfTables;
  getPerfDbMeta(NULL, &numOfPerfTables);

  bool grouped = pSupp->groupByDbName || pSupp->groupByStbName;
  if (grouped) {
    buildSysDbGroupedTableCount(pOperator, pInfo, pSupp, pBlock, numOfInfoTables, numOfPerfTables);
  } else {
    buildSysDbFilterTableCount(pOperator, pSupp, pBlock, numOfInfoTables, numOfPerfTables);
  }

  return (pBlock->info.rows > 0) ? pBlock : NULL;
}
2022-12-01 11:05:33 +00:00
/**
 * Build the single, non-grouped table-count row for the system databases.
 *
 * The db name filter selects the row:
 *  - information schema  -> infodbTableNum
 *  - performance schema  -> perfdbTableNum
 *  - empty filter        -> sum of both, with an empty db name
 *  - anything else       -> no row is written
 *
 * On success the operator is marked completed. On failure the error is stored in the task
 * and control leaves through T_LONG_JMP.
 */
static void buildSysDbFilterTableCount(SOperatorInfo* pOperator, STableCountScanSupp* pSupp, SSDataBlock* pRes,
                                       size_t infodbTableNum, size_t perfdbTableNum) {
  int32_t        code = TSDB_CODE_SUCCESS;
  int32_t        lino = 0;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

  const char* filter = pSupp->dbNameFilter;
  char*       rowDbName = NULL;
  size_t      rowCount = 0;
  bool        matched = true;

  if (0 == strcmp(filter, TSDB_INFORMATION_SCHEMA_DB)) {
    rowDbName = TSDB_INFORMATION_SCHEMA_DB;
    rowCount = infodbTableNum;
  } else if (0 == strcmp(filter, TSDB_PERFORMANCE_SCHEMA_DB)) {
    rowDbName = TSDB_PERFORMANCE_SCHEMA_DB;
    rowCount = perfdbTableNum;
  } else if (0 == strlen(filter)) {
    rowDbName = "";
    rowCount = infodbTableNum + perfdbTableNum;
  } else {
    matched = false;
  }

  if (matched) {
    code = fillTableCountScanDataBlock(pSupp, rowDbName, "", rowCount, pRes);
    QUERY_CHECK_CODE(code, lino, _end);
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  }
  setOperatorCompleted(pOperator);
}
/**
 * Build the next grouped table-count row for the system databases.
 *
 * pInfo->currGrpIdx selects the group: 0 is the information schema, 1 the performance
 * schema, and any later index marks the operator completed. The group id is derived from
 * the db name when grouping by db name, otherwise from the empty string. The index is
 * advanced after every successful call.
 *
 * On failure the error is stored in the task and control leaves through T_LONG_JMP.
 */
static void buildSysDbGroupedTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
                                        STableCountScanSupp* pSupp, SSDataBlock* pRes, size_t infodbTableNum,
                                        size_t perfdbTableNum) {
  int32_t        code = TSDB_CODE_SUCCESS;
  int32_t        lino = 0;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

  // pick the system database served by the current group index, if any
  char*  sysDbName = NULL;
  size_t numOfTables = 0;
  if (pInfo->currGrpIdx == 0) {
    sysDbName = TSDB_INFORMATION_SCHEMA_DB;
    numOfTables = infodbTableNum;
  } else if (pInfo->currGrpIdx == 1) {
    sysDbName = TSDB_PERFORMANCE_SCHEMA_DB;
    numOfTables = perfdbTableNum;
  }

  if (sysDbName != NULL) {
    uint64_t groupId = 0;
    if (pSupp->groupByDbName) {
      groupId = calcGroupId(sysDbName, strlen(sysDbName));
    } else {
      groupId = calcGroupId("", 0);
    }
    pRes->info.id.groupId = groupId;

    code = fillTableCountScanDataBlock(pSupp, sysDbName, "", numOfTables, pRes);
    QUERY_CHECK_CODE(code, lino, _end);
  } else {
    setOperatorCompleted(pOperator);
  }

  pInfo->currGrpIdx++;

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  }
}
2024-07-24 08:17:28 +00:00
/**
 * "Get next" callback of the table-count scan operator.
 *
 * Clears the result block, then returns immediately when the operator is already done.
 * When the read handle carries an mnode handle, the row comes from the system database
 * builder; otherwise it comes from the vnode builder, and *ppRes is only assigned when the
 * block holds rows. A vnode builder failure is stored in the task and raised through
 * T_LONG_JMP.
 *
 * @param pOperator the table-count scan operator
 * @param ppRes     output block pointer; validated by QRY_PARAM_CHECK (macro defined elsewhere)
 * @return TSDB_CODE_SUCCESS on the paths that return normally
 */
static int32_t doTableCountScanNext(SOperatorInfo* pOperator, SSDataBlock** ppRes) {
  int32_t                      code = TSDB_CODE_SUCCESS;
  SExecTaskInfo*               pTaskInfo = pOperator->pTaskInfo;
  STableCountScanOperatorInfo* pInfo = pOperator->info;
  SSDataBlock*                 pBlock = pInfo->pRes;

  blockDataCleanup(pBlock);
  QRY_PARAM_CHECK(ppRes);

  if (OP_EXEC_DONE == pOperator->status) {
    return code;
  }

  if (NULL != pInfo->readHandle.mnd) {
    (*ppRes) = buildSysDbTableCount(pOperator, pInfo);
    return code;
  }

  code = buildVnodeDbTableCount(pOperator, pInfo, &pInfo->supp, pBlock);
  if (TSDB_CODE_SUCCESS != code) {
    qError("%s failed since %s", __func__, tstrerror(code));
    pTaskInfo->code = code;
    T_LONG_JMP(pTaskInfo->env, code);
  }

  if (pBlock->info.rows > 0) {
    *ppRes = pBlock;
  }
  return code;
}
/**
 * Build the next table-count row from a vnode.
 *
 * Asks the storage API for the vnode's full db name and vgroup id, strips the account part
 * to get the plain db name, and then delegates to the grouped or the filtered builder
 * depending on the group-by flags.
 *
 * @param pOperator the table-count scan operator
 * @param pInfo     operator info (read handle, group cursor)
 * @param pSupp     scan support data (flags, filters, slot ids)
 * @param pRes      result block to fill
 * @return TSDB_CODE_SUCCESS or the error code of the failing step; the code is also stored
 *         in the task on failure
 */
static int32_t buildVnodeDbTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
                                      STableCountScanSupp* pSupp, SSDataBlock* pRes) {
  int32_t        code = TSDB_CODE_SUCCESS;
  int32_t        lino = 0;
  const char*    db = NULL;
  int32_t        vgId = 0;
  char           dbName[TSDB_DB_NAME_LEN] = {0};
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  SStorageAPI*   pAPI = &pTaskInfo->storageAPI;

  // get dbname
  pAPI->metaFn.getBasicInfo(pInfo->readHandle.vnode, &db, &vgId, NULL, NULL);
  // do not hand an unset name to the parser
  QUERY_CHECK_NULL(db, code, lino, _end, TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);

  SName sn = {0};
  code = tNameFromString(&sn, db, T_NAME_ACCT | T_NAME_DB);
  QUERY_CHECK_CODE(code, lino, _end);

  code = tNameGetDbName(&sn, dbName);
  QUERY_CHECK_CODE(code, lino, _end);

  // route the builder results through QUERY_CHECK_CODE so the log below reports a real line
  if (pSupp->groupByDbName || pSupp->groupByStbName) {
    code = buildVnodeGroupedTableCount(pOperator, pInfo, pSupp, pRes, vgId, dbName);
    QUERY_CHECK_CODE(code, lino, _end);
  } else {
    code = buildVnodeFilteredTbCount(pOperator, pInfo, pSupp, pRes, dbName);
    QUERY_CHECK_CODE(code, lino, _end);
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
    pTaskInfo->code = code;
  }
  return code;
}
static int32_t buildVnodeGroupedTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
2024-09-11 08:37:06 +00:00
STableCountScanSupp* pSupp, SSDataBlock* pRes, int32_t vgId, char* dbName) {
2024-07-19 08:15:37 +00:00
int32_t code = TSDB_CODE_SUCCESS;
int32_t lino = 0;
SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2024-07-19 08:15:37 +00:00
SStorageAPI* pAPI = &pTaskInfo->storageAPI;
2022-12-01 11:05:33 +00:00
if (pSupp->groupByStbName) {
if (pInfo->stbUidList == NULL) {
pInfo->stbUidList = taosArrayInit(16, sizeof(tb_uid_t));
2024-07-25 11:11:32 +00:00
QUERY_CHECK_NULL(pInfo->stbUidList, code, lino, _end, terrno);
2024-07-19 08:15:37 +00:00
code = pAPI->metaFn.storeGetTableList(pInfo->readHandle.vnode, TSDB_SUPER_TABLE, pInfo->stbUidList);
QUERY_CHECK_CODE(code, lino, _end);
2022-12-01 11:05:33 +00:00
}
2022-12-01 11:05:33 +00:00
if (pInfo->currGrpIdx < taosArrayGetSize(pInfo->stbUidList)) {
tb_uid_t stbUid = *(tb_uid_t*)taosArrayGet(pInfo->stbUidList, pInfo->currGrpIdx);
2024-07-19 08:15:37 +00:00
code = buildVnodeGroupedStbTableCount(pInfo, pSupp, pRes, dbName, stbUid, pAPI);
QUERY_CHECK_CODE(code, lino, _end);
2022-12-01 11:05:33 +00:00
pInfo->currGrpIdx++;
} else if (pInfo->currGrpIdx == taosArrayGetSize(pInfo->stbUidList)) {
2024-07-19 08:15:37 +00:00
code = buildVnodeGroupedNtbTableCount(pInfo, pSupp, pRes, dbName, pAPI);
QUERY_CHECK_CODE(code, lino, _end);
2022-12-01 11:05:33 +00:00
pInfo->currGrpIdx++;
2022-11-26 15:03:12 +00:00
} else {
setOperatorCompleted(pOperator);
2022-11-26 15:03:12 +00:00
}
} else {
2022-12-01 11:05:33 +00:00
uint64_t groupId = calcGroupId(dbName, strlen(dbName));
pRes->info.id.groupId = groupId;
int64_t dbTableCount = 0;
pAPI->metaFn.getBasicInfo(pInfo->readHandle.vnode, NULL, NULL, &dbTableCount, NULL);
2024-07-19 08:15:37 +00:00
code = fillTableCountScanDataBlock(pSupp, dbName, "", dbTableCount, pRes);
QUERY_CHECK_CODE(code, lino, _end);
2022-12-01 11:05:33 +00:00
setOperatorCompleted(pOperator);
}
2024-07-19 08:15:37 +00:00
_end:
if (code != TSDB_CODE_SUCCESS) {
qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
2024-07-23 08:34:28 +00:00
pTaskInfo->code = code;
2024-07-19 08:15:37 +00:00
}
return code;
2022-12-01 11:05:33 +00:00
}
static int32_t buildVnodeFilteredTbCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
2024-09-11 08:37:06 +00:00
STableCountScanSupp* pSupp, SSDataBlock* pRes, char* dbName) {
2024-07-19 08:15:37 +00:00
int32_t code = TSDB_CODE_SUCCESS;
int32_t lino = 0;
SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2024-07-19 08:15:37 +00:00
SStorageAPI* pAPI = &pTaskInfo->storageAPI;
2022-12-01 11:05:33 +00:00
if (strlen(pSupp->dbNameFilter) != 0) {
if (strlen(pSupp->stbNameFilter) != 0) {
2023-05-25 09:51:03 +00:00
uint64_t uid = 0;
2024-07-19 08:15:37 +00:00
code = pAPI->metaFn.getTableUidByName(pInfo->readHandle.vnode, pSupp->stbNameFilter, &uid);
QUERY_CHECK_CODE(code, lino, _end);
int64_t numOfChildTables = 0;
code = pAPI->metaFn.getNumOfChildTables(pInfo->readHandle.vnode, uid, &numOfChildTables, NULL, NULL);
2024-07-19 08:15:37 +00:00
QUERY_CHECK_CODE(code, lino, _end);
2024-07-19 08:15:37 +00:00
code = fillTableCountScanDataBlock(pSupp, dbName, pSupp->stbNameFilter, numOfChildTables, pRes);
QUERY_CHECK_CODE(code, lino, _end);
} else {
2023-05-25 09:51:03 +00:00
int64_t tbNumVnode = 0;
pAPI->metaFn.getBasicInfo(pInfo->readHandle.vnode, NULL, NULL, &tbNumVnode, NULL);
2024-07-19 08:15:37 +00:00
code = fillTableCountScanDataBlock(pSupp, dbName, "", tbNumVnode, pRes);
QUERY_CHECK_CODE(code, lino, _end);
2022-11-26 15:03:12 +00:00
}
2022-12-01 11:05:33 +00:00
} else {
int64_t tbNumVnode = 0;
pAPI->metaFn.getBasicInfo(pInfo->readHandle.vnode, NULL, NULL, &tbNumVnode, NULL);
2024-07-19 08:15:37 +00:00
code = fillTableCountScanDataBlock(pSupp, dbName, "", tbNumVnode, pRes);
QUERY_CHECK_CODE(code, lino, _end);
2022-11-26 15:03:12 +00:00
}
2024-07-19 08:15:37 +00:00
_end:
if (code != TSDB_CODE_SUCCESS) {
2024-07-23 08:34:28 +00:00
pTaskInfo->code = code;
2024-07-19 08:15:37 +00:00
qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
}
2022-12-01 11:05:33 +00:00
setOperatorCompleted(pOperator);
return code;
2022-12-01 11:05:33 +00:00
}
2024-07-19 08:15:37 +00:00
/**
 * Build the grouped table-count row for the tables of a vnode that have no super table.
 *
 * The group id is computed from "<dbName>." when grouping by db name, otherwise from the
 * empty string. The count is the last value reported by getBasicInfo. A row is only written
 * when that count is non-zero, and it carries an empty stable name.
 *
 * @param pInfo  operator info (read handle)
 * @param pSupp  scan support data
 * @param pRes   result block to fill
 * @param dbName plain database name of the vnode
 * @param pAPI   storage API used to query the vnode
 * @return TSDB_CODE_SUCCESS or the error code returned while filling the block
 */
static int32_t buildVnodeGroupedNtbTableCount(STableCountScanOperatorInfo* pInfo, STableCountScanSupp* pSupp,
                                              SSDataBlock* pRes, char* dbName, SStorageAPI* pAPI) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;
  char    fullStbName[TSDB_TABLE_FNAME_LEN] = {0};

  if (pSupp->groupByDbName) {
    (void)snprintf(fullStbName, TSDB_TABLE_FNAME_LEN, "%s.%s", dbName, "");
  }

  uint64_t groupId = calcGroupId(fullStbName, strlen(fullStbName));
  pRes->info.id.groupId = groupId;

  int64_t numOfTables = 0;
  pAPI->metaFn.getBasicInfo(pInfo->readHandle.vnode, NULL, NULL, NULL, &numOfTables);

  if (numOfTables != 0) {
    code = fillTableCountScanDataBlock(pSupp, dbName, "", numOfTables, pRes);
    // record the failing line; this also gives the _end label a real jump target
    QUERY_CHECK_CODE(code, lino, _end);
  }

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
2024-07-19 08:15:37 +00:00
/**
 * Build the grouped table-count row for one super table of a vnode.
 *
 * Looks up the super table's name by uid, derives the group id from "<dbName>.<stbName>"
 * (or from the stable name alone when not grouping by db name), and writes a row holding
 * the number of child tables of that super table.
 *
 * @param pInfo  operator info (read handle)
 * @param pSupp  scan support data
 * @param pRes   result block to fill
 * @param dbName plain database name of the vnode
 * @param stbUid uid of the super table
 * @param pAPI   storage API used to query the vnode
 * @return TSDB_CODE_SUCCESS or the error code of the failing step
 */
static int32_t buildVnodeGroupedStbTableCount(STableCountScanOperatorInfo* pInfo, STableCountScanSupp* pSupp,
                                              SSDataBlock* pRes, char* dbName, tb_uid_t stbUid, SStorageAPI* pAPI) {
  int32_t code = TSDB_CODE_SUCCESS;
  int32_t lino = 0;

  // the name is read back through varDataVal(), i.e. past a var-string header
  char stbVarName[TSDB_TABLE_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
  code = pAPI->metaFn.getTableNameByUid(pInfo->readHandle.vnode, stbUid, stbVarName);
  QUERY_CHECK_CODE(code, lino, _end);

  char* pStbName = varDataVal(stbVarName);

  char groupKey[TSDB_TABLE_FNAME_LEN] = {0};
  if (!pSupp->groupByDbName) {
    (void)snprintf(groupKey, TSDB_TABLE_FNAME_LEN, "%s", pStbName);
  } else {
    (void)snprintf(groupKey, TSDB_TABLE_FNAME_LEN, "%s.%s", dbName, pStbName);
  }
  pRes->info.id.groupId = calcGroupId(groupKey, strlen(groupKey));

  int64_t numOfChildTables = 0;
  code = pAPI->metaFn.getNumOfChildTables(pInfo->readHandle.vnode, stbUid, &numOfChildTables, NULL, NULL);
  QUERY_CHECK_CODE(code, lino, _end);

  code = fillTableCountScanDataBlock(pSupp, dbName, pStbName, numOfChildTables, pRes);
  QUERY_CHECK_CODE(code, lino, _end);

_end:
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
  }
  return code;
}
static void destoryTableCountScanOperator(void* param) {
2022-11-25 15:00:14 +00:00
STableCountScanOperatorInfo* pTableCountScanInfo = param;
2022-11-18 03:53:33 +00:00
blockDataDestroy(pTableCountScanInfo->pRes);
2022-11-27 05:50:36 +00:00
taosArrayDestroy(pTableCountScanInfo->stbUidList);
2022-11-18 03:53:33 +00:00
taosMemoryFreeClear(param);
2023-09-01 05:24:47 +00:00
}