1227 lines
41 KiB
C
1227 lines
41 KiB
C
/*
|
|
* Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
|
|
*
|
|
* This program is free software: you can use, redistribute, and/or modify
|
|
* it under the terms of the GNU Affero General Public License, version 3
|
|
* or later ("AGPL"), as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE.
|
|
*
|
|
* You should have received a copy of the GNU Affero General Public License
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#include "executor.h"
|
|
#include "osDir.h"
|
|
#include "osMemory.h"
|
|
#include "streamInt.h"
|
|
#include "streamsm.h"
|
|
#include "tmisce.h"
|
|
#include "tstream.h"
|
|
#include "ttimer.h"
|
|
#include "wal.h"
|
|
|
|
static void streamTaskDestroyUpstreamInfo(SUpstreamInfo* pUpstreamInfo);
|
|
static void streamTaskUpdateUpstreamInfo(SStreamTask* pTask, int32_t nodeId, const SEpSet* pEpSet, bool* pUpdated);
|
|
static void streamTaskUpdateDownstreamInfo(SStreamTask* pTask, int32_t nodeId, const SEpSet* pEpSet, bool* pUpdate);
|
|
static void streamTaskDestroyActiveChkptInfo(SActiveCheckpointInfo* pInfo);
|
|
|
|
static int32_t addToTaskset(SArray* pArray, SStreamTask* pTask) {
|
|
int32_t childId = taosArrayGetSize(pArray);
|
|
pTask->info.selfChildId = childId;
|
|
void* p = taosArrayPush(pArray, &pTask);
|
|
return (p == NULL) ? TSDB_CODE_OUT_OF_MEMORY : TSDB_CODE_SUCCESS;
|
|
}
|
|
|
|
static int32_t doUpdateTaskEpset(SStreamTask* pTask, int32_t nodeId, SEpSet* pEpSet, bool* pUpdated) {
|
|
char buf[512] = {0};
|
|
if (pTask->info.nodeId == nodeId) { // execution task should be moved away
|
|
bool isEqual = isEpsetEqual(&pTask->info.epSet, pEpSet);
|
|
(void)epsetToStr(pEpSet, buf, tListLen(buf));
|
|
|
|
if (!isEqual) {
|
|
(*pUpdated) = true;
|
|
char tmp[512] = {0};
|
|
(void)epsetToStr(&pTask->info.epSet, tmp, tListLen(tmp)); // only for log file, ignore errors
|
|
|
|
epsetAssign(&pTask->info.epSet, pEpSet);
|
|
stDebug("s-task:0x%x (vgId:%d) self node epset is updated %s, old:%s", pTask->id.taskId, nodeId, buf, tmp);
|
|
} else {
|
|
stDebug("s-task:0x%x (vgId:%d) not updated task epset, since epset identical, %s", pTask->id.taskId, nodeId, buf);
|
|
}
|
|
}
|
|
|
|
// check for the dispatch info and the upstream task info
|
|
int32_t level = pTask->info.taskLevel;
|
|
if (level == TASK_LEVEL__SOURCE) {
|
|
streamTaskUpdateDownstreamInfo(pTask, nodeId, pEpSet, pUpdated);
|
|
} else if (level == TASK_LEVEL__AGG) {
|
|
streamTaskUpdateUpstreamInfo(pTask, nodeId, pEpSet, pUpdated);
|
|
streamTaskUpdateDownstreamInfo(pTask, nodeId, pEpSet, pUpdated);
|
|
} else { // TASK_LEVEL__SINK
|
|
streamTaskUpdateUpstreamInfo(pTask, nodeId, pEpSet, pUpdated);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void freeItem(void* p) {
|
|
SStreamContinueExecInfo* pInfo = p;
|
|
rpcFreeCont(pInfo->msg.pCont);
|
|
}
|
|
|
|
static void freeUpstreamItem(void* p) {
|
|
SStreamUpstreamEpInfo** pInfo = p;
|
|
taosMemoryFree(*pInfo);
|
|
}
|
|
|
|
static SStreamUpstreamEpInfo* createStreamTaskEpInfo(const SStreamTask* pTask) {
|
|
SStreamUpstreamEpInfo* pEpInfo = taosMemoryMalloc(sizeof(SStreamUpstreamEpInfo));
|
|
if (pEpInfo == NULL) {
|
|
terrno = TSDB_CODE_OUT_OF_MEMORY;
|
|
return NULL;
|
|
}
|
|
|
|
pEpInfo->childId = pTask->info.selfChildId;
|
|
pEpInfo->epSet = pTask->info.epSet;
|
|
pEpInfo->nodeId = pTask->info.nodeId;
|
|
pEpInfo->taskId = pTask->id.taskId;
|
|
pEpInfo->stage = -1;
|
|
|
|
return pEpInfo;
|
|
}
|
|
|
|
int32_t tNewStreamTask(int64_t streamId, int8_t taskLevel, SEpSet* pEpset, bool fillHistory, int64_t triggerParam,
|
|
SArray* pTaskList, bool hasFillhistory, int8_t subtableWithoutMd5, SStreamTask** p) {
|
|
*p = NULL;
|
|
|
|
SStreamTask* pTask = (SStreamTask*)taosMemoryCalloc(1, sizeof(SStreamTask));
|
|
if (pTask == NULL) {
|
|
stError("s-task:0x%" PRIx64 " failed malloc new stream task, size:%d, code:%s", streamId,
|
|
(int32_t)sizeof(SStreamTask), tstrerror(terrno));
|
|
return TSDB_CODE_OUT_OF_MEMORY;
|
|
}
|
|
|
|
pTask->ver = SSTREAM_TASK_VER;
|
|
pTask->id.taskId = tGenIdPI32();
|
|
pTask->id.streamId = streamId;
|
|
|
|
pTask->info.taskLevel = taskLevel;
|
|
pTask->info.fillHistory = fillHistory;
|
|
pTask->info.delaySchedParam = triggerParam;
|
|
pTask->subtableWithoutMd5 = subtableWithoutMd5;
|
|
|
|
int32_t code = streamCreateStateMachine(pTask);
|
|
if (pTask->status.pSM == NULL || code != TSDB_CODE_SUCCESS) {
|
|
taosMemoryFreeClear(pTask);
|
|
return code;
|
|
}
|
|
|
|
char buf[128] = {0};
|
|
sprintf(buf, "0x%" PRIx64 "-0x%x", pTask->id.streamId, pTask->id.taskId);
|
|
|
|
pTask->id.idStr = taosStrdup(buf);
|
|
pTask->status.schedStatus = TASK_SCHED_STATUS__INACTIVE;
|
|
pTask->status.taskStatus = fillHistory ? TASK_STATUS__SCAN_HISTORY : TASK_STATUS__READY;
|
|
pTask->inputq.status = TASK_INPUT_STATUS__NORMAL;
|
|
pTask->outputq.status = TASK_OUTPUT_STATUS__NORMAL;
|
|
|
|
pTask->taskCheckInfo.pList = taosArrayInit(4, sizeof(SDownstreamStatusInfo));
|
|
code = taosThreadMutexInit(&pTask->taskCheckInfo.checkInfoLock, NULL);
|
|
if (code) {
|
|
return code;
|
|
}
|
|
|
|
if (fillHistory) {
|
|
ASSERT(hasFillhistory);
|
|
}
|
|
|
|
epsetAssign(&(pTask->info.mnodeEpset), pEpset);
|
|
|
|
code = addToTaskset(pTaskList, pTask);
|
|
*p = pTask;
|
|
|
|
return code;
|
|
}
|
|
|
|
int32_t tDecodeStreamTaskChkInfo(SDecoder* pDecoder, SCheckpointInfo* pChkpInfo) {
|
|
int64_t skip64;
|
|
int8_t skip8;
|
|
int32_t skip32;
|
|
int16_t skip16;
|
|
SEpSet epSet;
|
|
|
|
if (tStartDecode(pDecoder) < 0) return -1;
|
|
if (tDecodeI64(pDecoder, &pChkpInfo->msgVer) < 0) return -1;
|
|
// if (ver <= SSTREAM_TASK_INCOMPATIBLE_VER) return -1;
|
|
|
|
if (tDecodeI64(pDecoder, &skip64) < 0) return -1;
|
|
if (tDecodeI32(pDecoder, &skip32) < 0) return -1;
|
|
if (tDecodeI32(pDecoder, &skip32) < 0) return -1;
|
|
if (tDecodeI8(pDecoder, &skip8) < 0) return -1;
|
|
if (tDecodeI8(pDecoder, &skip8) < 0) return -1;
|
|
if (tDecodeI16(pDecoder, &skip16) < 0) return -1;
|
|
|
|
if (tDecodeI8(pDecoder, &skip8) < 0) return -1;
|
|
if (tDecodeI8(pDecoder, &skip8) < 0) return -1;
|
|
|
|
if (tDecodeI32(pDecoder, &skip32) < 0) return -1;
|
|
if (tDecodeI32(pDecoder, &skip32) < 0) return -1;
|
|
if (tDecodeSEpSet(pDecoder, &epSet) < 0) return -1;
|
|
if (tDecodeSEpSet(pDecoder, &epSet) < 0) return -1;
|
|
|
|
if (tDecodeI64(pDecoder, &pChkpInfo->checkpointId) < 0) return -1;
|
|
if (tDecodeI64(pDecoder, &pChkpInfo->checkpointVer) < 0) return -1;
|
|
|
|
tEndDecode(pDecoder);
|
|
return 0;
|
|
}
|
|
|
|
int32_t tDecodeStreamTaskId(SDecoder* pDecoder, STaskId* pTaskId) {
|
|
int64_t ver;
|
|
if (tStartDecode(pDecoder) < 0) return -1;
|
|
if (tDecodeI64(pDecoder, &ver) < 0) return -1;
|
|
if (ver <= SSTREAM_TASK_INCOMPATIBLE_VER) return -1;
|
|
|
|
if (tDecodeI64(pDecoder, &pTaskId->streamId) < 0) return -1;
|
|
|
|
int32_t taskId = 0;
|
|
if (tDecodeI32(pDecoder, &taskId) < 0) return -1;
|
|
|
|
pTaskId->taskId = taskId;
|
|
tEndDecode(pDecoder);
|
|
return 0;
|
|
}
|
|
|
|
void tFreeStreamTask(SStreamTask* pTask) {
|
|
char* p = NULL;
|
|
int32_t taskId = pTask->id.taskId;
|
|
|
|
STaskExecStatisInfo* pStatis = &pTask->execInfo;
|
|
|
|
ETaskStatus status1 = TASK_STATUS__UNINIT;
|
|
streamMutexLock(&pTask->lock);
|
|
if (pTask->status.pSM != NULL) {
|
|
SStreamTaskState pStatus = streamTaskGetStatus(pTask);
|
|
p = pStatus.name;
|
|
status1 = pStatus.state;
|
|
}
|
|
streamMutexUnlock(&pTask->lock);
|
|
|
|
stDebug("start to free s-task:0x%x %p, state:%s", taskId, pTask, p);
|
|
|
|
SCheckpointInfo* pCkInfo = &pTask->chkInfo;
|
|
stDebug("s-task:0x%x task exec summary: create:%" PRId64 ", init:%" PRId64 ", start:%" PRId64
|
|
", updateCount:%d latestUpdate:%" PRId64 ", latestCheckPoint:%" PRId64 ", ver:%" PRId64
|
|
" nextProcessVer:%" PRId64 ", checkpointCount:%d",
|
|
taskId, pStatis->created, pStatis->checkTs, pStatis->readyTs, pStatis->updateCount, pStatis->latestUpdateTs,
|
|
pCkInfo->checkpointId, pCkInfo->checkpointVer, pCkInfo->nextProcessVer, pStatis->checkpoint);
|
|
|
|
// remove the ref by timer
|
|
while (pTask->status.timerActive > 0) {
|
|
stDebug("s-task:%s wait for task stop timer activities, ref:%d", pTask->id.idStr, pTask->status.timerActive);
|
|
taosMsleep(100);
|
|
}
|
|
|
|
if (pTask->schedInfo.pDelayTimer != NULL) {
|
|
(void)taosTmrStop(pTask->schedInfo.pDelayTimer);
|
|
pTask->schedInfo.pDelayTimer = NULL;
|
|
}
|
|
|
|
if (pTask->hTaskInfo.pTimer != NULL) {
|
|
(void)taosTmrStop(pTask->hTaskInfo.pTimer);
|
|
pTask->hTaskInfo.pTimer = NULL;
|
|
}
|
|
|
|
if (pTask->msgInfo.pRetryTmr != NULL) {
|
|
(void)taosTmrStop(pTask->msgInfo.pRetryTmr);
|
|
pTask->msgInfo.pRetryTmr = NULL;
|
|
}
|
|
|
|
if (pTask->inputq.queue) {
|
|
streamQueueClose(pTask->inputq.queue, pTask->id.taskId);
|
|
}
|
|
|
|
if (pTask->outputq.queue) {
|
|
streamQueueClose(pTask->outputq.queue, pTask->id.taskId);
|
|
}
|
|
|
|
if (pTask->exec.qmsg) {
|
|
taosMemoryFree(pTask->exec.qmsg);
|
|
}
|
|
|
|
if (pTask->exec.pExecutor) {
|
|
qDestroyTask(pTask->exec.pExecutor);
|
|
pTask->exec.pExecutor = NULL;
|
|
}
|
|
|
|
if (pTask->exec.pWalReader != NULL) {
|
|
walCloseReader(pTask->exec.pWalReader);
|
|
}
|
|
|
|
streamClearChkptReadyMsg(pTask->chkInfo.pActiveInfo);
|
|
|
|
if (pTask->msgInfo.pData != NULL) {
|
|
clearBufferedDispatchMsg(pTask);
|
|
}
|
|
|
|
if (pTask->outputInfo.type == TASK_OUTPUT__TABLE) {
|
|
tDeleteSchemaWrapper(pTask->outputInfo.tbSink.pSchemaWrapper);
|
|
taosMemoryFree(pTask->outputInfo.tbSink.pTSchema);
|
|
tSimpleHashCleanup(pTask->outputInfo.tbSink.pTblInfo);
|
|
tDeleteSchemaWrapper(pTask->outputInfo.tbSink.pTagSchema);
|
|
} else if (pTask->outputInfo.type == TASK_OUTPUT__SHUFFLE_DISPATCH) {
|
|
taosArrayDestroy(pTask->outputInfo.shuffleDispatcher.dbInfo.pVgroupInfos);
|
|
}
|
|
|
|
streamTaskCleanupCheckInfo(&pTask->taskCheckInfo);
|
|
streamFreeTaskState(pTask, pTask->status.removeBackendFiles ? 1 : 0);
|
|
|
|
if (pTask->pNameMap) {
|
|
tSimpleHashCleanup(pTask->pNameMap);
|
|
}
|
|
|
|
streamDestroyStateMachine(pTask->status.pSM);
|
|
pTask->status.pSM = NULL;
|
|
|
|
streamTaskDestroyUpstreamInfo(&pTask->upstreamInfo);
|
|
|
|
taosMemoryFree(pTask->outputInfo.pTokenBucket);
|
|
streamMutexDestroy(&pTask->lock);
|
|
|
|
taosArrayDestroy(pTask->msgInfo.pSendInfo);
|
|
pTask->msgInfo.pSendInfo = NULL;
|
|
streamMutexDestroy(&pTask->msgInfo.lock);
|
|
|
|
taosArrayDestroy(pTask->outputInfo.pNodeEpsetUpdateList);
|
|
pTask->outputInfo.pNodeEpsetUpdateList = NULL;
|
|
|
|
if (pTask->id.idStr != NULL) {
|
|
taosMemoryFree((void*)pTask->id.idStr);
|
|
}
|
|
|
|
streamTaskDestroyActiveChkptInfo(pTask->chkInfo.pActiveInfo);
|
|
pTask->chkInfo.pActiveInfo = NULL;
|
|
|
|
taosMemoryFree(pTask);
|
|
stDebug("s-task:0x%x free task completed", taskId);
|
|
}
|
|
|
|
void streamFreeTaskState(SStreamTask* pTask, int8_t remove) {
|
|
if (pTask->pState != NULL) {
|
|
stDebug("s-task:0x%x start to free task state", pTask->id.taskId);
|
|
streamStateClose(pTask->pState, remove);
|
|
|
|
if (remove) taskDbSetClearFileFlag(pTask->pBackend);
|
|
taskDbRemoveRef(pTask->pBackend);
|
|
pTask->pBackend = NULL;
|
|
pTask->pState = NULL;
|
|
} else {
|
|
if (remove) {
|
|
if (pTask->backendPath != NULL) {
|
|
taosRemoveDir(pTask->backendPath);
|
|
}
|
|
}
|
|
}
|
|
|
|
if (pTask->backendPath != NULL) {
|
|
taosMemoryFree(pTask->backendPath);
|
|
pTask->backendPath = NULL;
|
|
}
|
|
}
|
|
|
|
static void setInitialVersionInfo(SStreamTask* pTask, int64_t ver) {
|
|
SCheckpointInfo* pChkInfo = &pTask->chkInfo;
|
|
SDataRange* pRange = &pTask->dataRange;
|
|
|
|
// only set the version info for stream tasks without fill-history task
|
|
if ((pTask->info.fillHistory == 0) && (!HAS_RELATED_FILLHISTORY_TASK(pTask))) {
|
|
pChkInfo->checkpointVer = ver - 1; // only update when generating checkpoint
|
|
pChkInfo->processedVer = ver - 1; // already processed version
|
|
pChkInfo->nextProcessVer = ver; // next processed version
|
|
|
|
pRange->range.maxVer = ver;
|
|
pRange->range.minVer = ver;
|
|
} else {
|
|
// the initial value of processedVer/nextProcessVer/checkpointVer for stream task with related fill-history task
|
|
// is set at the mnode.
|
|
if (pTask->info.fillHistory == 1) {
|
|
pChkInfo->checkpointVer = pRange->range.maxVer;
|
|
pChkInfo->processedVer = pRange->range.maxVer;
|
|
pChkInfo->nextProcessVer = pRange->range.maxVer + 1;
|
|
} else {
|
|
pChkInfo->checkpointVer = pRange->range.minVer - 1;
|
|
pChkInfo->processedVer = pRange->range.minVer - 1;
|
|
pChkInfo->nextProcessVer = pRange->range.minVer;
|
|
|
|
{ // for compatible purpose, remove it later
|
|
if (pRange->range.minVer == 0) {
|
|
pChkInfo->checkpointVer = 0;
|
|
pChkInfo->processedVer = 0;
|
|
pChkInfo->nextProcessVer = 1;
|
|
stDebug("s-task:%s update the processedVer to 0 from -1 due to compatible purpose", pTask->id.idStr);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
int32_t streamTaskSetBackendPath(SStreamTask* pTask) {
|
|
int64_t streamId = 0;
|
|
int32_t taskId = 0;
|
|
|
|
if (pTask->info.fillHistory) {
|
|
streamId = pTask->hTaskInfo.id.taskId;
|
|
taskId = pTask->hTaskInfo.id.taskId;
|
|
} else {
|
|
streamId = pTask->streamTaskId.taskId;
|
|
taskId = pTask->streamTaskId.taskId;
|
|
}
|
|
|
|
char id[128] = {0};
|
|
int32_t nBytes = sprintf(id, "0x%" PRIx64 "-0x%x", streamId, taskId);
|
|
if (nBytes < 0 || nBytes >= sizeof(id)) {
|
|
return TSDB_CODE_OUT_OF_BUFFER;
|
|
}
|
|
|
|
int32_t len = strlen(pTask->pMeta->path);
|
|
pTask->backendPath = (char*)taosMemoryMalloc(len + nBytes + 2);
|
|
if (pTask->backendPath == NULL) {
|
|
return TSDB_CODE_OUT_OF_MEMORY;
|
|
}
|
|
|
|
(void)sprintf(pTask->backendPath, "%s%s%s", pTask->pMeta->path, TD_DIRSEP, id);
|
|
|
|
return 0;
|
|
}
|
|
int32_t streamTaskInit(SStreamTask* pTask, SStreamMeta* pMeta, SMsgCb* pMsgCb, int64_t ver) {
|
|
(void)createStreamTaskIdStr(pTask->id.streamId, pTask->id.taskId, &pTask->id.idStr);
|
|
pTask->refCnt = 1;
|
|
|
|
pTask->inputq.status = TASK_INPUT_STATUS__NORMAL;
|
|
pTask->outputq.status = TASK_OUTPUT_STATUS__NORMAL;
|
|
|
|
int32_t code1 = streamQueueOpen(512 << 10, &pTask->inputq.queue);
|
|
int32_t code2 = streamQueueOpen(512 << 10, &pTask->outputq.queue);
|
|
if (code1 || code2) {
|
|
stError("s-task:%s failed to prepare the input/output queue, initialize task failed", pTask->id.idStr);
|
|
return TSDB_CODE_OUT_OF_MEMORY;
|
|
}
|
|
|
|
pTask->status.schedStatus = TASK_SCHED_STATUS__INACTIVE;
|
|
pTask->status.timerActive = 0;
|
|
|
|
int32_t code = streamCreateStateMachine(pTask);
|
|
if (pTask->status.pSM == NULL || code != TSDB_CODE_SUCCESS) {
|
|
stError("s-task:%s failed create state-machine for stream task, initialization failed, code:%s", pTask->id.idStr,
|
|
tstrerror(code));
|
|
return code;
|
|
}
|
|
|
|
pTask->execInfo.created = taosGetTimestampMs();
|
|
setInitialVersionInfo(pTask, ver);
|
|
|
|
pTask->pMeta = pMeta;
|
|
pTask->pMsgCb = pMsgCb;
|
|
pTask->msgInfo.pSendInfo = taosArrayInit(4, sizeof(SDispatchEntry));
|
|
if (pTask->msgInfo.pSendInfo == NULL) {
|
|
stError("s-task:%s failed to create sendInfo struct for stream task, code:Out of memory", pTask->id.idStr);
|
|
return terrno;
|
|
}
|
|
|
|
code = taosThreadMutexInit(&pTask->msgInfo.lock, NULL);
|
|
if (code) {
|
|
return code;
|
|
}
|
|
|
|
TdThreadMutexAttr attr = {0};
|
|
code = taosThreadMutexAttrInit(&attr);
|
|
if (code != 0) {
|
|
stError("s-task:%s initElapsed mutex attr failed, code:%s", pTask->id.idStr, tstrerror(code));
|
|
return code;
|
|
}
|
|
|
|
code = taosThreadMutexAttrSetType(&attr, PTHREAD_MUTEX_RECURSIVE);
|
|
if (code != 0) {
|
|
stError("s-task:%s set mutex attr recursive, code:%s", pTask->id.idStr, tstrerror(code));
|
|
return code;
|
|
}
|
|
|
|
code = taosThreadMutexInit(&pTask->lock, &attr);
|
|
if (code) {
|
|
return code;
|
|
}
|
|
|
|
code = taosThreadMutexAttrDestroy(&attr);
|
|
if (code) {
|
|
return code;
|
|
}
|
|
|
|
streamTaskOpenAllUpstreamInput(pTask);
|
|
|
|
STaskOutputInfo* pOutputInfo = &pTask->outputInfo;
|
|
pOutputInfo->pTokenBucket = taosMemoryCalloc(1, sizeof(STokenBucket));
|
|
if (pOutputInfo->pTokenBucket == NULL) {
|
|
stError("s-task:%s failed to prepare the tokenBucket, code:%s", pTask->id.idStr,
|
|
tstrerror(TSDB_CODE_OUT_OF_MEMORY));
|
|
return TSDB_CODE_OUT_OF_MEMORY;
|
|
}
|
|
|
|
// 2MiB per second for sink task
|
|
// 50 times sink operator per second
|
|
code = streamTaskInitTokenBucket(pOutputInfo->pTokenBucket, 35, 35, tsSinkDataRate, pTask->id.idStr);
|
|
if (code) {
|
|
return code;
|
|
}
|
|
|
|
pOutputInfo->pNodeEpsetUpdateList = taosArrayInit(4, sizeof(SDownstreamTaskEpset));
|
|
if (pOutputInfo->pNodeEpsetUpdateList == NULL) {
|
|
stError("s-task:%s failed to prepare downstreamUpdateList, code:%s", pTask->id.idStr,
|
|
tstrerror(TSDB_CODE_OUT_OF_MEMORY));
|
|
return TSDB_CODE_OUT_OF_MEMORY;
|
|
}
|
|
|
|
pTask->taskCheckInfo.pList = taosArrayInit(4, sizeof(SDownstreamStatusInfo));
|
|
if (pTask->taskCheckInfo.pList == NULL) {
|
|
stError("s-task:%s failed to prepare taskCheckInfo list, code:%s", pTask->id.idStr,
|
|
tstrerror(TSDB_CODE_OUT_OF_MEMORY));
|
|
return TSDB_CODE_OUT_OF_MEMORY;
|
|
}
|
|
|
|
if (pTask->chkInfo.pActiveInfo == NULL) {
|
|
code = streamTaskCreateActiveChkptInfo(&pTask->chkInfo.pActiveInfo);
|
|
if (code) {
|
|
stError("s-task:%s failed to create active checkpoint info, code:%s", pTask->id.idStr, tstrerror(code));
|
|
return code;
|
|
}
|
|
}
|
|
|
|
return streamTaskSetBackendPath(pTask);
|
|
}
|
|
|
|
int32_t streamTaskGetNumOfDownstream(const SStreamTask* pTask) {
|
|
if (pTask->info.taskLevel == TASK_LEVEL__SINK) {
|
|
return 0;
|
|
}
|
|
|
|
int32_t type = pTask->outputInfo.type;
|
|
if (type == TASK_OUTPUT__TABLE) {
|
|
return 0;
|
|
} else if (type == TASK_OUTPUT__FIXED_DISPATCH) {
|
|
return 1;
|
|
} else {
|
|
SArray* vgInfo = pTask->outputInfo.shuffleDispatcher.dbInfo.pVgroupInfos;
|
|
return taosArrayGetSize(vgInfo);
|
|
}
|
|
}
|
|
|
|
int32_t streamTaskGetNumOfUpstream(const SStreamTask* pTask) { return taosArrayGetSize(pTask->upstreamInfo.pList); }
|
|
|
|
int32_t streamTaskSetUpstreamInfo(SStreamTask* pTask, const SStreamTask* pUpstreamTask) {
|
|
SStreamUpstreamEpInfo* pEpInfo = createStreamTaskEpInfo(pUpstreamTask);
|
|
if (pEpInfo == NULL) {
|
|
return TSDB_CODE_OUT_OF_MEMORY;
|
|
}
|
|
|
|
if (pTask->upstreamInfo.pList == NULL) {
|
|
pTask->upstreamInfo.pList = taosArrayInit(4, POINTER_BYTES);
|
|
}
|
|
|
|
void* p = taosArrayPush(pTask->upstreamInfo.pList, &pEpInfo);
|
|
return (p == NULL) ? TSDB_CODE_OUT_OF_MEMORY : TSDB_CODE_SUCCESS;
|
|
}
|
|
|
|
void streamTaskUpdateUpstreamInfo(SStreamTask* pTask, int32_t nodeId, const SEpSet* pEpSet, bool* pUpdated) {
|
|
char buf[512] = {0};
|
|
(void)epsetToStr(pEpSet, buf, tListLen(buf)); // ignore error since it is only for log file.
|
|
|
|
int32_t numOfUpstream = taosArrayGetSize(pTask->upstreamInfo.pList);
|
|
for (int32_t i = 0; i < numOfUpstream; ++i) {
|
|
SStreamUpstreamEpInfo* pInfo = taosArrayGetP(pTask->upstreamInfo.pList, i);
|
|
if (pInfo->nodeId == nodeId) {
|
|
bool equal = isEpsetEqual(&pInfo->epSet, pEpSet);
|
|
if (!equal) {
|
|
*pUpdated = true;
|
|
|
|
char tmp[512] = {0};
|
|
(void)epsetToStr(&pInfo->epSet, tmp, tListLen(tmp));
|
|
|
|
epsetAssign(&pInfo->epSet, pEpSet);
|
|
stDebug("s-task:0x%x update the upstreamInfo taskId:0x%x(nodeId:%d) newEpset:%s old:%s", pTask->id.taskId,
|
|
pInfo->taskId, nodeId, buf, tmp);
|
|
} else {
|
|
stDebug("s-task:0x%x not update upstreamInfo, since identical, task:0x%x(nodeId:%d) epset:%s", pTask->id.taskId,
|
|
pInfo->taskId, nodeId, buf);
|
|
}
|
|
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
void streamTaskDestroyUpstreamInfo(SUpstreamInfo* pUpstreamInfo) {
|
|
if (pUpstreamInfo->pList != NULL) {
|
|
taosArrayDestroyEx(pUpstreamInfo->pList, freeUpstreamItem);
|
|
pUpstreamInfo->numOfClosed = 0;
|
|
pUpstreamInfo->pList = NULL;
|
|
}
|
|
}
|
|
|
|
void streamTaskSetFixedDownstreamInfo(SStreamTask* pTask, const SStreamTask* pDownstreamTask) {
|
|
STaskDispatcherFixed* pDispatcher = &pTask->outputInfo.fixedDispatcher;
|
|
pDispatcher->taskId = pDownstreamTask->id.taskId;
|
|
pDispatcher->nodeId = pDownstreamTask->info.nodeId;
|
|
pDispatcher->epSet = pDownstreamTask->info.epSet;
|
|
|
|
pTask->outputInfo.type = TASK_OUTPUT__FIXED_DISPATCH;
|
|
pTask->msgInfo.msgType = TDMT_STREAM_TASK_DISPATCH;
|
|
}
|
|
|
|
void streamTaskUpdateDownstreamInfo(SStreamTask* pTask, int32_t nodeId, const SEpSet* pEpSet, bool* pUpdated) {
|
|
char buf[512] = {0};
|
|
(void)epsetToStr(pEpSet, buf, tListLen(buf)); // ignore the error since only for log files.
|
|
|
|
int32_t id = pTask->id.taskId;
|
|
int8_t type = pTask->outputInfo.type;
|
|
|
|
if (type == TASK_OUTPUT__SHUFFLE_DISPATCH) {
|
|
SArray* pVgs = pTask->outputInfo.shuffleDispatcher.dbInfo.pVgroupInfos;
|
|
|
|
for (int32_t i = 0; i < taosArrayGetSize(pVgs); i++) {
|
|
SVgroupInfo* pVgInfo = taosArrayGet(pVgs, i);
|
|
if (pVgInfo == NULL) {
|
|
continue;
|
|
}
|
|
|
|
if (pVgInfo->vgId == nodeId) {
|
|
bool isEqual = isEpsetEqual(&pVgInfo->epSet, pEpSet);
|
|
if (!isEqual) {
|
|
*pUpdated = true;
|
|
char tmp[512] = {0};
|
|
(void)epsetToStr(&pVgInfo->epSet, tmp, tListLen(tmp));
|
|
|
|
epsetAssign(&pVgInfo->epSet, pEpSet);
|
|
stDebug("s-task:0x%x update dispatch info, task:0x%x(nodeId:%d) newEpset:%s old:%s", id, pVgInfo->taskId,
|
|
nodeId, buf, tmp);
|
|
} else {
|
|
stDebug("s-task:0x%x not update dispatch info, since identical, task:0x%x(nodeId:%d) epset:%s", id,
|
|
pVgInfo->taskId, nodeId, buf);
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
} else if (type == TASK_OUTPUT__FIXED_DISPATCH) {
|
|
STaskDispatcherFixed* pDispatcher = &pTask->outputInfo.fixedDispatcher;
|
|
if (pDispatcher->nodeId == nodeId) {
|
|
bool equal = isEpsetEqual(&pDispatcher->epSet, pEpSet);
|
|
if (!equal) {
|
|
*pUpdated = true;
|
|
|
|
char tmp[512] = {0};
|
|
(void)epsetToStr(&pDispatcher->epSet, tmp, tListLen(tmp));
|
|
|
|
epsetAssign(&pDispatcher->epSet, pEpSet);
|
|
stDebug("s-task:0x%x update dispatch info, task:0x%x(nodeId:%d) newEpset:%s old:%s", id, pDispatcher->taskId,
|
|
nodeId, buf, tmp);
|
|
} else {
|
|
stDebug("s-task:0x%x not update dispatch info, since identical, task:0x%x(nodeId:%d) epset:%s", id,
|
|
pDispatcher->taskId, nodeId, buf);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
int32_t streamTaskStop(SStreamTask* pTask) {
|
|
int32_t vgId = pTask->pMeta->vgId;
|
|
int64_t st = taosGetTimestampMs();
|
|
const char* id = pTask->id.idStr;
|
|
|
|
int32_t code = streamTaskHandleEvent(pTask->status.pSM, TASK_EVENT_STOP);
|
|
if (code) {
|
|
stError("failed to handle STOP event, s-task:%s", id);
|
|
}
|
|
|
|
if (pTask->info.taskLevel != TASK_LEVEL__SINK && pTask->exec.pExecutor != NULL) {
|
|
code = qKillTask(pTask->exec.pExecutor, TSDB_CODE_SUCCESS);
|
|
if (code != TSDB_CODE_SUCCESS) {
|
|
stError("s-task:%s failed to kill task related query handle", id);
|
|
}
|
|
}
|
|
|
|
while (!streamTaskIsIdle(pTask)) {
|
|
stDebug("s-task:%s level:%d wait for task to be idle and then close, check again in 100ms", id,
|
|
pTask->info.taskLevel);
|
|
taosMsleep(100);
|
|
}
|
|
|
|
int64_t el = taosGetTimestampMs() - st;
|
|
stDebug("vgId:%d s-task:%s is closed in %" PRId64 " ms", vgId, id, el);
|
|
return code;
|
|
}
|
|
|
|
bool streamTaskUpdateEpsetInfo(SStreamTask* pTask, SArray* pNodeList) {
|
|
STaskExecStatisInfo* p = &pTask->execInfo;
|
|
|
|
int32_t numOfNodes = taosArrayGetSize(pNodeList);
|
|
int64_t prevTs = p->latestUpdateTs;
|
|
|
|
p->latestUpdateTs = taosGetTimestampMs();
|
|
p->updateCount += 1;
|
|
stDebug("s-task:0x%x update task nodeEp epset, updatedNodes:%d, updateCount:%d, prevTs:%" PRId64, pTask->id.taskId,
|
|
numOfNodes, p->updateCount, prevTs);
|
|
|
|
bool updated = false;
|
|
for (int32_t i = 0; i < numOfNodes; ++i) {
|
|
SNodeUpdateInfo* pInfo = taosArrayGet(pNodeList, i);
|
|
if (pInfo == NULL) {
|
|
continue;
|
|
}
|
|
|
|
int32_t code = doUpdateTaskEpset(pTask, pInfo->nodeId, &pInfo->newEp, &updated);
|
|
if (code) {
|
|
stError("s-task:0x%x failed to update the task nodeEp epset, code:%s", pTask->id.taskId, tstrerror(code));
|
|
}
|
|
}
|
|
|
|
return updated;
|
|
}
|
|
|
|
void streamTaskResetUpstreamStageInfo(SStreamTask* pTask) {
|
|
if (pTask->info.taskLevel == TASK_LEVEL__SOURCE) {
|
|
return;
|
|
}
|
|
|
|
int32_t size = taosArrayGetSize(pTask->upstreamInfo.pList);
|
|
for (int32_t i = 0; i < size; ++i) {
|
|
SStreamUpstreamEpInfo* pInfo = taosArrayGetP(pTask->upstreamInfo.pList, i);
|
|
pInfo->stage = -1;
|
|
}
|
|
|
|
stDebug("s-task:%s reset all upstream tasks stage info", pTask->id.idStr);
|
|
}
|
|
|
|
void streamTaskOpenAllUpstreamInput(SStreamTask* pTask) {
|
|
int32_t num = taosArrayGetSize(pTask->upstreamInfo.pList);
|
|
if (num == 0) {
|
|
return;
|
|
}
|
|
|
|
for (int32_t i = 0; i < num; ++i) {
|
|
SStreamUpstreamEpInfo* pInfo = taosArrayGetP(pTask->upstreamInfo.pList, i);
|
|
pInfo->dataAllowed = true;
|
|
}
|
|
|
|
pTask->upstreamInfo.numOfClosed = 0;
|
|
stDebug("s-task:%s opening up inputQ for %d upstream tasks", pTask->id.idStr, num);
|
|
}
|
|
|
|
void streamTaskCloseUpstreamInput(SStreamTask* pTask, int32_t taskId) {
|
|
SStreamUpstreamEpInfo* pInfo = NULL;
|
|
streamTaskGetUpstreamTaskEpInfo(pTask, taskId, &pInfo);
|
|
|
|
if ((pInfo != NULL) && pInfo->dataAllowed) {
|
|
pInfo->dataAllowed = false;
|
|
int32_t t = atomic_add_fetch_32(&pTask->upstreamInfo.numOfClosed, 1);
|
|
ASSERT(t <= streamTaskGetNumOfUpstream(pTask));
|
|
}
|
|
}
|
|
|
|
void streamTaskOpenUpstreamInput(SStreamTask* pTask, int32_t taskId) {
|
|
SStreamUpstreamEpInfo* pInfo = NULL;
|
|
streamTaskGetUpstreamTaskEpInfo(pTask, taskId, &pInfo);
|
|
|
|
if (pInfo != NULL && (!pInfo->dataAllowed)) {
|
|
int32_t t = atomic_sub_fetch_32(&pTask->upstreamInfo.numOfClosed, 1);
|
|
ASSERT(t >= 0);
|
|
pInfo->dataAllowed = true;
|
|
}
|
|
}
|
|
|
|
bool streamTaskIsAllUpstreamClosed(SStreamTask* pTask) {
|
|
return pTask->upstreamInfo.numOfClosed == taosArrayGetSize(pTask->upstreamInfo.pList);
|
|
}
|
|
|
|
bool streamTaskSetSchedStatusWait(SStreamTask* pTask) {
|
|
bool ret = false;
|
|
|
|
streamMutexLock(&pTask->lock);
|
|
if (pTask->status.schedStatus == TASK_SCHED_STATUS__INACTIVE) {
|
|
pTask->status.schedStatus = TASK_SCHED_STATUS__WAITING;
|
|
ret = true;
|
|
}
|
|
streamMutexUnlock(&pTask->lock);
|
|
|
|
return ret;
|
|
}
|
|
|
|
int8_t streamTaskSetSchedStatusActive(SStreamTask* pTask) {
|
|
streamMutexLock(&pTask->lock);
|
|
int8_t status = pTask->status.schedStatus;
|
|
if (status == TASK_SCHED_STATUS__WAITING) {
|
|
pTask->status.schedStatus = TASK_SCHED_STATUS__ACTIVE;
|
|
}
|
|
streamMutexUnlock(&pTask->lock);
|
|
|
|
return status;
|
|
}
|
|
|
|
int8_t streamTaskSetSchedStatusInactive(SStreamTask* pTask) {
|
|
streamMutexLock(&pTask->lock);
|
|
int8_t status = pTask->status.schedStatus;
|
|
ASSERT(status == TASK_SCHED_STATUS__WAITING || status == TASK_SCHED_STATUS__ACTIVE ||
|
|
status == TASK_SCHED_STATUS__INACTIVE);
|
|
pTask->status.schedStatus = TASK_SCHED_STATUS__INACTIVE;
|
|
streamMutexUnlock(&pTask->lock);
|
|
|
|
return status;
|
|
}
|
|
|
|
int32_t streamTaskClearHTaskAttr(SStreamTask* pTask, int32_t resetRelHalt) {
|
|
int32_t code = 0;
|
|
SStreamMeta* pMeta = pTask->pMeta;
|
|
STaskId sTaskId = {.streamId = pTask->streamTaskId.streamId, .taskId = pTask->streamTaskId.taskId};
|
|
if (pTask->info.fillHistory == 0) {
|
|
return code;
|
|
}
|
|
|
|
SStreamTask** ppStreamTask = (SStreamTask**)taosHashGet(pMeta->pTasksMap, &sTaskId, sizeof(sTaskId));
|
|
if (ppStreamTask != NULL) {
|
|
stDebug("s-task:%s clear the related stream task:0x%x attr to fill-history task", pTask->id.idStr,
|
|
(int32_t)sTaskId.taskId);
|
|
|
|
streamMutexLock(&(*ppStreamTask)->lock);
|
|
CLEAR_RELATED_FILLHISTORY_TASK((*ppStreamTask));
|
|
|
|
if (resetRelHalt) {
|
|
stDebug("s-task:0x%" PRIx64 " set the persistent status attr to be ready, prev:%s, status in sm:%s",
|
|
sTaskId.taskId, streamTaskGetStatusStr((*ppStreamTask)->status.taskStatus),
|
|
streamTaskGetStatus(*ppStreamTask).name);
|
|
(*ppStreamTask)->status.taskStatus = TASK_STATUS__READY;
|
|
}
|
|
|
|
code = streamMetaSaveTask(pMeta, *ppStreamTask);
|
|
streamMutexUnlock(&(*ppStreamTask)->lock);
|
|
}
|
|
|
|
return code;
|
|
}
|
|
|
|
int32_t streamBuildAndSendDropTaskMsg(SMsgCb* pMsgCb, int32_t vgId, SStreamTaskId* pTaskId, int64_t resetRelHalt) {
|
|
SVDropStreamTaskReq* pReq = rpcMallocCont(sizeof(SVDropStreamTaskReq));
|
|
if (pReq == NULL) {
|
|
return terrno;
|
|
}
|
|
|
|
pReq->head.vgId = vgId;
|
|
pReq->taskId = pTaskId->taskId;
|
|
pReq->streamId = pTaskId->streamId;
|
|
pReq->resetRelHalt = resetRelHalt; // todo: remove this attribute
|
|
|
|
SRpcMsg msg = {.msgType = TDMT_STREAM_TASK_DROP, .pCont = pReq, .contLen = sizeof(SVDropStreamTaskReq)};
|
|
int32_t code = tmsgPutToQueue(pMsgCb, WRITE_QUEUE, &msg);
|
|
if (code != TSDB_CODE_SUCCESS) {
|
|
stError("vgId:%d failed to send drop task:0x%x msg, code:%s", vgId, pTaskId->taskId, tstrerror(code));
|
|
} else {
|
|
stDebug("vgId:%d build and send drop task:0x%x msg", vgId, pTaskId->taskId);
|
|
}
|
|
|
|
return code;
|
|
}
|
|
|
|
int32_t streamSendChkptReportMsg(SStreamTask* pTask, SCheckpointInfo* pCheckpointInfo, int8_t dropRelHTask) {
|
|
int32_t code;
|
|
int32_t tlen = 0;
|
|
int32_t vgId = pTask->pMeta->vgId;
|
|
const char* id = pTask->id.idStr;
|
|
SActiveCheckpointInfo* pActive = pCheckpointInfo->pActiveInfo;
|
|
|
|
SCheckpointReport req = {.streamId = pTask->id.streamId,
|
|
.taskId = pTask->id.taskId,
|
|
.nodeId = vgId,
|
|
.dropHTask = dropRelHTask,
|
|
.transId = pActive->transId,
|
|
.checkpointId = pActive->activeId,
|
|
.checkpointVer = pCheckpointInfo->processedVer,
|
|
.checkpointTs = pCheckpointInfo->startTs};
|
|
|
|
tEncodeSize(tEncodeStreamTaskChkptReport, &req, tlen, code);
|
|
if (code < 0) {
|
|
stError("s-task:%s vgId:%d encode stream task checkpoint-report failed, code:%s", id, vgId, tstrerror(code));
|
|
return -1;
|
|
}
|
|
|
|
void* buf = rpcMallocCont(tlen);
|
|
if (buf == NULL) {
|
|
stError("s-task:%s vgId:%d encode stream task checkpoint-report msg failed, code:%s", id, vgId,
|
|
tstrerror(TSDB_CODE_OUT_OF_MEMORY));
|
|
return -1;
|
|
}
|
|
|
|
SEncoder encoder;
|
|
tEncoderInit(&encoder, buf, tlen);
|
|
if ((code = tEncodeStreamTaskChkptReport(&encoder, &req)) < 0) {
|
|
rpcFreeCont(buf);
|
|
stError("s-task:%s vgId:%d encode stream task checkpoint-report msg failed, code:%s", id, vgId, tstrerror(code));
|
|
return -1;
|
|
}
|
|
tEncoderClear(&encoder);
|
|
|
|
SRpcMsg msg = {0};
|
|
initRpcMsg(&msg, TDMT_MND_STREAM_CHKPT_REPORT, buf, tlen);
|
|
stDebug("s-task:%s vgId:%d build and send task checkpoint-report to mnode", id, vgId);
|
|
|
|
return tmsgSendReq(&pTask->info.mnodeEpset, &msg);
|
|
}
|
|
|
|
STaskId streamTaskGetTaskId(const SStreamTask* pTask) {
|
|
STaskId id = {.streamId = pTask->id.streamId, .taskId = pTask->id.taskId};
|
|
return id;
|
|
}
|
|
|
|
void streamTaskInitForLaunchHTask(SHistoryTaskInfo* pInfo) {
|
|
pInfo->waitInterval = LAUNCH_HTASK_INTERVAL;
|
|
pInfo->tickCount = ceil(LAUNCH_HTASK_INTERVAL / WAIT_FOR_MINIMAL_INTERVAL);
|
|
pInfo->retryTimes = 0;
|
|
}
|
|
|
|
void streamTaskSetRetryInfoForLaunch(SHistoryTaskInfo* pInfo) {
|
|
ASSERT(pInfo->tickCount == 0);
|
|
|
|
pInfo->waitInterval *= RETRY_LAUNCH_INTERVAL_INC_RATE;
|
|
pInfo->tickCount = ceil(pInfo->waitInterval / WAIT_FOR_MINIMAL_INTERVAL);
|
|
pInfo->retryTimes += 1;
|
|
}
|
|
|
|
void streamTaskStatusInit(STaskStatusEntry* pEntry, const SStreamTask* pTask) {
|
|
pEntry->id.streamId = pTask->id.streamId;
|
|
pEntry->id.taskId = pTask->id.taskId;
|
|
pEntry->stage = -1;
|
|
pEntry->nodeId = pTask->info.nodeId;
|
|
pEntry->status = TASK_STATUS__STOP;
|
|
}
|
|
|
|
void streamTaskStatusCopy(STaskStatusEntry* pDst, const STaskStatusEntry* pSrc) {
|
|
pDst->stage = pSrc->stage;
|
|
pDst->inputQUsed = pSrc->inputQUsed;
|
|
pDst->inputRate = pSrc->inputRate;
|
|
pDst->procsTotal = pSrc->procsTotal;
|
|
pDst->procsThroughput = pSrc->procsThroughput;
|
|
pDst->outputTotal = pSrc->outputTotal;
|
|
pDst->outputThroughput = pSrc->outputThroughput;
|
|
pDst->processedVer = pSrc->processedVer;
|
|
pDst->verRange = pSrc->verRange;
|
|
pDst->sinkQuota = pSrc->sinkQuota;
|
|
pDst->sinkDataSize = pSrc->sinkDataSize;
|
|
pDst->checkpointInfo = pSrc->checkpointInfo;
|
|
pDst->startCheckpointId = pSrc->startCheckpointId;
|
|
pDst->startCheckpointVer = pSrc->startCheckpointVer;
|
|
pDst->status = pSrc->status;
|
|
|
|
pDst->startTime = pSrc->startTime;
|
|
pDst->hTaskId = pSrc->hTaskId;
|
|
}
|
|
|
|
STaskStatusEntry streamTaskGetStatusEntry(SStreamTask* pTask) {
|
|
SStreamMeta* pMeta = pTask->pMeta;
|
|
STaskExecStatisInfo* pExecInfo = &pTask->execInfo;
|
|
|
|
STaskStatusEntry entry = {
|
|
.id = streamTaskGetTaskId(pTask),
|
|
.status = streamTaskGetStatus(pTask).state,
|
|
.nodeId = pMeta->vgId,
|
|
.stage = pMeta->stage,
|
|
|
|
.inputQUsed = SIZE_IN_MiB(streamQueueGetItemSize(pTask->inputq.queue)),
|
|
.startTime = pExecInfo->readyTs,
|
|
.checkpointInfo.latestId = pTask->chkInfo.checkpointId,
|
|
.checkpointInfo.latestVer = pTask->chkInfo.checkpointVer,
|
|
.checkpointInfo.latestTime = pTask->chkInfo.checkpointTime,
|
|
.checkpointInfo.latestSize = 0,
|
|
.checkpointInfo.remoteBackup = 0,
|
|
.checkpointInfo.consensusChkptId = 0,
|
|
.checkpointInfo.consensusTs = taosGetTimestampMs(),
|
|
.hTaskId = pTask->hTaskInfo.id.taskId,
|
|
.procsTotal = SIZE_IN_MiB(pExecInfo->inputDataSize),
|
|
.outputTotal = SIZE_IN_MiB(pExecInfo->outputDataSize),
|
|
.procsThroughput = SIZE_IN_KiB(pExecInfo->procsThroughput),
|
|
.outputThroughput = SIZE_IN_KiB(pExecInfo->outputThroughput),
|
|
.startCheckpointId = pExecInfo->startCheckpointId,
|
|
.startCheckpointVer = pExecInfo->startCheckpointVer,
|
|
};
|
|
return entry;
|
|
}
|
|
|
|
static int32_t taskPauseCallback(SStreamTask* pTask, void* param) {
|
|
SStreamMeta* pMeta = pTask->pMeta;
|
|
int32_t code = 0;
|
|
|
|
int32_t num = atomic_add_fetch_32(&pMeta->numOfPausedTasks, 1);
|
|
stInfo("vgId:%d s-task:%s pause stream task. paused task num:%d", pMeta->vgId, pTask->id.idStr, num);
|
|
|
|
// in case of fill-history task, stop the tsdb file scan operation.
|
|
if (pTask->info.fillHistory == 1) {
|
|
void* pExecutor = pTask->exec.pExecutor;
|
|
code = qKillTask(pExecutor, TSDB_CODE_SUCCESS);
|
|
}
|
|
|
|
stDebug("vgId:%d s-task:%s set pause flag and pause task", pMeta->vgId, pTask->id.idStr);
|
|
return code;
|
|
}
|
|
|
|
void streamTaskPause(SStreamTask* pTask) {
|
|
(void)streamTaskHandleEventAsync(pTask->status.pSM, TASK_EVENT_PAUSE, taskPauseCallback, NULL);
|
|
}
|
|
|
|
void streamTaskResume(SStreamTask* pTask) {
|
|
SStreamTaskState prevState = streamTaskGetStatus(pTask);
|
|
|
|
SStreamMeta* pMeta = pTask->pMeta;
|
|
int32_t code = streamTaskRestoreStatus(pTask);
|
|
if (code == TSDB_CODE_SUCCESS) {
|
|
char* pNew = streamTaskGetStatus(pTask).name;
|
|
int32_t num = atomic_sub_fetch_32(&pMeta->numOfPausedTasks, 1);
|
|
stInfo("s-task:%s status:%s resume from %s, paused task(s):%d", pTask->id.idStr, pNew, prevState.name, num);
|
|
} else {
|
|
stInfo("s-task:%s status:%s no need to resume, paused task(s):%d", pTask->id.idStr, prevState.name,
|
|
pMeta->numOfPausedTasks);
|
|
}
|
|
}
|
|
|
|
bool streamTaskIsSinkTask(const SStreamTask* pTask) { return pTask->info.taskLevel == TASK_LEVEL__SINK; }
|
|
|
|
// this task must success
|
|
int32_t streamTaskSendCheckpointReq(SStreamTask* pTask) {
|
|
int32_t code;
|
|
int32_t tlen = 0;
|
|
int32_t vgId = pTask->pMeta->vgId;
|
|
const char* id = pTask->id.idStr;
|
|
|
|
SStreamTaskCheckpointReq req = {.streamId = pTask->id.streamId, .taskId = pTask->id.taskId, .nodeId = vgId};
|
|
tEncodeSize(tEncodeStreamTaskCheckpointReq, &req, tlen, code);
|
|
if (code < 0) {
|
|
stError("s-task:%s vgId:%d encode stream task req checkpoint failed, code:%s", id, vgId, tstrerror(code));
|
|
return -1;
|
|
}
|
|
|
|
void* buf = rpcMallocCont(tlen);
|
|
if (buf == NULL) {
|
|
stError("s-task:%s vgId:%d encode stream task req checkpoint msg failed, code:%s", id, vgId,
|
|
tstrerror(TSDB_CODE_OUT_OF_MEMORY));
|
|
return -1;
|
|
}
|
|
|
|
SEncoder encoder;
|
|
tEncoderInit(&encoder, buf, tlen);
|
|
if ((code = tEncodeStreamTaskCheckpointReq(&encoder, &req)) < 0) {
|
|
rpcFreeCont(buf);
|
|
stError("s-task:%s vgId:%d encode stream task req checkpoint msg failed, code:%s", id, vgId, tstrerror(code));
|
|
return -1;
|
|
}
|
|
tEncoderClear(&encoder);
|
|
|
|
SRpcMsg msg = {0};
|
|
initRpcMsg(&msg, TDMT_MND_STREAM_REQ_CHKPT, buf, tlen);
|
|
stDebug("s-task:%s vgId:%d build and send task checkpoint req", id, vgId);
|
|
|
|
return tmsgSendReq(&pTask->info.mnodeEpset, &msg);
|
|
}
|
|
|
|
void streamTaskGetUpstreamTaskEpInfo(SStreamTask* pTask, int32_t taskId, SStreamUpstreamEpInfo** pEpInfo) {
|
|
*pEpInfo = NULL;
|
|
|
|
int32_t num = taosArrayGetSize(pTask->upstreamInfo.pList);
|
|
for (int32_t i = 0; i < num; ++i) {
|
|
SStreamUpstreamEpInfo* pInfo = taosArrayGetP(pTask->upstreamInfo.pList, i);
|
|
if (pInfo == NULL) {
|
|
return;
|
|
}
|
|
|
|
if (pInfo->taskId == taskId) {
|
|
*pEpInfo = pInfo;
|
|
return;
|
|
}
|
|
}
|
|
|
|
stError("s-task:%s failed to find upstream task:0x%x", pTask->id.idStr, taskId);
|
|
}
|
|
|
|
SEpSet* streamTaskGetDownstreamEpInfo(SStreamTask* pTask, int32_t taskId) {
|
|
if (pTask->info.taskLevel == TASK_OUTPUT__FIXED_DISPATCH) {
|
|
if (pTask->outputInfo.fixedDispatcher.taskId == taskId) {
|
|
return &pTask->outputInfo.fixedDispatcher.epSet;
|
|
}
|
|
} else if (pTask->info.taskLevel == TASK_OUTPUT__SHUFFLE_DISPATCH) {
|
|
SArray* pList = pTask->outputInfo.shuffleDispatcher.dbInfo.pVgroupInfos;
|
|
for (int32_t i = 0; i < taosArrayGetSize(pList); ++i) {
|
|
SVgroupInfo* pVgInfo = taosArrayGet(pList, i);
|
|
if (pVgInfo == NULL) {
|
|
continue;
|
|
}
|
|
|
|
if (pVgInfo->taskId == taskId) {
|
|
return &pVgInfo->epSet;
|
|
}
|
|
}
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
int32_t createStreamTaskIdStr(int64_t streamId, int32_t taskId, const char** pId) {
|
|
char buf[128] = {0};
|
|
sprintf(buf, "0x%" PRIx64 "-0x%x", streamId, taskId);
|
|
*pId = taosStrdup(buf);
|
|
|
|
if (*pId == NULL) {
|
|
return TSDB_CODE_OUT_OF_MEMORY;
|
|
} else {
|
|
return TSDB_CODE_SUCCESS;
|
|
}
|
|
}
|
|
|
|
static int32_t streamTaskEnqueueRetrieve(SStreamTask* pTask, SStreamRetrieveReq* pReq) {
|
|
int32_t code;
|
|
SStreamDataBlock* pData;
|
|
|
|
code = taosAllocateQitem(sizeof(SStreamDataBlock), DEF_QITEM, sizeof(SStreamDataBlock), (void**)&pData);
|
|
if (code) {
|
|
stError("s-task:%s failed to allocated retrieve-block", pTask->id.idStr);
|
|
return terrno = code;
|
|
}
|
|
|
|
// enqueue
|
|
stDebug("s-task:%s (vgId:%d level:%d) recv retrieve req from task:0x%x(vgId:%d),QID:0x%" PRIx64, pTask->id.idStr,
|
|
pTask->pMeta->vgId, pTask->info.taskLevel, pReq->srcTaskId, pReq->srcNodeId, pReq->reqId);
|
|
|
|
pData->type = STREAM_INPUT__DATA_RETRIEVE;
|
|
pData->srcVgId = 0;
|
|
|
|
code = streamRetrieveReqToData(pReq, pData, pTask->id.idStr);
|
|
if (code != TSDB_CODE_SUCCESS) {
|
|
taosFreeQitem(pData);
|
|
return code;
|
|
}
|
|
|
|
code = streamTaskPutDataIntoInputQ(pTask, (SStreamQueueItem*)pData);
|
|
if (code != TSDB_CODE_SUCCESS) {
|
|
stError("s-task:%s failed to put retrieve-block into inputQ, inputQ is full, discard the retrieve msg",
|
|
pTask->id.idStr);
|
|
}
|
|
|
|
return code;
|
|
}
|
|
|
|
int32_t streamProcessRetrieveReq(SStreamTask* pTask, SStreamRetrieveReq* pReq) {
|
|
int32_t code = streamTaskEnqueueRetrieve(pTask, pReq);
|
|
if (code != 0) {
|
|
return code;
|
|
}
|
|
return streamTrySchedExec(pTask);
|
|
}
|
|
|
|
void streamTaskSetRemoveBackendFiles(SStreamTask* pTask) { pTask->status.removeBackendFiles = true; }
|
|
|
|
void streamTaskGetActiveCheckpointInfo(const SStreamTask* pTask, int32_t* pTransId, int64_t* pCheckpointId) {
|
|
if (pTransId != NULL) {
|
|
*pTransId = pTask->chkInfo.pActiveInfo->transId;
|
|
}
|
|
|
|
if (pCheckpointId != NULL) {
|
|
*pCheckpointId = pTask->chkInfo.pActiveInfo->activeId;
|
|
}
|
|
}
|
|
|
|
int32_t streamTaskSetActiveCheckpointInfo(SStreamTask* pTask, int64_t activeCheckpointId) {
|
|
pTask->chkInfo.pActiveInfo->activeId = activeCheckpointId;
|
|
return TSDB_CODE_SUCCESS;
|
|
}
|
|
|
|
void streamTaskSetFailedChkptInfo(SStreamTask* pTask, int32_t transId, int64_t checkpointId) {
|
|
pTask->chkInfo.pActiveInfo->transId = transId;
|
|
pTask->chkInfo.pActiveInfo->activeId = checkpointId;
|
|
pTask->chkInfo.pActiveInfo->failedId = checkpointId;
|
|
}
|
|
|
|
int32_t streamTaskCreateActiveChkptInfo(SActiveCheckpointInfo** pRes) {
|
|
SActiveCheckpointInfo* pInfo = taosMemoryCalloc(1, sizeof(SActiveCheckpointInfo));
|
|
if (pInfo == NULL) {
|
|
return TSDB_CODE_OUT_OF_MEMORY;
|
|
}
|
|
|
|
int32_t code = taosThreadMutexInit(&pInfo->lock, NULL);
|
|
if (code != TSDB_CODE_SUCCESS) {
|
|
return code;
|
|
}
|
|
|
|
pInfo->pDispatchTriggerList = taosArrayInit(4, sizeof(STaskTriggerSendInfo));
|
|
pInfo->pReadyMsgList = taosArrayInit(4, sizeof(STaskCheckpointReadyInfo));
|
|
pInfo->pCheckpointReadyRecvList = taosArrayInit(4, sizeof(STaskDownstreamReadyInfo));
|
|
|
|
*pRes = pInfo;
|
|
return code;
|
|
}
|
|
|
|
void streamTaskDestroyActiveChkptInfo(SActiveCheckpointInfo* pInfo) {
|
|
if (pInfo == NULL) {
|
|
return;
|
|
}
|
|
|
|
streamMutexDestroy(&pInfo->lock);
|
|
taosArrayDestroy(pInfo->pDispatchTriggerList);
|
|
pInfo->pDispatchTriggerList = NULL;
|
|
taosArrayDestroy(pInfo->pReadyMsgList);
|
|
pInfo->pReadyMsgList = NULL;
|
|
taosArrayDestroy(pInfo->pCheckpointReadyRecvList);
|
|
pInfo->pCheckpointReadyRecvList = NULL;
|
|
|
|
SStreamTmrInfo* pTriggerTmr = &pInfo->chkptTriggerMsgTmr;
|
|
if (pTriggerTmr->tmrHandle != NULL) {
|
|
(void)taosTmrStop(pTriggerTmr->tmrHandle);
|
|
pTriggerTmr->tmrHandle = NULL;
|
|
}
|
|
|
|
SStreamTmrInfo* pReadyTmr = &pInfo->chkptReadyMsgTmr;
|
|
if (pReadyTmr->tmrHandle != NULL) {
|
|
(void)taosTmrStop(pReadyTmr->tmrHandle);
|
|
pReadyTmr->tmrHandle = NULL;
|
|
}
|
|
|
|
taosMemoryFree(pInfo);
|
|
}
|
|
|
|
void streamTaskClearActiveInfo(SActiveCheckpointInfo* pInfo) {
|
|
pInfo->activeId = 0; // clear the checkpoint id
|
|
pInfo->transId = 0;
|
|
pInfo->allUpstreamTriggerRecv = 0;
|
|
pInfo->dispatchTrigger = false;
|
|
pInfo->failedId = 0;
|
|
|
|
taosArrayClear(pInfo->pDispatchTriggerList);
|
|
taosArrayClear(pInfo->pCheckpointReadyRecvList);
|
|
}
|
|
|
|
const char* streamTaskGetExecType(int32_t type) {
|
|
switch (type) {
|
|
case STREAM_EXEC_T_EXTRACT_WAL_DATA:
|
|
return "scan-wal-file";
|
|
case STREAM_EXEC_T_START_ALL_TASKS:
|
|
return "start-all-tasks";
|
|
case STREAM_EXEC_T_START_ONE_TASK:
|
|
return "start-one-task";
|
|
case STREAM_EXEC_T_RESTART_ALL_TASKS:
|
|
return "restart-all-tasks";
|
|
case STREAM_EXEC_T_STOP_ALL_TASKS:
|
|
return "stop-all-tasks";
|
|
case STREAM_EXEC_T_RESUME_TASK:
|
|
return "resume-task-from-idle";
|
|
case STREAM_EXEC_T_ADD_FAILED_TASK:
|
|
return "record-start-failed-task";
|
|
case 0:
|
|
return "exec-all-tasks";
|
|
default:
|
|
return "invalid-exec-type";
|
|
}
|
|
}
|