• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #3561

19 Dec 2024 03:15AM UTC coverage: 58.812% (-1.3%) from 60.124%
#3561

push

travis-ci

web-flow
Merge pull request #29213 from taosdata/merge/mainto3.0

merge: from main to 3.0 branch

130770 of 287658 branches covered (45.46%)

Branch coverage included in aggregate %.

32 of 78 new or added lines in 4 files covered. (41.03%)

7347 existing lines in 166 files now uncovered.

205356 of 283866 relevant lines covered (72.34%)

7187865.64 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

71.82
/source/dnode/mnode/impl/src/mndStreamUtil.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15

16
#include "mndDb.h"
17
#include "mndStb.h"
18
#include "mndStream.h"
19
#include "mndTrans.h"
20
#include "mndVgroup.h"
21
#include "taoserror.h"
22
#include "tmisce.h"
23

24
struct SStreamTaskIter {
25
  SStreamObj  *pStream;
26
  int32_t      level;
27
  int32_t      ordinalIndex;
28
  int32_t      totalLevel;
29
  SStreamTask *pTask;
30
};
31

32
int32_t doRemoveTasks(SStreamExecInfo *pExecNode, STaskId *pRemovedId);
33

34
/*
 * Allocate a task iterator positioned before the first task of pStream.
 *
 * On success the new iterator is stored in *pIter and 0 is returned. When the
 * allocation fails, *pIter is NULL and terrno is returned.
 */
int32_t createStreamTaskIter(SStreamObj *pStream, SStreamTaskIter **pIter) {
  SStreamTaskIter *pNew = taosMemoryCalloc(1, sizeof(SStreamTaskIter));

  *pIter = pNew;
  if (pNew == NULL) {
    return terrno;
  }

  pNew->pStream = pStream;
  pNew->pTask = NULL;
  pNew->level = -1;  // "not started yet"; the first advance moves to level 0
  pNew->ordinalIndex = 0;
  pNew->totalLevel = taosArrayGetSize(pStream->tasks);

  return 0;
}
48

49
/*
 * Advance the iterator to the next task, skipping exhausted (or empty) levels.
 *
 * Returns true and leaves the selected task in pIter->pTask when a task is
 * available; returns false with pIter->pTask set to NULL once all levels have
 * been consumed.
 */
bool streamTaskIterNextTask(SStreamTaskIter *pIter) {
  if (pIter->level >= pIter->totalLevel) {
    pIter->pTask = NULL;
    return false;
  }

  // first call after creation: step onto level 0
  if (pIter->level == -1) {
    pIter->level = 0;
  }

  for (; pIter->level < pIter->totalLevel; pIter->level += 1, pIter->ordinalIndex = 0) {
    SArray *pLevelTasks = taosArrayGetP(pIter->pStream->tasks, pIter->level);

    if (pIter->ordinalIndex < taosArrayGetSize(pLevelTasks)) {
      pIter->pTask = taosArrayGetP(pLevelTasks, pIter->ordinalIndex);
      pIter->ordinalIndex += 1;
      return true;
    }
    // current level is exhausted, the loop header moves on to the next one
  }

  pIter->pTask = NULL;
  return false;
}
76

77
/*
 * Copy the task currently selected by the iterator into *pTask.
 *
 * Returns TSDB_CODE_SUCCESS when a task is selected. Returns
 * TSDB_CODE_INVALID_PARA when pTask is NULL or when the iterator has no
 * current task (in which case *pTask is set to NULL).
 */
int32_t streamTaskIterGetCurrent(SStreamTaskIter *pIter, SStreamTask **pTask) {
  if (pTask == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  *pTask = pIter->pTask;
  return (*pTask != NULL) ? TSDB_CODE_SUCCESS : TSDB_CODE_INVALID_PARA;
}
87

88
// Release an iterator obtained from createStreamTaskIter(); only the iterator itself is freed.
void destroyStreamTaskIter(SStreamTaskIter *pIter) {
  taosMemoryFree(pIter);
}
17,036!
89

90
/*
 * Check every replica of a vgroup.
 *
 * Returns false as soon as one replica has not finished its sync restore or
 * is in the OFFLINE / ERROR / LEARNER / CANDIDATE sync state; returns true
 * when all replicas pass both checks.
 */
static bool checkStatusForEachReplica(SVgObj *pVgroup) {
  for (int32_t idx = 0; idx < pVgroup->replica; ++idx) {
    if (!pVgroup->vnodeGid[idx].syncRestore) {
      mInfo("vgId:%d not restored, not ready for checkpoint or other operations", pVgroup->vgId);
      return false;
    }

    ESyncState state = pVgroup->vnodeGid[idx].syncState;
    bool       notUsable = (state == TAOS_SYNC_STATE_OFFLINE) || (state == TAOS_SYNC_STATE_ERROR) ||
                     (state == TAOS_SYNC_STATE_LEARNER) || (state == TAOS_SYNC_STATE_CANDIDATE);
    if (notUsable) {
      mInfo("vgId:%d state:%d , not ready for checkpoint or other operations, not check other vgroups", pVgroup->vgId,
            state);
      return false;
    }
  }

  return true;
}
108

109
/*
 * Append one SNodeEntry (nodeId == SNODE_HANDLE) to pVgroupList for every
 * snode object stored in the sdb.
 *
 * Returns 0 on success, or the error code of the first failure while building
 * the epset or pushing the entry. A failure to render the epset as a string
 * only affects the debug log and is never returned to the caller.
 */
static int32_t mndAddSnodeInfo(SMnode *pMnode, SArray *pVgroupList) {
  SSnodeObj *pObj = NULL;
  void      *pIter = NULL;
  int32_t    code = 0;

  while (1) {
    pIter = sdbFetch(pMnode->pSdb, SDB_SNODE, pIter, (void **)&pObj);
    if (pIter == NULL) {
      break;
    }

    SNodeEntry entry = {.nodeId = SNODE_HANDLE};
    code = addEpIntoEpSet(&entry.epset, pObj->pDnode->fqdn, pObj->pDnode->port);
    if (code) {
      // log while the object is still held: pObj must not be touched after sdbRelease()
      mError("failed to extract epset for fqdn:%s during task vgroup snapshot", pObj->pDnode->fqdn);
      sdbRelease(pMnode->pSdb, pObj);
      sdbCancelFetch(pMnode->pSdb, pIter);
      return code;
    }

    // the string form is used for logging only; keep its status out of `code`
    // so that a formatting failure cannot become this function's return value
    char    buf[256] = {0};
    int32_t strCode = epsetToStr(&entry.epset, buf, tListLen(buf));
    if (strCode != 0) {  // print error and continue
      mError("failed to convert epset to str, code:%s", tstrerror(strCode));
    }

    void *p = taosArrayPush(pVgroupList, &entry);
    if (p == NULL) {
      code = terrno;
      sdbRelease(pMnode->pSdb, pObj);
      sdbCancelFetch(pMnode->pSdb, pIter);
      mError("failed to put entry in vgroup list, nodeId:%d code:%s", entry.nodeId, tstrerror(code));
      return code;
    } else {
      mDebug("take snode snapshot, nodeId:%d %s", entry.nodeId, buf);
    }

    sdbRelease(pMnode->pSdb, pObj);
  }

  return code;
}
151

152
/*
 * Walk all mnode objects and verify that each one is a sync LEADER or
 * FOLLOWER and that its sdb status is SDB_STATUS_READY.
 *
 * Returns TSDB_CODE_SUCCESS when every mnode passes, TSDB_CODE_FAILED as soon
 * as one does not (the fetch is cancelled before returning).
 */
static int32_t mndCheckMnodeStatus(SMnode* pMnode) {
  ESdbStatus objStatus;
  SMnodeObj *pMnodeObj = NULL;
  void      *pCursor = NULL;

  for (;;) {
    pCursor = sdbFetchAll(pMnode->pSdb, SDB_MNODE, pCursor, (void **)&pMnodeObj, &objStatus, true);
    if (pCursor == NULL) {
      return TSDB_CODE_SUCCESS;
    }

    bool syncOk = (pMnodeObj->syncState == TAOS_SYNC_STATE_LEADER) || (pMnodeObj->syncState == TAOS_SYNC_STATE_FOLLOWER);
    if (!syncOk) {
      mDebug("mnode sync state:%d not leader/follower", pMnodeObj->syncState);
    } else if (objStatus != SDB_STATUS_READY) {
      mWarn("mnode status:%d not ready", objStatus);
    } else {
      // this mnode is fine, look at the next one
      sdbRelease(pMnode->pSdb, pMnodeObj);
      continue;
    }

    // shared failure exit: drop the object and stop the iteration
    sdbRelease(pMnode->pSdb, pMnodeObj);
    sdbCancelFetch(pMnode->pSdb, pCursor);
    return TSDB_CODE_FAILED;
  }
}
183

184
/*
 * Append one SNodeEntry per vgroup to pVgroupList and evaluate readiness.
 *
 * *allReady is cleared when a vgroup's replica count differs from the first
 * vgroup seen for the same database, or when checkStatusForEachReplica()
 * rejects a vgroup. Entries are still collected after *allReady turned false.
 *
 * Returns 0 on success, or the error code of a failed hash insert / array
 * push. A failure to render an epset as a string only affects the debug log
 * and is never returned to the caller.
 */
static int32_t mndCheckAndAddVgroupsInfo(SMnode *pMnode, SArray *pVgroupList, bool* allReady) {
  SSdb     *pSdb = pMnode->pSdb;
  void     *pIter = NULL;
  SVgObj   *pVgroup = NULL;
  int32_t   code = 0;
  SHashObj *pHash = NULL;

  // dbUid -> replica count of the first vgroup seen for that database
  pHash = taosHashInit(10, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), false, HASH_NO_LOCK);
  if (pHash == NULL) {
    code = terrno;  // capture before logging, which may overwrite terrno
    mError("failed to prepare hashmap during take vgroup snapshot, code:%s", tstrerror(code));
    return code;
  }

  while (1) {
    pIter = sdbFetch(pSdb, SDB_VGROUP, pIter, (void **)&pVgroup);
    if (pIter == NULL) {
      break;
    }

    SNodeEntry entry = {.nodeId = pVgroup->vgId, .hbTimestamp = pVgroup->updateTime};
    entry.epset = mndGetVgroupEpset(pMnode, pVgroup);

    int8_t *pReplica = taosHashGet(pHash, &pVgroup->dbUid, sizeof(pVgroup->dbUid));
    if (pReplica == NULL) {  // not exist, add it into hash map
      code = taosHashPut(pHash, &pVgroup->dbUid, sizeof(pVgroup->dbUid), &pVgroup->replica, sizeof(pVgroup->replica));
      if (code) {
        mError("failed to put info into hashmap during task vgroup snapshot, code:%s", tstrerror(code));
        sdbRelease(pSdb, pVgroup);
        sdbCancelFetch(pSdb, pIter);
        goto _end;  // take snapshot failed, and not all ready
      }
    } else {
      if (*pReplica != pVgroup->replica) {
        mInfo("vgId:%d replica:%d inconsistent with other vgroups replica:%d, not ready for stream operations",
              pVgroup->vgId, pVgroup->replica, *pReplica);
        *allReady = false;  // task snap success, but not all ready
      }
    }

    // if not all ready till now, no need to check the remaining vgroups,
    // but still we need to put the info of the existed vgroups into the snapshot list
    if (*allReady) {
      *allReady = checkStatusForEachReplica(pVgroup);
    }

    // the string form is used for logging only; keep its status out of `code`
    // so that a formatting failure cannot become this function's return value
    char    buf[256] = {0};
    int32_t strCode = epsetToStr(&entry.epset, buf, tListLen(buf));
    if (strCode != 0) {  // print error and continue
      mError("failed to convert epset to str, code:%s", tstrerror(strCode));
    }

    void *p = taosArrayPush(pVgroupList, &entry);
    if (p == NULL) {
      code = terrno;  // capture before logging, which may overwrite terrno
      mError("failed to put entry in vgroup list, nodeId:%d code:out of memory", entry.nodeId);
      sdbRelease(pSdb, pVgroup);
      sdbCancelFetch(pSdb, pIter);
      goto _end;
    } else {
      mDebug("take node snapshot, nodeId:%d %s", entry.nodeId, buf);
    }

    sdbRelease(pSdb, pVgroup);
  }

_end:
  taosHashCleanup(pHash);
  return code;
}
253

254
/*
 * Build a list of SNodeEntry for all vgroups and snodes, and report through
 * *allReady whether every checked node is ready.
 *
 * When collecting the vgroup or snode entries fails, the list is destroyed,
 * *pList stays NULL, *allReady is false and the error code is returned.
 * Otherwise *pList receives the list and the return value is the result of
 * mndCheckMnodeStatus(); a non-success result also clears *allReady.
 */
int32_t mndTakeVgroupSnapshot(SMnode *pMnode, bool *allReady, SArray **pList) {
  int32_t code = 0;

  *pList = NULL;
  *allReady = true;

  SArray *pNodeEntries = taosArrayInit(4, sizeof(SNodeEntry));
  if (pNodeEntries == NULL) {
    mError("failed to prepare arraylist during take vgroup snapshot, code:%s", tstrerror(terrno));
    code = terrno;
    goto _err;
  }

  // 1. check for all vnodes status, 2. add snode info
  code = mndCheckAndAddVgroupsInfo(pMnode, pNodeEntries, allReady);
  if (code == 0) {
    code = mndAddSnodeInfo(pMnode, pNodeEntries);
  }
  if (code != 0) {
    goto _err;
  }

  // 3. check for mnode status; the list is still handed out when this fails
  code = mndCheckMnodeStatus(pMnode);
  if (code != TSDB_CODE_SUCCESS) {
    *allReady = false;
  }

  *pList = pNodeEntries;
  return code;

_err:
  *allReady = false;
  taosArrayDestroy(pNodeEntries);
  return code;
}
294

295
/*
 * Look up the stream whose uid equals streamId.
 *
 * On a match the object is stored in *pStream WITHOUT being released here, so
 * the caller is responsible for the matching sdbRelease(). When no stream
 * matches, *pStream is NULL and TSDB_CODE_STREAM_TASK_NOT_EXIST is returned.
 */
int32_t mndGetStreamObj(SMnode *pMnode, int64_t streamId, SStreamObj **pStream) {
  SSdb       *pSdb = pMnode->pSdb;
  SStreamObj *pCandidate = NULL;
  void       *pCursor = NULL;

  *pStream = NULL;

  for (;;) {
    pCursor = sdbFetch(pSdb, SDB_STREAM, pCursor, (void **)&pCandidate);
    if (pCursor == NULL) {
      return TSDB_CODE_STREAM_TASK_NOT_EXIST;
    }

    if (pCandidate->uid != streamId) {
      sdbRelease(pSdb, pCandidate);
      continue;
    }

    sdbCancelFetch(pSdb, pCursor);
    *pStream = pCandidate;
    return TSDB_CODE_SUCCESS;
  }
}
312

313
/*
 * Acquire the transaction identified by transId, ask mndKillTrans() to kill
 * it and release it again. Failures are only logged; pDbName is used for the
 * log messages.
 */
void mndKillTransImpl(SMnode *pMnode, int32_t transId, const char *pDbName) {
  STrans *pTrans = mndAcquireTrans(pMnode, transId);
  if (pTrans == NULL) {
    mError("failed to acquire trans in Db:%s, transId:%d", pDbName, transId);
    return;
  }

  mInfo("kill active transId:%d in Db:%s", transId, pDbName);

  int32_t code = mndKillTrans(pMnode, pTrans);
  if (code) {
    // report before releasing: pTrans must not be dereferenced after mndReleaseTrans()
    mError("failed to kill transId:%d, code:%s", pTrans->id, tstrerror(code));
  }

  mndReleaseTrans(pMnode, pTrans);
}
×
326

327
/*
 * Fill pEpSet with the endpoint set of the node a task runs on.
 *
 * nodeId == SNODE_HANDLE: use the first snode object returned by the sdb;
 *   TSDB_CODE_INVALID_PARA is returned when none exists, otherwise the result
 *   of addEpIntoEpSet().
 * any other nodeId: use the epset of that vgroup. A missing vgroup is not an
 *   error: TSDB_CODE_SUCCESS is returned with *hasEpset left false.
 *
 * *hasEpset is true only when pEpSet has actually been filled.
 */
int32_t extractNodeEpset(SMnode *pMnode, SEpSet *pEpSet, bool *hasEpset, int32_t taskId, int32_t nodeId) {
  *hasEpset = false;
  pEpSet->numOfEps = 0;

  if (nodeId != SNODE_HANDLE) {
    SVgObj *pVgObj = mndAcquireVgroup(pMnode, nodeId);
    if (pVgObj == NULL) {
      mDebug("orphaned task:0x%x need to be dropped, nodeId:%d, no redo action", taskId, nodeId);
      return TSDB_CODE_SUCCESS;
    }

    SEpSet vgEpset = mndGetVgroupEpset(pMnode, pVgObj);
    mndReleaseVgroup(pMnode, pVgObj);

    epsetAssign(pEpSet, &vgEpset);
    *hasEpset = true;
    return TSDB_CODE_SUCCESS;
  }

  // snode handle
  SSnodeObj *pSnode = NULL;
  void      *pCursor = NULL;

  pCursor = sdbFetch(pMnode->pSdb, SDB_SNODE, pCursor, (void **)&pSnode);
  if (pCursor == NULL) {
    mError("failed to acquire snode epset");
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t code = addEpIntoEpSet(pEpSet, pSnode->pDnode->fqdn, pSnode->pDnode->port);
  sdbRelease(pMnode->pSdb, pSnode);
  sdbCancelFetch(pMnode->pSdb, pCursor);

  *hasEpset = (code == 0);
  if (code) {
    mError("failed to set epset");
  }

  return code;
}
366

367
/*
 * Find the task of pStream whose id.taskId equals pId->taskId.
 *
 * Returns 0 and stores the task in *pTask when found. Returns the iterator
 * creation error, or TSDB_CODE_FAILED when no task matches; *pTask is NULL in
 * both failure cases.
 */
int32_t mndGetStreamTask(STaskId *pId, SStreamObj *pStream, SStreamTask **pTask) {
  *pTask = NULL;

  SStreamTaskIter *pTaskIter = NULL;
  int32_t          code = createStreamTaskIter(pStream, &pTaskIter);
  if (code) {
    mError("failed to create stream task iter:%s", pStream->name);
    return code;
  }

  int32_t result = TSDB_CODE_FAILED;
  while (streamTaskIterNextTask(pTaskIter)) {
    SStreamTask *pCurrent = NULL;
    if (streamTaskIterGetCurrent(pTaskIter, &pCurrent) != 0) {
      continue;
    }

    if (pCurrent->id.taskId == pId->taskId) {
      *pTask = pCurrent;
      result = 0;
      break;
    }
  }

  destroyStreamTaskIter(pTaskIter);
  return result;
}
394

395
int32_t mndGetNumOfStreamTasks(const SStreamObj *pStream) {
17,954✔
396
  int32_t num = 0;
17,954✔
397
  for (int32_t i = 0; i < taosArrayGetSize(pStream->tasks); ++i) {
52,979✔
398
    SArray *pLevel = taosArrayGetP(pStream->tasks, i);
35,025✔
399
    num += taosArrayGetSize(pLevel);
35,025✔
400
  }
401

402
  return num;
17,954✔
403
}
404

405
/*
 * Count the streams whose sourceDbUid equals the uid of database dbName and
 * store the count in *pNumOfStreams.
 *
 * Returns 0 on success. When the database cannot be acquired the function
 * returns through TAOS_RETURN(TSDB_CODE_MND_DB_NOT_SELECTED) and leaves
 * *pNumOfStreams untouched.
 */
int32_t mndGetNumOfStreams(SMnode *pMnode, char *dbName, int32_t *pNumOfStreams) {
  SSdb   *pSdb = pMnode->pSdb;
  SDbObj *pDb = mndAcquireDb(pMnode, dbName);
  if (pDb == NULL) {
    TAOS_RETURN(TSDB_CODE_MND_DB_NOT_SELECTED);
  }

  int32_t     matched = 0;
  SStreamObj *pStream = NULL;
  void       *pCursor = sdbFetch(pSdb, SDB_STREAM, NULL, (void **)&pStream);

  while (pCursor != NULL) {
    if (pStream->sourceDbUid == pDb->uid) {
      matched++;
    }
    sdbRelease(pSdb, pStream);

    pStream = NULL;
    pCursor = sdbFetch(pSdb, SDB_STREAM, pCursor, (void **)&pStream);
  }

  *pNumOfStreams = matched;
  mndReleaseDb(pMnode, pDb);
  return 0;
}
430

431
static void freeTaskList(void *param) {
1,520✔
432
  SArray **pList = (SArray **)param;
1,520✔
433
  taosArrayDestroy(*pList);
1,520✔
434
}
1,520✔
435

436
int32_t mndInitExecInfo() {
1,367✔
437
  int32_t code = taosThreadMutexInit(&execInfo.lock, NULL);
1,367✔
438
  if (code) {
1,367!
439
    return code;
×
440
  }
441

442
  _hash_fn_t fn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_VARCHAR);
1,367✔
443

444
  execInfo.pTaskList = taosArrayInit(4, sizeof(STaskId));
1,367✔
445
  execInfo.pTaskMap = taosHashInit(64, fn, true, HASH_NO_LOCK);
1,367✔
446
  execInfo.transMgmt.pDBTrans = taosHashInit(32, fn, true, HASH_NO_LOCK);
1,367✔
447
  execInfo.pTransferStateStreams = taosHashInit(32, fn, true, HASH_NO_LOCK);
1,367✔
448
  execInfo.pChkptStreams = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), true, HASH_NO_LOCK);
1,367✔
449
  execInfo.pStreamConsensus = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), true, HASH_NO_LOCK);
1,367✔
450
  execInfo.pNodeList = taosArrayInit(4, sizeof(SNodeEntry));
1,367✔
451
  execInfo.pKilledChkptTrans = taosArrayInit(4, sizeof(SStreamTaskResetMsg));
1,367✔
452

453
  if (execInfo.pTaskList == NULL || execInfo.pTaskMap == NULL || execInfo.transMgmt.pDBTrans == NULL ||
1,367!
454
      execInfo.pTransferStateStreams == NULL || execInfo.pChkptStreams == NULL || execInfo.pStreamConsensus == NULL ||
1,367!
455
      execInfo.pNodeList == NULL || execInfo.pKilledChkptTrans == NULL) {
1,367!
456
    mError("failed to initialize the stream runtime env, code:%s", tstrerror(terrno));
×
457
    return terrno;
×
458
  }
459

460
  execInfo.role = NODE_ROLE_UNINIT;
1,367✔
461
  execInfo.switchFromFollower = false;
1,367✔
462

463
  taosHashSetFreeFp(execInfo.pTransferStateStreams, freeTaskList);
1,367✔
464
  taosHashSetFreeFp(execInfo.pChkptStreams, freeTaskList);
1,367✔
465
  taosHashSetFreeFp(execInfo.pStreamConsensus, freeTaskList);
1,367✔
466
  return 0;
1,367✔
467
}
468

469
void removeExpiredNodeInfo(const SArray *pNodeSnapshot) {
514✔
470
  SArray *pValidList = taosArrayInit(4, sizeof(SNodeEntry));
514✔
471
  if (pValidList == NULL) {  // not continue
514!
472
    return;
×
473
  }
474

475
  int32_t size = taosArrayGetSize(pNodeSnapshot);
514✔
476
  int32_t oldSize = taosArrayGetSize(execInfo.pNodeList);
514✔
477

478
  for (int32_t i = 0; i < oldSize; ++i) {
3,486✔
479
    SNodeEntry *p = taosArrayGet(execInfo.pNodeList, i);
2,972✔
480
    if (p == NULL) {
2,972!
481
      continue;
×
482
    }
483

484
    for (int32_t j = 0; j < size; ++j) {
11,620✔
485
      SNodeEntry *pEntry = taosArrayGet(pNodeSnapshot, j);
10,603✔
486
      if (pEntry == NULL) {
10,603!
487
        continue;
×
488
      }
489

490
      if (pEntry->nodeId == p->nodeId) {
10,603✔
491
        p->hbTimestamp = pEntry->hbTimestamp;
1,955✔
492

493
        void *px = taosArrayPush(pValidList, p);
1,955✔
494
        if (px == NULL) {
1,955!
495
          mError("failed to put node into list, nodeId:%d", p->nodeId);
×
496
        } else {
497
          mDebug("vgId:%d ts:%" PRId64 " HbMsgId:%d is valid", p->nodeId, p->hbTimestamp, p->lastHbMsgId);
1,955✔
498
        }
499
        break;
1,955✔
500
      }
501
    }
502
  }
503

504
  taosArrayDestroy(execInfo.pNodeList);
514✔
505
  execInfo.pNodeList = pValidList;
514✔
506

507
  mDebug("remain %d valid node entries after clean expired nodes info, prev size:%d",
514✔
508
         (int32_t)taosArrayGetSize(pValidList), oldSize);
509
}
510

511
/*
 * Remove one task id from pExecNode->pTaskMap and from pExecNode->pTaskList.
 *
 * A task that is not present in the map is not an error. Returns
 * TSDB_CODE_SUCCESS, or the error reported by taosHashRemove() (in which case
 * the list is left untouched).
 */
int32_t doRemoveTasks(SStreamExecInfo *pExecNode, STaskId *pRemovedId) {
  if (taosHashGet(pExecNode->pTaskMap, pRemovedId, sizeof(*pRemovedId)) == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  int32_t code = taosHashRemove(pExecNode->pTaskMap, pRemovedId, sizeof(*pRemovedId));
  if (code) {
    return code;
  }

  // drop the first list entry carrying the same (streamId, taskId) pair
  for (int32_t idx = 0; idx < taosArrayGetSize(pExecNode->pTaskList); ++idx) {
    STaskId *pCur = taosArrayGet(pExecNode->pTaskList, idx);
    if (pCur == NULL) {
      continue;
    }

    bool sameTask = (pCur->taskId == pRemovedId->taskId) && (pCur->streamId == pRemovedId->streamId);
    if (!sameTask) {
      continue;
    }

    taosArrayRemove(pExecNode->pTaskList, idx);

    int32_t num = taosArrayGetSize(pExecNode->pTaskList);
    mInfo("s-task:0x%x removed from buffer, remain:%d in buffer list", (int32_t)pRemovedId->taskId, num);
    break;
  }

  return TSDB_CODE_SUCCESS;
}
539

540
// Remove every task id listed in pTaskIds from pExecInfo; individual failures are logged and skipped.
void removeTasksInBuf(SArray *pTaskIds, SStreamExecInfo *pExecInfo) {
  for (int32_t i = 0; i < taosArrayGetSize(pTaskIds); ++i) {
    STaskId *pId = taosArrayGet(pTaskIds, i);

    if (pId != NULL && doRemoveTasks(pExecInfo, pId) != 0) {
      mError("failed to remove task in buffer list, 0x%" PRIx64, pId->taskId);
    }
  }
}
1,497✔
553

554
/*
 * Under pExecNode->lock, remove all tasks of pStream from the execution
 * buffer, then clear the stream's consensus-checkpoint and checkpoint-report
 * entries.
 *
 * The second step is skipped (with an error log) when the task map and the
 * task list end up with different sizes.
 * NOTE(review): step 2 operates on the global execInfo tables rather than on
 * pExecNode - presumably callers always pass &execInfo; confirm.
 */
void removeStreamTasksInBuf(SStreamObj *pStream, SStreamExecInfo *pExecNode) {
  SStreamTaskIter *pTaskIter = NULL;

  streamMutexLock(&pExecNode->lock);

  // 1. remove task entries
  int32_t code = createStreamTaskIter(pStream, &pTaskIter);
  if (code) {
    streamMutexUnlock(&pExecNode->lock);
    mError("failed to create stream task iter:%s", pStream->name);
    return;
  }

  while (streamTaskIterNextTask(pTaskIter)) {
    SStreamTask *pTask = NULL;
    if (streamTaskIterGetCurrent(pTaskIter, &pTask) != 0) {
      continue;
    }

    STaskId id = {.streamId = pTask->id.streamId, .taskId = pTask->id.taskId};
    if (doRemoveTasks(pExecNode, &id) != 0) {
      mError("failed to remove task in buffer list, 0x%" PRIx64, id.taskId);
    }
  }

  bool sizesAgree = (taosHashGetSize(pExecNode->pTaskMap) == taosArrayGetSize(pExecNode->pTaskList));
  if (sizesAgree) {
    // 2. remove stream entry in consensus hash table and checkpoint-report hash table
    code = mndClearConsensusCheckpointId(execInfo.pStreamConsensus, pStream->uid);
    if (code) {
      mError("failed to clear consensus checkpointId, code:%s", tstrerror(code));
    }

    code = mndClearChkptReportInfo(execInfo.pChkptStreams, pStream->uid);
    if (code) {
      mError("failed to clear the checkpoint report info, code:%s", tstrerror(code));
    }
  }

  streamMutexUnlock(&pExecNode->lock);
  destroyStreamTaskIter(pTaskIter);

  if (!sizesAgree) {
    mError("task map size, task list size, not equal");
  }
}
601

602
// Return true when pList contains an SNodeEntry whose nodeId equals nodeId.
static bool taskNodeExists(SArray *pList, int32_t nodeId) {
  size_t num = taosArrayGetSize(pList);

  for (int32_t i = 0; i < num; ++i) {
    SNodeEntry *pNode = taosArrayGet(pList, i);
    if (pNode != NULL && pNode->nodeId == nodeId) {
      return true;
    }
  }

  return false;
}
618

619
/*
 * Drop from the global execInfo every buffered task whose node no longer
 * appears in pNodeSnapshot (tasks on SNODE_HANDLE are never dropped), then
 * prune execInfo.pNodeList through removeExpiredNodeInfo().
 *
 * Returns 0, or terrno when the temporary removal list cannot be allocated.
 */
int32_t removeExpiredNodeEntryAndTaskInBuf(SArray *pNodeSnapshot) {
  SArray *pToRemove = taosArrayInit(4, sizeof(STaskId));
  if (pToRemove == NULL) {
    return terrno;
  }

  // collect first, remove afterwards: the task list is not modified while it is scanned
  int32_t numOfTask = taosArrayGetSize(execInfo.pTaskList);
  for (int32_t i = 0; i < numOfTask; ++i) {
    STaskId *pId = taosArrayGet(execInfo.pTaskList, i);
    if (pId == NULL) {
      continue;
    }

    STaskStatusEntry *pEntry = taosHashGet(execInfo.pTaskMap, pId, sizeof(*pId));
    if (pEntry == NULL || pEntry->nodeId == SNODE_HANDLE) {
      continue;
    }

    if (taskNodeExists(pNodeSnapshot, pEntry->nodeId)) {
      continue;
    }

    if (taosArrayPush(pToRemove, pId) == NULL) {
      mError("failed to put task entry into remove list, taskId:0x%" PRIx64, pId->taskId);
    }
  }

  removeTasksInBuf(pToRemove, &execInfo);

  mDebug("remove invalid stream tasks:%d, remain:%d", (int32_t)taosArrayGetSize(pToRemove),
         (int32_t)taosArrayGetSize(execInfo.pTaskList));

  removeExpiredNodeInfo(pNodeSnapshot);

  taosArrayDestroy(pToRemove);
  return 0;
}
660

661
/*
 * Scan execInfo.pChkptStreams under execInfo.lock.
 *
 * For the first stream whose tasks have all sent their checkpoint report and
 * that passes the transaction conflict check, a checkpoint-info update
 * transaction is created and the scan stops. Report entries whose stream can
 * no longer be found are removed from the table afterwards.
 *
 * Returns terrno when the temporary list cannot be allocated, otherwise
 * always TSDB_CODE_SUCCESS.
 */
int32_t mndScanCheckpointReportInfo(SRpcMsg *pReq) {
  SMnode *pMnode = pReq->info.node;
  void   *pIter = NULL;
  int32_t code = 0;

  SArray *pGone = taosArrayInit(4, sizeof(int64_t));
  if (pGone == NULL) {
    return terrno;
  }

  mDebug("start to scan checkpoint report info");
  streamMutexLock(&execInfo.lock);

  while ((pIter = taosHashIterate(execInfo.pChkptStreams, pIter)) != NULL) {
    SChkptReportInfo *pReport = (SChkptReportInfo *)pIter;
    if (taosArrayGetSize(pReport->pTaskList) == 0) {
      continue;
    }

    STaskChkptInfo *pFirst = taosArrayGet(pReport->pTaskList, 0);
    if (pFirst == NULL) {
      continue;
    }

    SStreamObj *pStream = NULL;
    code = mndGetStreamObj(pMnode, pFirst->streamId, &pStream);
    if (pStream == NULL || code != 0) {
      mDebug("failed to acquire stream:0x%" PRIx64 " remove it from checkpoint-report list", pFirst->streamId);
      if (taosArrayPush(pGone, &pFirst->streamId) == NULL) {
        mError("failed to put stream into drop list:0x%" PRIx64, pFirst->streamId);
      }
      continue;
    }

    int32_t total = mndGetNumOfStreamTasks(pStream);
    int32_t existed = (int32_t)taosArrayGetSize(pReport->pTaskList);

    if (total != existed) {
      mDebug("stream:0x%" PRIx64 " %s %d/%d tasks send checkpoint-report, %d not send", pFirst->streamId, pStream->name,
             existed, total, total - existed);
      sdbRelease(pMnode->pSdb, pStream);
      continue;
    }

    mDebug("stream:0x%" PRIx64 " %s all %d tasks send checkpoint-report, start to update checkpoint-info",
           pStream->uid, pStream->name, total);

    code = mndStreamTransConflictCheck(pMnode, pStream->uid, MND_STREAM_CHKPT_UPDATE_NAME, false);
    if (code != 0) {
      mDebug("stream:0x%" PRIx64 " active checkpoint trans not finished yet, wait", pFirst->streamId);
      sdbRelease(pMnode->pSdb, pStream);
      continue;
    }

    code = mndCreateStreamChkptInfoUpdateTrans(pMnode, pStream, pReport->pTaskList);
    if (code == TSDB_CODE_SUCCESS || code == TSDB_CODE_ACTION_IN_PROGRESS) {  // remove this entry
      taosArrayClear(pReport->pTaskList);
      pReport->reportChkpt = pFirst->checkpointId;
      mDebug("stream:0x%" PRIx64 " clear checkpoint-report list", pFirst->streamId);
    } else {
      mDebug("stream:0x%" PRIx64 " not launch chkpt-meta update trans, due to checkpoint not finished yet",
             pFirst->streamId);
    }

    // NOTE(review): the scan stops here without sdbRelease(pStream) and without cancelling the
    // hash iteration - presumably mndCreateStreamChkptInfoUpdateTrans() takes over the stream
    // reference; confirm against its implementation.
    break;
  }

  int32_t numOfGone = taosArrayGetSize(pGone);
  if (numOfGone > 0) {
    for (int32_t i = 0; i < numOfGone; ++i) {
      int64_t *pStreamId = (int64_t *)taosArrayGet(pGone, i);
      if (pStreamId == NULL) {
        continue;
      }

      code = taosHashRemove(execInfo.pChkptStreams, pStreamId, sizeof(*pStreamId));
      if (code) {
        mError("failed to remove stream in buf:0x%" PRIx64, *pStreamId);
      }
    }

    int32_t numOfStreams = taosHashGetSize(execInfo.pChkptStreams);
    mDebug("drop %d stream(s) in checkpoint-report list, remain:%d", numOfGone, numOfStreams);
  }

  streamMutexUnlock(&execInfo.lock);

  taosArrayDestroy(pGone);
  return TSDB_CODE_SUCCESS;
}
748

749
/*
 * Create and prepare the transaction that sets the consensus checkpoint id
 * (checkpointId, ts) for task taskId of pStream.
 *
 * Returns TSDB_CODE_ACTION_IN_PROGRESS once the transaction has been
 * prepared, otherwise the error code of the step that failed.
 *
 * Once the transaction object exists, every exit path releases pStream and
 * drops the local transaction handle.
 * NOTE(review): when doCreateTrans() itself fails, pStream is NOT released
 * here (unchanged from the previous behaviour) - confirm that this is what
 * callers expect.
 */
int32_t mndCreateSetConsensusChkptIdTrans(SMnode *pMnode, SStreamObj *pStream, int32_t taskId, int64_t checkpointId,
                                          int64_t ts) {
  char msg[128] = {0};
  snprintf(msg, tListLen(msg), "set consen-chkpt-id for task:0x%x", taskId);

  STrans *pTrans = NULL;
  int32_t code = doCreateTrans(pMnode, pStream, NULL, TRN_CONFLICT_NOTHING, MND_STREAM_CHKPT_CONSEN_NAME, msg, &pTrans);
  if (pTrans == NULL || code != 0) {
    // prefer the explicit error code; fall back to terrno only when none was reported
    return (code != 0) ? code : terrno;
  }

  STaskId      id = {.streamId = pStream->uid, .taskId = taskId};
  SStreamTask *pTask = NULL;
  code = mndGetStreamTask(&id, pStream, &pTask);
  if (code) {
    mError("failed to get task:0x%x in stream:%s, failed to create consensus-checkpointId", taskId, pStream->name);
    goto _end;
  }

  code = mndStreamRegisterTrans(pTrans, MND_STREAM_CHKPT_CONSEN_NAME, pStream->uid);
  if (code) {
    goto _end;
  }

  code = mndStreamSetChkptIdAction(pMnode, pTrans, pTask, checkpointId, ts);
  if (code != 0) {
    goto _end;
  }

  code = mndPersistTransLog(pStream, pTrans, SDB_STATUS_READY);
  if (code) {
    goto _end;
  }

  code = mndTransPrepare(pMnode, pTrans);
  if (code != TSDB_CODE_SUCCESS && code != TSDB_CODE_ACTION_IN_PROGRESS) {
    mError("trans:%d, failed to prepare set consensus-chkptId trans since %s", pTrans->id, terrstr());
    goto _end;
  }

  code = TSDB_CODE_ACTION_IN_PROGRESS;

_end:
  // single exit: the transaction handle is dropped on every path, including the
  // early failures that previously returned without dropping it
  sdbRelease(pMnode->pSdb, pStream);
  mndTransDrop(pTrans);
  return code;
}
802

803
/*
 * Return, in *pInfo, the consensus-checkpoint entry stored in pHash for
 * streamId, creating an empty entry (with numOfTasks) when none exists yet.
 *
 * Returns 0 on success. On failure *pInfo is NULL and the return value is
 * terrno (task list allocation failed) or the taosHashPut() error.
 */
int32_t mndGetConsensusInfo(SHashObj *pHash, int64_t streamId, int32_t numOfTasks, SCheckpointConsensusInfo **pInfo) {
  *pInfo = NULL;

  void *px = taosHashGet(pHash, &streamId, sizeof(streamId));
  if (px != NULL) {
    *pInfo = px;
    return 0;
  }

  SCheckpointConsensusInfo p = {
      .pTaskList = taosArrayInit(4, sizeof(SCheckpointConsensusEntry)),
      .numOfTasks = numOfTasks,
      .streamId = streamId,
  };

  if (p.pTaskList == NULL) {
    return terrno;
  }

  int32_t code = taosHashPut(pHash, &streamId, sizeof(streamId), &p, sizeof(p));
  if (code != 0) {
    // the entry was not stored, so nothing else owns the freshly created list
    taosArrayDestroy(p.pTaskList);
    return code;
  }

  // hand out the copy stored in the table, not the local struct
  *pInfo = (SCheckpointConsensusInfo *)taosHashGet(pHash, &streamId, sizeof(streamId));
  return code;
}
832

833
// whether or not the task already exists, add the request to the info list anyway, since we need to send the rsp manually;
834
// discarding the msg may lead to lost connections.
835
void mndAddConsensusTasks(SCheckpointConsensusInfo *pInfo, const SRestoreCheckpointInfo *pRestoreInfo) {
129✔
836
  SCheckpointConsensusEntry info = {.ts = taosGetTimestampMs()};
129✔
837
  memcpy(&info.req, pRestoreInfo, sizeof(info.req));
129✔
838

839
  for (int32_t i = 0; i < taosArrayGetSize(pInfo->pTaskList); ++i) {
401✔
840
    SCheckpointConsensusEntry *p = taosArrayGet(pInfo->pTaskList, i);
280✔
841
    if (p == NULL) {
280!
842
      continue;
×
843
    }
844

845
    if (p->req.taskId == info.req.taskId) {
280✔
846
      mDebug("s-task:0x%x already in consensus-checkpointId list for stream:0x%" PRIx64 ", update ts %" PRId64
8✔
847
             "->%" PRId64 " total existed:%d",
848
             pRestoreInfo->taskId, pRestoreInfo->streamId, p->req.startTs, info.req.startTs,
849
             (int32_t)taosArrayGetSize(pInfo->pTaskList));
850
      p->req.startTs = info.req.startTs;
8✔
851
      return;
8✔
852
    }
853
  }
854

855
  void *p = taosArrayPush(pInfo->pTaskList, &info);
121✔
856
  if (p == NULL) {
121!
857
    mError("s-task:0x%x failed to put task into consensus-checkpointId list, code: out of memory", info.req.taskId);
×
858
  } else {
859
    int32_t num = taosArrayGetSize(pInfo->pTaskList);
121✔
860
    mDebug("s-task:0x%x checkpointId:%" PRId64 " added into consensus-checkpointId list, stream:0x%" PRIx64
121✔
861
           " waiting tasks:%d",
862
           pRestoreInfo->taskId, pRestoreInfo->checkpointId, pRestoreInfo->streamId, num);
863
  }
864
}
865

866
// Release the task list of a consensus record and leave the record with a NULL list.
void mndClearConsensusRspEntry(SCheckpointConsensusInfo *pInfo) {
  SArray *pList = pInfo->pTaskList;

  pInfo->pTaskList = NULL;
  taosArrayDestroy(pList);
}
29✔
870

871
/**
 * Remove the consensus-checkpointId record of a stream from pHash.
 *
 * @param pHash    hash table keyed by the stream id
 * @param streamId id of the stream whose record is dropped
 * @return 0 when the table is empty or the record was removed, otherwise the code of taosHashRemove
 */
int64_t mndClearConsensusCheckpointId(SHashObj *pHash, int64_t streamId) {
  if (taosHashGetSize(pHash) == 0) {
    return 0;
  }

  int32_t code = taosHashRemove(pHash, &streamId, sizeof(streamId));

  // read the size after the removal so that "remain" reports what is really left in the table
  int32_t numOfRemain = taosHashGetSize(pHash);
  if (code == 0) {
    mDebug("drop stream:0x%" PRIx64 " in consensus-checkpointId list, remain:%d", streamId, numOfRemain);
  } else {
    mError("failed to remove stream:0x%" PRIx64 " in consensus-checkpointId list, remain:%d", streamId, numOfRemain);
  }

  return code;
}
887

888
/**
 * Remove the checkpoint-report record of a stream from pHash.
 *
 * @param pHash    hash table keyed by the stream id
 * @param streamId id of the stream whose record is dropped
 * @return 0 when the table is empty or the record was removed, otherwise the code of taosHashRemove
 */
int64_t mndClearChkptReportInfo(SHashObj *pHash, int64_t streamId) {
  if (taosHashGetSize(pHash) == 0) {
    return 0;
  }

  int32_t code = taosHashRemove(pHash, &streamId, sizeof(streamId));

  // read the size after the removal so that "remain" reports what is really left in the table
  int32_t numOfRemain = taosHashGetSize(pHash);
  if (code == 0) {
    mDebug("drop stream:0x%" PRIx64 " in chkpt-report list, remain:%d", streamId, numOfRemain);
  } else {
    mError("failed to remove stream:0x%" PRIx64 " in chkpt-report list, remain:%d", streamId, numOfRemain);
  }

  return code;
}
904

905
// Empty the task list of a stream's checkpoint-report record while keeping the record itself in pHash.
// Returns TSDB_CODE_MND_STREAM_NOT_EXIST when pHash holds no record for streamId, 0 otherwise.
int32_t mndResetChkptReportInfo(SHashObj *pHash, int64_t streamId) {
  SChkptReportInfo *pReport = taosHashGet(pHash, &streamId, sizeof(streamId));
  if (pReport == NULL) {
    return TSDB_CODE_MND_STREAM_NOT_EXIST;
  }

  taosArrayClear(pReport->pTaskList);
  mDebug("stream:0x%" PRIx64 " checkpoint-report list cleared, prev report checkpointId:%" PRId64, streamId,
         pReport->reportChkpt);
  return 0;
}
916

917
static void mndShowStreamStatus(char *dst, int8_t status) {
809✔
918
  if (status == STREAM_STATUS__NORMAL) {
809✔
919
    tstrncpy(dst, "ready", MND_STREAM_TRIGGER_NAME_SIZE);
785✔
920
  } else if (status == STREAM_STATUS__STOP) {
24!
921
    tstrncpy(dst, "stop", MND_STREAM_TRIGGER_NAME_SIZE);
×
922
  } else if (status == STREAM_STATUS__FAILED) {
24!
923
    tstrncpy(dst, "failed", MND_STREAM_TRIGGER_NAME_SIZE);
×
924
  } else if (status == STREAM_STATUS__RECOVER) {
24!
925
    tstrncpy(dst, "recover", MND_STREAM_TRIGGER_NAME_SIZE);
×
926
  } else if (status == STREAM_STATUS__PAUSE) {
24!
927
    tstrncpy(dst, "paused", MND_STREAM_TRIGGER_NAME_SIZE);
24✔
928
  }
929
}
809✔
930

931
// Write the display name of the stream's trigger mode into dst (at most MND_STREAM_TRIGGER_NAME_SIZE bytes).
// dst is left untouched for a trigger mode that has no display name.
static void mndShowStreamTrigger(char *dst, SStreamObj *pStream) {
  const char *pName = NULL;

  switch (pStream->conf.trigger) {
    case STREAM_TRIGGER_AT_ONCE:
      pName = "at once";
      break;
    case STREAM_TRIGGER_WINDOW_CLOSE:
      pName = "window close";
      break;
    case STREAM_TRIGGER_MAX_DELAY:
      pName = "max delay";
      break;
    case STREAM_TRIGGER_FORCE_WINDOW_CLOSE:
      pName = "force window close";
      break;
    default:
      break;
  }

  if (pName != NULL) {
    tstrncpy(dst, pName, MND_STREAM_TRIGGER_NAME_SIZE);
  }
}
809✔
943

944
// Render id as a "0x"-prefixed hex string in var-string form: the text starts at byte offset 2 of pBuf and the
// stored length covers the two prefix characters plus the digits produced by tintToHex.
static void int64ToHexStr(int64_t id, char *pBuf, int32_t bufLen) {
  memset(pBuf, 0, bufLen);

  char *pText = pBuf + 2;
  pText[0] = '0';
  pText[1] = 'x';

  int32_t numOfDigits = tintToHex(id, pText + 2);
  varDataSetLen(pBuf, numOfDigits + 2);
}
37,220✔
952

953
// Walk every task of pStream under the stream read latch and report through pRes whether no task with a status
// entry in execInfo.pTaskMap is in a state other than TASK_STATUS__PAUSE. Tasks without a status entry are
// ignored. pRes is only written when the walk finishes without error; the error code is returned otherwise.
static int32_t isAllTaskPaused(SStreamObj *pStream, bool *pRes) {
  int32_t          code = TSDB_CODE_SUCCESS;
  int32_t          lino = 0;
  SStreamTaskIter *pTaskIter = NULL;
  bool             allPaused = true;

  taosRLockLatch(&pStream->lock);

  code = createStreamTaskIter(pStream, &pTaskIter);
  TSDB_CHECK_CODE(code, lino, _end);

  while (streamTaskIterNextTask(pTaskIter)) {
    SStreamTask *pCurTask = NULL;
    code = streamTaskIterGetCurrent(pTaskIter, &pCurTask);
    TSDB_CHECK_CODE(code, lino, _end);

    STaskId           key = {.streamId = pCurTask->id.streamId, .taskId = pCurTask->id.taskId};
    STaskStatusEntry *pEntry = taosHashGet(execInfo.pTaskMap, &key, sizeof(key));
    if (pEntry != NULL && pEntry->status != TASK_STATUS__PAUSE) {
      allPaused = false;
    }
  }

  *pRes = allPaused;

_end:
  destroyStreamTaskIter(pTaskIter);
  taosRUnLockLatch(&pStream->lock);

  if (code != TSDB_CODE_SUCCESS) {
    mError("error happens when get stream status, lino:%d, code:%s", lino, tstrerror(code));
  }
  return code;
}
987

988
/**
 * Fill one row of a result block with the attributes of a stream. The columns of pBlock are written in order,
 * one value per column.
 *
 * @param pStream   stream whose attributes are reported
 * @param pBlock    result block; its pDataBlock array supplies the columns
 * @param numOfRows passed to colDataSetVal as the index of the row to write
 * @return 0 on success; otherwise the first error met (also logged together with the failing line number)
 */
int32_t setStreamAttrInResBlock(SStreamObj *pStream, SSDataBlock *pBlock, int32_t numOfRows) {
  int32_t code = 0;
  int32_t cols = 0;
  int32_t lino = 0;

  // stream name
  char streamName[TSDB_TABLE_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
  STR_WITH_MAXSIZE_TO_VARSTR(streamName, mndGetDbStr(pStream->name), sizeof(streamName));
  SColumnInfoData *pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)streamName, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // create time
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);
  code = colDataSetVal(pColInfo, numOfRows, (const char *)&pStream->createTime, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // stream id
  char buf[128] = {0};
  int64ToHexStr(pStream->uid, buf, tListLen(buf));
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);
  code = colDataSetVal(pColInfo, numOfRows, buf, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // related fill-history stream id, NULL when there is none
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);
  if (pStream->hTaskUid != 0) {
    int64ToHexStr(pStream->hTaskUid, buf, tListLen(buf));
    code = colDataSetVal(pColInfo, numOfRows, buf, false);
  } else {
    code = colDataSetVal(pColInfo, numOfRows, buf, true);
  }
  TSDB_CHECK_CODE(code, lino, _end);

  // sql
  char sql[TSDB_SHOW_SQL_LEN + VARSTR_HEADER_SIZE] = {0};
  STR_WITH_MAXSIZE_TO_VARSTR(sql, pStream->sql, sizeof(sql));
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);
  code = colDataSetVal(pColInfo, numOfRows, (const char *)sql, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // status: reported as paused when isAllTaskPaused says so, whatever the stream object itself records
  char status[20 + VARSTR_HEADER_SIZE] = {0};
  char status2[MND_STREAM_TRIGGER_NAME_SIZE] = {0};
  bool isPaused = false;
  code = isAllTaskPaused(pStream, &isPaused);
  TSDB_CHECK_CODE(code, lino, _end);

  int8_t streamStatus = atomic_load_8(&pStream->status);
  if (isPaused) {
    streamStatus = STREAM_STATUS__PAUSE;
  }
  mndShowStreamStatus(status2, streamStatus);
  STR_WITH_MAXSIZE_TO_VARSTR(status, status2, sizeof(status));
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)status, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // source db
  char sourceDB[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
  STR_WITH_MAXSIZE_TO_VARSTR(sourceDB, mndGetDbStr(pStream->sourceDb), sizeof(sourceDB));
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)sourceDB, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // target db
  char targetDB[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
  STR_WITH_MAXSIZE_TO_VARSTR(targetDB, mndGetDbStr(pStream->targetDb), sizeof(targetDB));
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)targetDB, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // target super table, NULL when the name is empty
  if (pStream->targetSTbName[0] == 0) {
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

    code = colDataSetVal(pColInfo, numOfRows, NULL, true);
  } else {
    char targetSTB[TSDB_TABLE_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
    STR_WITH_MAXSIZE_TO_VARSTR(targetSTB, mndGetStbStr(pStream->targetSTbName), sizeof(targetSTB));
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

    code = colDataSetVal(pColInfo, numOfRows, (const char *)targetSTB, false);
  }
  TSDB_CHECK_CODE(code, lino, _end);

  // watermark
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)&pStream->conf.watermark, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // trigger
  char trigger[20 + VARSTR_HEADER_SIZE] = {0};
  char trigger2[MND_STREAM_TRIGGER_NAME_SIZE] = {0};
  mndShowStreamTrigger(trigger2, pStream);
  STR_WITH_MAXSIZE_TO_VARSTR(trigger, trigger2, sizeof(trigger));
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)trigger, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // sink_quota: always the text "0"; sinkQuota holds the plain string, dstStr the var-string written to the column
  char sinkQuota[20 + VARSTR_HEADER_SIZE] = {0};
  sinkQuota[0] = '0';
  char dstStr[20] = {0};
  STR_TO_VARSTR(dstStr, sinkQuota)
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)dstStr, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // checkpoint interval
  char tmp[20 + VARSTR_HEADER_SIZE] = {0};
  (void)tsnprintf(varDataVal(tmp), sizeof(tmp) - VARSTR_HEADER_SIZE, "%d sec", tsStreamCheckpointInterval);
  varDataSetLen(tmp, strlen(varDataVal(tmp)));

  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)tmp, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // checkpoint backup type
  char backup[20 + VARSTR_HEADER_SIZE] = {0};
  STR_TO_VARSTR(backup, "none")
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)backup, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // history scan idle: always the text "100a"
  char scanHistoryIdle[20 + VARSTR_HEADER_SIZE] = {0};
  tstrncpy(scanHistoryIdle, "100a", sizeof(scanHistoryIdle));

  memset(dstStr, 0, tListLen(dstStr));
  STR_TO_VARSTR(dstStr, scanHistoryIdle)
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)dstStr, false);
  // checked like every other column so that a failure here is logged with its line number instead of lino:0
  TSDB_CHECK_CODE(code, lino, _end);

_end:
  if (code) {
    mError("error happens when build stream attr result block, lino:%d, code:%s", lino, tstrerror(code));
  }
  return code;
}
1147

1148
/**
 * Fill one row of a result block with the attributes of a stream task. The runtime figures come from the task's
 * status entry in execInfo.pTaskMap; the columns of pBlock are written in order, one value per column.
 *
 * @param pStream   stream that owns the task (its name is reported and used in the error log)
 * @param pTask     task whose attributes are reported
 * @param pBlock    result block; its pDataBlock array supplies the columns
 * @param numOfRows passed to colDataSetVal/colDataSetNULL as the index of the row to write
 * @param precision forwarded to taosFormatUtcTime when the processed time window is formatted
 * @return 0 on success; TSDB_CODE_STREAM_TASK_NOT_EXIST when the task has no status entry; otherwise the first
 *         error met (also logged together with the failing line number)
 */
int32_t setTaskAttrInResBlock(SStreamObj *pStream, SStreamTask *pTask, SSDataBlock *pBlock, int32_t numOfRows,
                              int32_t precision) {
  SColumnInfoData *pColInfo = NULL;
  int32_t          cols = 0;
  int32_t          code = 0;
  int32_t          lino = 0;

  STaskId id = {.streamId = pTask->id.streamId, .taskId = pTask->id.taskId};

  STaskStatusEntry *pe = taosHashGet(execInfo.pTaskMap, &id, sizeof(id));
  if (pe == NULL) {
    mError("task:0x%" PRIx64 " not exists in any vnodes, streamName:%s, streamId:0x%" PRIx64 " createTs:%" PRId64
           " no valid status/stage info",
           id.taskId, pStream->name, pStream->uid, pStream->createTime);
    return TSDB_CODE_STREAM_TASK_NOT_EXIST;
  }

  // stream name
  char streamName[TSDB_TABLE_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
  STR_WITH_MAXSIZE_TO_VARSTR(streamName, mndGetDbStr(pStream->name), sizeof(streamName));

  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)streamName, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // task id
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  char idstr[128] = {0};
  int64ToHexStr(pTask->id.taskId, idstr, tListLen(idstr));
  code = colDataSetVal(pColInfo, numOfRows, idstr, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // node type: "vnode" for a positive node id, "snode" otherwise
  char nodeType[20 + VARSTR_HEADER_SIZE] = {0};
  varDataSetLen(nodeType, 5);
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  if (pTask->info.nodeId > 0) {
    memcpy(varDataVal(nodeType), "vnode", 5);
  } else {
    memcpy(varDataVal(nodeType), "snode", 5);
  }
  code = colDataSetVal(pColInfo, numOfRows, nodeType, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // node id, negative ids are reported as 0
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  int64_t nodeId = TMAX(pTask->info.nodeId, 0);
  code = colDataSetVal(pColInfo, numOfRows, (const char *)&nodeId, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // level
  char level[20 + VARSTR_HEADER_SIZE] = {0};
  if (pTask->info.taskLevel == TASK_LEVEL__SOURCE) {
    STR_WITH_SIZE_TO_VARSTR(level, "source", 6);
  } else if (pTask->info.taskLevel == TASK_LEVEL__AGG) {
    STR_WITH_SIZE_TO_VARSTR(level, "agg", 3);
  } else if (pTask->info.taskLevel == TASK_LEVEL__SINK) {
    STR_WITH_SIZE_TO_VARSTR(level, "sink", 4);
  }

  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)level, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // status
  char status[20 + VARSTR_HEADER_SIZE] = {0};

  const char *pStatus = streamTaskGetStatusStr(pe->status);
  STR_TO_VARSTR(status, pStatus);

  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)status, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // stage
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)&pe->stage, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // input queue
  char vbuf[40] = {0};
  char buf[38] = {0};
  // a literal percent sign must be written as "%%": a lone '%' followed by ')' is an invalid conversion
  const char *queueInfoStr = "%4.2f MiB (%6.2f%%)";
  snprintf(buf, tListLen(buf), queueInfoStr, pe->inputQUsed, pe->inputRate);
  STR_TO_VARSTR(vbuf, buf);

  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)vbuf, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // input total, switched from MiB to GiB once the value reaches 1024
  const char *formatTotalMb = "%7.2f MiB";
  const char *formatTotalGb = "%7.2f GiB";
  if (pe->procsTotal < 1024) {
    snprintf(buf, tListLen(buf), formatTotalMb, pe->procsTotal);
  } else {
    snprintf(buf, tListLen(buf), formatTotalGb, pe->procsTotal / 1024);
  }

  memset(vbuf, 0, tListLen(vbuf));
  STR_TO_VARSTR(vbuf, buf);

  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)vbuf, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // process throughput, switched from KiB/s to MiB/s once the value reaches 1024
  const char *formatKb = "%7.2f KiB/s";
  const char *formatMb = "%7.2f MiB/s";
  if (pe->procsThroughput < 1024) {
    snprintf(buf, tListLen(buf), formatKb, pe->procsThroughput);
  } else {
    snprintf(buf, tListLen(buf), formatMb, pe->procsThroughput / 1024);
  }

  memset(vbuf, 0, tListLen(vbuf));
  STR_TO_VARSTR(vbuf, buf);

  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)vbuf, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // output total, NULL for sink tasks
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  if (pTask->info.taskLevel == TASK_LEVEL__SINK) {
    colDataSetNULL(pColInfo, numOfRows);
  } else {
    (void)tsnprintf(buf, sizeof(buf), formatTotalMb, pe->outputTotal);
    memset(vbuf, 0, tListLen(vbuf));
    STR_TO_VARSTR(vbuf, buf);

    code = colDataSetVal(pColInfo, numOfRows, (const char *)vbuf, false);
    TSDB_CHECK_CODE(code, lino, _end);
  }

  // output throughput, NULL for sink tasks
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  if (pTask->info.taskLevel == TASK_LEVEL__SINK) {
    colDataSetNULL(pColInfo, numOfRows);
  } else {
    if (pe->outputThroughput < 1024) {
      snprintf(buf, tListLen(buf), formatKb, pe->outputThroughput);
    } else {
      snprintf(buf, tListLen(buf), formatMb, pe->outputThroughput / 1024);
    }

    memset(vbuf, 0, tListLen(vbuf));
    STR_TO_VARSTR(vbuf, buf);

    code = colDataSetVal(pColInfo, numOfRows, (const char *)vbuf, false);
    TSDB_CHECK_CODE(code, lino, _end);
  }

  // info: sink data size for sink tasks, processed window/offset for source tasks, empty for the other levels
  if (pTask->info.taskLevel == TASK_LEVEL__SINK) {
    const char *sinkStr = "%.2f MiB";
    snprintf(buf, tListLen(buf), sinkStr, pe->sinkDataSize);
  } else if (pTask->info.taskLevel == TASK_LEVEL__SOURCE) {  // offset info
    if (pTask->info.trigger == STREAM_TRIGGER_FORCE_WINDOW_CLOSE) {
      int32_t ret = taosFormatUtcTime(buf, tListLen(buf), pe->processedVer, precision);
      if (ret != 0) {
        mError("failed to format processed timewindow, skey:%" PRId64, pe->processedVer);
        memset(buf, 0, tListLen(buf));
      }
    } else {
      const char *offsetStr = "%" PRId64 " [%" PRId64 ", %" PRId64 "]";
      snprintf(buf, tListLen(buf), offsetStr, pe->processedVer, pe->verRange.minVer, pe->verRange.maxVer);
    }
  } else {
    memset(buf, 0, tListLen(buf));
  }

  STR_TO_VARSTR(vbuf, buf);

  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)vbuf, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // start_time
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)&pe->startTime, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // start id
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)&pe->startCheckpointId, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // start ver
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)&pe->startCheckpointVer, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // checkpoint time, NULL while no checkpoint time is recorded
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  if (pe->checkpointInfo.latestTime != 0) {
    code = colDataSetVal(pColInfo, numOfRows, (const char *)&pe->checkpointInfo.latestTime, false);
  } else {
    code = colDataSetVal(pColInfo, numOfRows, NULL, true);
  }
  TSDB_CHECK_CODE(code, lino, _end);

  // checkpoint_id
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)&pe->checkpointInfo.latestId, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // checkpoint version
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, (const char *)&pe->checkpointInfo.latestVer, false);
  TSDB_CHECK_CODE(code, lino, _end);

  // checkpoint size, always NULL
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  colDataSetNULL(pColInfo, numOfRows);

  // checkpoint backup status, always NULL
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, NULL, true);
  TSDB_CHECK_CODE(code, lino, _end);

  // ds_err_info, always NULL
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, NULL, true);
  TSDB_CHECK_CODE(code, lino, _end);

  // history_task_id, NULL when there is none
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  if (pe->hTaskId != 0) {
    int64ToHexStr(pe->hTaskId, idstr, tListLen(idstr));
    code = colDataSetVal(pColInfo, numOfRows, idstr, false);
  } else {
    code = colDataSetVal(pColInfo, numOfRows, NULL, true);
  }
  TSDB_CHECK_CODE(code, lino, _end);

  // history_task_status, always NULL
  pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
  TSDB_CHECK_NULL(pColInfo, code, lino, _end, terrno);

  code = colDataSetVal(pColInfo, numOfRows, NULL, true);
  TSDB_CHECK_CODE(code, lino, _end);

_end:
  if (code) {
    mError("error happens during build task attr result blocks, lino:%d, code:%s", lino, tstrerror(code));
  }
  return code;
}
1443

1444
static bool isNodeEpsetChanged(const SEpSet *pPrevEpset, const SEpSet *pCurrent) {
4,059✔
1445
  const SEp *pEp = GET_ACTIVE_EP(pPrevEpset);
4,059✔
1446
  const SEp *p = GET_ACTIVE_EP(pCurrent);
4,059✔
1447

1448
  if (pEp->port == p->port && strncmp(pEp->fqdn, p->fqdn, TSDB_FQDN_LEN) == 0) {
4,059!
1449
    return false;
4,059✔
1450
  }
1451
  return true;
×
1452
}
1453

1454
// Release the containers held by a vgroup change info. The members are reset to NULL afterwards so that calling
// this function again on the same object (error paths in this file do that) does not free them twice.
// A NULL pInfo is accepted and ignored.
void mndDestroyVgroupChangeInfo(SVgroupChangeInfo *pInfo) {
  if (pInfo == NULL) {
    return;
  }

  taosArrayDestroy(pInfo->pUpdateNodeList);
  pInfo->pUpdateNodeList = NULL;

  taosHashCleanup(pInfo->pDBMap);
  pInfo->pDBMap = NULL;
}
1,199✔
1460

1461
// 1. increase the replica does not affect the stream process.
1462
// 2. decreasing the replica may affect the stream task execution in the way that there is one or more running stream
1463
// tasks on the will be removed replica.
1464
// 3. vgroup redistribution is an combination operation of first increase replica and then decrease replica. So we
1465
// will handle it as mentioned in 1 & 2 items.
1466
int32_t mndFindChangedNodeInfo(SMnode *pMnode, const SArray *pPrevNodeList, const SArray *pNodeList,
1,199✔
1467
                               SVgroupChangeInfo *pInfo) {
1468
  int32_t code = 0;
1,199✔
1469
  int32_t lino = 0;
1,199✔
1470

1471
  if (pInfo == NULL) {
1,199!
1472
    return TSDB_CODE_INVALID_PARA;
×
1473
  }
1474

1475
  pInfo->pUpdateNodeList = taosArrayInit(4, sizeof(SNodeUpdateInfo));
1,199✔
1476
  pInfo->pDBMap = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_VARCHAR), true, HASH_NO_LOCK);
1,199✔
1477

1478
  if (pInfo->pUpdateNodeList == NULL || pInfo->pDBMap == NULL) {
1,199!
1479
    mndDestroyVgroupChangeInfo(pInfo);
×
1480
    TSDB_CHECK_NULL(NULL, code, lino, _err, terrno);
×
1481
  }
1482

1483
  int32_t numOfNodes = taosArrayGetSize(pPrevNodeList);
1,199✔
1484
  for (int32_t i = 0; i < numOfNodes; ++i) {
5,995✔
1485
    SNodeEntry *pPrevEntry = taosArrayGet(pPrevNodeList, i);
4,796✔
1486
    if (pPrevEntry == NULL) {
4,796!
1487
      continue;
×
1488
    }
1489

1490
    int32_t num = taosArrayGetSize(pNodeList);
4,796✔
1491
    for (int32_t j = 0; j < num; ++j) {
16,096✔
1492
      SNodeEntry *pCurrent = taosArrayGet(pNodeList, j);
15,378✔
1493
      if (pCurrent == NULL) {
15,378!
1494
        continue;
×
1495
      }
1496

1497
      if (pCurrent->nodeId == pPrevEntry->nodeId) {
15,378✔
1498
        if (pPrevEntry->stageUpdated || isNodeEpsetChanged(&pPrevEntry->epset, &pCurrent->epset)) {
4,078!
1499
          const SEp *pPrevEp = GET_ACTIVE_EP(&pPrevEntry->epset);
19✔
1500

1501
          char buf[256] = {0};
19✔
1502
          code = epsetToStr(&pCurrent->epset, buf, tListLen(buf));  // ignore this error
19✔
1503
          if (code) {
19!
1504
            mError("failed to convert epset string, code:%s", tstrerror(code));
×
1505
            TSDB_CHECK_CODE(code, lino, _err);
×
1506
          }
1507

1508
          mDebug("nodeId:%d restart/epset changed detected, old:%s:%d -> new:%s, stageUpdate:%d", pCurrent->nodeId,
19✔
1509
                 pPrevEp->fqdn, pPrevEp->port, buf, pPrevEntry->stageUpdated);
1510

1511
          SNodeUpdateInfo updateInfo = {.nodeId = pPrevEntry->nodeId};
19✔
1512
          epsetAssign(&updateInfo.prevEp, &pPrevEntry->epset);
19✔
1513
          epsetAssign(&updateInfo.newEp, &pCurrent->epset);
19✔
1514

1515
          void *p = taosArrayPush(pInfo->pUpdateNodeList, &updateInfo);
19✔
1516
          TSDB_CHECK_NULL(p, code, lino, _err, terrno);
19!
1517
        }
1518

1519
        // todo handle the snode info
1520
        if (pCurrent->nodeId != SNODE_HANDLE) {
4,078✔
1521
          SVgObj *pVgroup = mndAcquireVgroup(pMnode, pCurrent->nodeId);
3,907✔
1522
          code = taosHashPut(pInfo->pDBMap, pVgroup->dbName, strlen(pVgroup->dbName), NULL, 0);
3,907✔
1523
          mndReleaseVgroup(pMnode, pVgroup);
3,907✔
1524
          TSDB_CHECK_CODE(code, lino, _err);
3,907!
1525
        }
1526

1527
        break;
4,078✔
1528
      }
1529
    }
1530
  }
1531

1532
  return code;
1,199✔
1533

1534
_err:
×
1535
  mError("failed to find node change info, code:%s at %s line:%d", tstrerror(code), __func__, lino);
×
1536
  mndDestroyVgroupChangeInfo(pInfo);
×
1537
  return code;
×
1538
}
1539

1540
/**
 * Decide whether the stream nodes tracked in execInfo have been updated.
 *
 * The visible caller (mndStreamNodeIsUpdated) invokes this while holding
 * execInfo.lock.
 *
 * @param pMnode          mnode handle forwarded to the helper routines
 * @param ppNodeSnapshot  receives the vgroup snapshot produced by
 *                        mndTakeVgroupSnapshot(); this function never frees it
 *                        (the visible caller destroys it afterwards)
 * @return a boolean carried in an int32_t:
 *         - false when extractStreamNodeList() reports zero nodes (execInfo.ts
 *           is refreshed in that case),
 *         - true when any node entry has stageUpdated set,
 *         - true when the snapshot reports that not all vnodes are ready,
 *         - otherwise whether mndFindChangedNodeInfo() produced at least one
 *           update entry (false if that call fails).
 */
static int32_t doCheckForUpdated(SMnode *pMnode, SArray **ppNodeSnapshot) {
  int32_t nodeCount = extractStreamNodeList(pMnode);
  if (nodeCount == 0) {
    mDebug("stream task node change checking done, no vgroups exist, do nothing");
    execInfo.ts = taosGetTimestampSec();
    return false;
  }

  // a pending stage update on any known node is enough to report "updated"
  for (int32_t idx = 0; idx < nodeCount; ++idx) {
    SNodeEntry *pEntry = taosArrayGet(execInfo.pNodeList, idx);
    if (pEntry != NULL && pEntry->stageUpdated) {
      mDebug("stream task not ready due to node update detected, checkpoint not issued");
      return true;
    }
  }

  // a snapshot failure is only logged; the readiness flag decides what happens next
  bool vnodesReady = false;
  if (mndTakeVgroupSnapshot(pMnode, &vnodesReady, ppNodeSnapshot) != 0) {
    mError("failed to get the vgroup snapshot, ignore it and continue");
  }

  if (!vnodesReady) {
    mWarn("not all vnodes ready, quit from vnodes status check");
    return true;
  }

  SVgroupChangeInfo info = {0};
  bool              hasChange = false;

  if (mndFindChangedNodeInfo(pMnode, execInfo.pNodeList, *ppNodeSnapshot, &info) == 0) {
    hasChange = (taosArrayGetSize(info.pUpdateNodeList) > 0);
    if (hasChange) {
      mDebug("stream tasks not ready due to node update");
    }
  }

  // NOTE(review): the _err path of mndFindChangedNodeInfo() already calls
  // mndDestroyVgroupChangeInfo() on this struct; confirm that a second call
  // here is harmless after a failure.
  mndDestroyVgroupChangeInfo(&info);
  return hasChange;
}
1588

1589
// check if the node update happens or not
1590
bool mndStreamNodeIsUpdated(SMnode *pMnode) {
1,350✔
1591
  SArray *pNodeSnapshot = NULL;
1,350✔
1592

1593
  streamMutexLock(&execInfo.lock);
1,350✔
1594
  bool updated = doCheckForUpdated(pMnode, &pNodeSnapshot);
1,350✔
1595
  streamMutexUnlock(&execInfo.lock);
1,350✔
1596

1597
  taosArrayDestroy(pNodeSnapshot);
1,350✔
1598
  return updated;
1,350✔
1599
}
1600

1601
/**
 * Check the snode precondition for the given source database.
 *
 * When the database's replications setting is 1, no check is performed.
 * Otherwise at least one SDB_SNODE object must be fetchable from the sdb.
 *
 * @param pMnode  mnode handle; its pSdb is queried for snode objects
 * @param pSrcDb  source database whose cfg.replications is inspected
 * @return TSDB_CODE_SUCCESS when replications is 1 or an snode object is
 *         found; TSDB_CODE_SNODE_NOT_DEPLOYED otherwise
 */
int32_t mndCheckForSnode(SMnode *pMnode, SDbObj *pSrcDb) {
  SSdb *pStore = pMnode->pSdb;

  if (pSrcDb->cfg.replications == 1) {
    return TSDB_CODE_SUCCESS;
  }

  // only existence matters, so a single fetch is sufficient
  SSnodeObj *pSnode = NULL;
  void      *pCursor = sdbFetch(pStore, SDB_SNODE, NULL, (void **)&pSnode);
  if (pCursor != NULL) {
    sdbRelease(pStore, pSnode);
    sdbCancelFetch(pStore, pCursor);
    return TSDB_CODE_SUCCESS;
  }

  mError("snode not existed when trying to create stream in db with multiple replica");
  return TSDB_CODE_SNODE_NOT_DEPLOYED;
}
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc