• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #3566

25 Dec 2024 06:56AM UTC coverage: 62.422% (+11.3%) from 51.098%
#3566

push

travis-ci

web-flow
Merge pull request #29314 from taosdata/fix/TD-33275.2

fix: add more UT cases

138034 of 284473 branches covered (48.52%)

Branch coverage included in aggregate %.

215318 of 281594 relevant lines covered (76.46%)

9007186.78 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

69.57
/source/dnode/mnode/impl/src/mndSubscribe.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15

16
#define _DEFAULT_SOURCE
17
#include "mndSubscribe.h"
18
#include "mndConsumer.h"
19
#include "mndScheduler.h"
20
#include "mndShow.h"
21
#include "mndTopic.h"
22
#include "mndTrans.h"
23
#include "mndVgroup.h"
24
#include "tcompare.h"
25
#include "tname.h"
26

27
#define MND_SUBSCRIBE_VER_NUMBER   3
28
#define MND_SUBSCRIBE_RESERVE_SIZE 64
29

30
//#define MND_CONSUMER_LOST_HB_CNT          6
31

32
static int32_t mqRebInExecCnt = 0;
33

34
static SSdbRaw *mndSubActionEncode(SMqSubscribeObj *);
35
static SSdbRow *mndSubActionDecode(SSdbRaw *pRaw);
36
static int32_t  mndSubActionInsert(SSdb *pSdb, SMqSubscribeObj *);
37
static int32_t  mndSubActionDelete(SSdb *pSdb, SMqSubscribeObj *);
38
static int32_t  mndSubActionUpdate(SSdb *pSdb, SMqSubscribeObj *pOldSub, SMqSubscribeObj *pNewSub);
39
static int32_t  mndProcessRebalanceReq(SRpcMsg *pMsg);
40
static int32_t  mndProcessDropCgroupReq(SRpcMsg *pMsg);
41
static int32_t  mndRetrieveSubscribe(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows);
42
static void     mndCancelGetNextSubscribe(SMnode *pMnode, void *pIter);
43
static int32_t  mndCheckConsumer(SRpcMsg *pMsg, SHashObj *hash);
44

45
// Encode the subscription object and append it to the transaction as a
// commit log, then mark the raw row as SDB_STATUS_READY.
//
// Returns TSDB_CODE_INVALID_PARA when an argument is NULL, otherwise the
// result of the last step that ran. If appending fails, the raw row is freed
// here.
static int32_t mndSetSubCommitLogs(STrans *pTrans, SMqSubscribeObj *pSub) {
  if (pTrans == NULL || pSub == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t  code = 0;
  SSdbRaw *pRaw = mndSubActionEncode(pSub);
  MND_TMQ_NULL_CHECK(pRaw);

  code = mndTransAppendCommitlog(pTrans, pRaw);
  if (code == 0) {
    code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
  } else {
    sdbFreeRaw(pRaw);
  }

END:
  return code;
}
62

63
// Register the subscribe module with the mnode: the SDB table callbacks for
// SDB_SUBSCRIBE rows, the message handlers for rebalance / drop-cgroup
// traffic, and the "show subscriptions" retrieve and iterator-free handlers.
//
// Returns TSDB_CODE_INVALID_PARA when pMnode is NULL, otherwise the result of
// sdbSetTable().
int32_t mndInitSubscribe(SMnode *pMnode) {
  SSdbTable table = {
      .sdbType = SDB_SUBSCRIBE,
      .keyType = SDB_KEY_BINARY,
      .encodeFp = (SdbEncodeFp)mndSubActionEncode,
      .decodeFp = (SdbDecodeFp)mndSubActionDecode,
      .insertFp = (SdbInsertFp)mndSubActionInsert,
      .updateFp = (SdbUpdateFp)mndSubActionUpdate,
      .deleteFp = (SdbDeleteFp)mndSubActionDelete,
  };

  if (pMnode == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  mndSetMsgHandle(pMnode, TDMT_VND_TMQ_SUBSCRIBE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_TMQ_DELETE_SUB_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_MND_TMQ_TIMER, mndProcessRebalanceReq);
  mndSetMsgHandle(pMnode, TDMT_MND_TMQ_DROP_CGROUP, mndProcessDropCgroupReq);
  mndSetMsgHandle(pMnode, TDMT_MND_TMQ_DROP_CGROUP_RSP, mndTransProcessRsp);

  // Both show handlers must be registered under the same table id. The
  // iterator-free handler was previously registered under
  // TSDB_MGMT_TABLE_TOPICS, which left the subscriptions table without one.
  // NOTE(review): that registration presumably also competed with the topic
  // module's own handler for the TOPICS slot - confirm against mndTopic.c.
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_SUBSCRIPTIONS, mndRetrieveSubscribe);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_SUBSCRIPTIONS, mndCancelGetNextSubscribe);

  return sdbSetTable(pMnode->pSdb, table);
}
88

89
// Create a new subscription object for subKey, copy the topic's identity
// fields (dbUid, stbUid, subType, withMeta) into it and initialise its
// endpoints through mndSchedInitSubEp().
//
// On success *pSub holds the new object and 0 is returned. On failure the
// partially built object is destroyed and *pSub is set to NULL, so the caller
// can never free it a second time.
static int32_t mndCreateSubscription(SMnode *pMnode, const SMqTopicObj *pTopic, const char *subKey, SMqSubscribeObj** pSub) {
  if(pMnode == NULL || pTopic == NULL || subKey == NULL || pSub == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  int32_t code = 0;

  // Start from a known state so the cleanup path never touches a stale or
  // uninitialised pointer if object creation itself fails.
  *pSub = NULL;
  MND_TMQ_RETURN_CHECK(tNewSubscribeObj(subKey, pSub));
  (*pSub)->dbUid = pTopic->dbUid;
  (*pSub)->stbUid = pTopic->stbUid;
  (*pSub)->subType = pTopic->subType;
  (*pSub)->withMeta = pTopic->withMeta;

  MND_TMQ_RETURN_CHECK(mndSchedInitSubEp(pMnode, pTopic, *pSub));
  return code;

END:
  tDeleteSubscribeObj(*pSub);
  taosMemoryFree(*pSub);
  *pSub = NULL;  // do not hand a dangling pointer back to the caller
  return code;
}
108

109
static int32_t mndBuildSubChangeReq(void **pBuf, int32_t *pLen, SMqSubscribeObj *pSub, const SMqRebOutputVg *pRebVg,
2,555✔
110
                                    SSubplan *pPlan) {
111
  if (pSub == NULL || pRebVg == NULL || pBuf == NULL || pLen == NULL) {
2,555!
112
    return TSDB_CODE_INVALID_PARA;
×
113
  }
114
  SMqRebVgReq req = {0};
2,555✔
115
  int32_t     code = 0;
2,555✔
116
  SEncoder encoder = {0};
2,555✔
117

118
  req.oldConsumerId = pRebVg->oldConsumerId;
2,555✔
119
  req.newConsumerId = pRebVg->newConsumerId;
2,555✔
120
  req.vgId = pRebVg->pVgEp->vgId;
2,555✔
121
  if (pPlan) {
2,555✔
122
    pPlan->execNode.epSet = pRebVg->pVgEp->epSet;
2,112✔
123
    pPlan->execNode.nodeId = pRebVg->pVgEp->vgId;
2,112✔
124
    int32_t msgLen = 0;
2,112✔
125
    MND_TMQ_RETURN_CHECK(qSubPlanToString(pPlan, &req.qmsg, &msgLen));
2,112!
126
  } else {
127
    req.qmsg = taosStrdup("");
443!
128
    MND_TMQ_NULL_CHECK(req.qmsg);
443!
129
  }
130
  req.subType = pSub->subType;
2,555✔
131
  req.withMeta = pSub->withMeta;
2,555✔
132
  req.suid = pSub->stbUid;
2,555✔
133
  tstrncpy(req.subKey, pSub->key, TSDB_SUBSCRIBE_KEY_LEN);
2,555✔
134

135
  int32_t tlen = 0;
2,555✔
136
  tEncodeSize(tEncodeSMqRebVgReq, &req, tlen, code);
2,555!
137
  if (code < 0) {
2,555!
138
    goto END;
×
139
  }
140

141
  tlen += sizeof(SMsgHead);
2,555✔
142
  void *buf = taosMemoryMalloc(tlen);
2,555!
143
  MND_TMQ_NULL_CHECK(buf);
2,555!
144
  SMsgHead *pMsgHead = (SMsgHead *)buf;
2,555✔
145
  pMsgHead->contLen = htonl(tlen);
2,555✔
146
  pMsgHead->vgId = htonl(pRebVg->pVgEp->vgId);
2,555✔
147

148
  tEncoderInit(&encoder, POINTER_SHIFT(buf, sizeof(SMsgHead)), tlen);
2,555✔
149
  MND_TMQ_RETURN_CHECK(tEncodeSMqRebVgReq(&encoder, &req));
2,555!
150
  *pBuf = buf;
2,555✔
151
  *pLen = tlen;
2,555✔
152

153
END:
2,555✔
154
  tEncoderClear(&encoder);
2,555✔
155
  taosMemoryFree(req.qmsg);
2,555!
156
  return code;
2,555✔
157
}
158

159
static int32_t mndPersistSubChangeVgReq(SMnode *pMnode, STrans *pTrans, SMqSubscribeObj *pSub,
2,557✔
160
                                        const SMqRebOutputVg *pRebVg, SSubplan *pPlan) {
161
  if (pMnode == NULL || pTrans == NULL || pSub == NULL || pRebVg == NULL) {
2,557!
162
    return TSDB_CODE_INVALID_PARA;
×
163
  }
164
  int32_t code = 0;
2,557✔
165
  void   *buf  = NULL;
2,557✔
166

167
  if (pRebVg->oldConsumerId == pRebVg->newConsumerId) {
2,557✔
168
    if (pRebVg->oldConsumerId == -1) return 0;  // drop stream, no consumer, while split vnode,all consumerId is -1
2!
169
    code = TSDB_CODE_MND_INVALID_SUB_OPTION;
×
170
    goto END;
×
171
  }
172

173
  int32_t tlen = 0;
2,555✔
174
  MND_TMQ_RETURN_CHECK(mndBuildSubChangeReq(&buf, &tlen, pSub, pRebVg, pPlan));
2,555!
175
  int32_t vgId = pRebVg->pVgEp->vgId;
2,555✔
176
  SVgObj *pVgObj = mndAcquireVgroup(pMnode, vgId);
2,555✔
177
  if (pVgObj == NULL) {
2,555!
178
    code = TSDB_CODE_MND_VGROUP_NOT_EXIST;
×
179
    goto END;
×
180
  }
181

182
  STransAction action = {0};
2,555✔
183
  action.epSet = mndGetVgroupEpset(pMnode, pVgObj);
2,555✔
184
  action.pCont = buf;
2,555✔
185
  action.contLen = tlen;
2,555✔
186
  action.msgType = TDMT_VND_TMQ_SUBSCRIBE;
2,555✔
187

188
  mndReleaseVgroup(pMnode, pVgObj);
2,555✔
189
  MND_TMQ_RETURN_CHECK(mndTransAppendRedoAction(pTrans, &action));
2,555!
190
  return code;
2,555✔
191

192
END:
×
193
  taosMemoryFree(buf);
×
194
  return code;
×
195
}
196

197
static void mndSplitSubscribeKey(const char *key, char *topic, char *cgroup, bool fullName) {
4,110✔
198
  if (key == NULL || topic == NULL || cgroup == NULL) {
4,110!
199
    return;
×
200
  }
201
  int32_t i = 0;
4,110✔
202
  while (key[i] != TMQ_SEPARATOR_CHAR) {
34,992✔
203
    i++;
30,882✔
204
  }
205
  (void)memcpy(cgroup, key, i);
4,110✔
206
  cgroup[i] = 0;
4,110✔
207
  if (fullName) {
4,110✔
208
    tstrncpy(topic, &key[i + 1], TSDB_TOPIC_FNAME_LEN);
3,241✔
209
  } else {
210
    while (key[i] != '.') {
2,607✔
211
      i++;
1,738✔
212
    }
213
    tstrncpy(topic, &key[i + 1], TSDB_CGROUP_LEN);
869✔
214
  }
215
}
216

217
// Look up the rebalance info stored under key in pHash, creating and
// inserting a fresh one when it does not exist yet.
//
// pReb  optional; when non-NULL it receives a pointer to the entry stored
//       inside the hash table (not a copy) on success.
//
// Returns 0 on success, terrno when allocation fails, or the taosHashPut()
// error. If the insert fails, the new item's consumer arrays are destroyed
// here because the hash never took over the copied struct.
static int32_t mndGetOrCreateRebSub(SHashObj *pHash, const char *key, SMqRebInfo **pReb) {
  if (pHash == NULL || key == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  int32_t     code = 0;
  size_t      keyLen = strlen(key) + 1;  // key is stored including its terminator
  SMqRebInfo *pRebInfo = taosHashGet(pHash, key, keyLen);
  if (pRebInfo == NULL) {
    pRebInfo = tNewSMqRebSubscribe(key);
    if (pRebInfo == NULL) {
      code = terrno;
      goto END;
    }
    code = taosHashPut(pHash, key, keyLen, pRebInfo, sizeof(SMqRebInfo));
    if (code != 0) {
      // The struct was not copied into the hash, so its arrays are still
      // owned by this temporary and must be released with it.
      taosArrayDestroy(pRebInfo->newConsumers);
      taosArrayDestroy(pRebInfo->removedConsumers);
    }
    // The temporary wrapper is always freed: on success the hash holds its
    // own copy of the struct.
    taosMemoryFreeClear(pRebInfo);
    if (code != 0) {
      goto END;
    }
    pRebInfo = taosHashGet(pHash, key, keyLen);
    MND_TMQ_NULL_CHECK(pRebInfo);
  }
  if (pReb){
    *pReb = pRebInfo;
  }

END:
  return code;
}
244

245
// Pop the last vgroup endpoint from vgs and record it in pHash, keyed by its
// vgId, as a pending rebalance entry.
//
// consumerId  stored as the first field of the entry; the second field is
//             initialised to -1 (presumably "no new consumer yet" - the
//             assignment pass fills it in later).
// key         subscribe key, used for logging only.
static int32_t pushVgDataToHash(SArray *vgs, SHashObj *pHash, int64_t consumerId, char *key) {
  if (vgs == NULL || pHash == NULL || key == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t   code = 0;
  SMqVgEp **ppPopped = (SMqVgEp **)taosArrayPop(vgs);
  MND_TMQ_NULL_CHECK(ppPopped);

  SMqVgEp       *pEp = *ppPopped;
  SMqRebOutputVg entry = {consumerId, -1, pEp};
  MND_TMQ_RETURN_CHECK(taosHashPut(pHash, &pEp->vgId, sizeof(int32_t), &entry, sizeof(SMqRebOutputVg)));
  mInfo("[rebalance] sub:%s mq rebalance remove vgId:%d from consumer:0x%" PRIx64, key, pEp->vgId, consumerId);

END:
  return code;
}
258

259
// Detach every consumer listed in pInput->pRebInfo->removedConsumers from the
// output subscription.
//
// For each removed consumer still present in the subscription's consumer
// hash, all of its vgroups are moved into pHash (pending reassignment), its
// vg array is destroyed, the consumer is removed from the hash and its id is
// appended to pOutput->removedConsumers. Consumers that are not found are
// skipped; a mismatch between requested and actual removals is logged.
static int32_t processRemovedConsumers(SMqRebOutputObj *pOutput, SHashObj *pHash, const SMqRebInputObj *pInput) {
  if (pHash == NULL || pOutput == NULL || pInput == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t code = 0;
  int32_t removedCnt = 0;
  int32_t requestedCnt = taosArrayGetSize(pInput->pRebInfo->removedConsumers);

  for (int32_t idx = 0; idx < requestedCnt; idx++) {
    int64_t *pId = (int64_t *)taosArrayGet(pInput->pRebInfo->removedConsumers, idx);
    MND_TMQ_NULL_CHECK(pId);

    SMqConsumerEp *pEp = taosHashGet(pOutput->pSub->consumerHash, pId, sizeof(int64_t));
    if (pEp != NULL) {
      // Each call pops one vgroup, so the count is taken once up front.
      int32_t vgCnt = taosArrayGetSize(pEp->vgs);
      for (int32_t n = 0; n < vgCnt; n++) {
        MND_TMQ_RETURN_CHECK(pushVgDataToHash(pEp->vgs, pHash, *pId, pOutput->pSub->key));
      }

      taosArrayDestroy(pEp->vgs);
      MND_TMQ_RETURN_CHECK(taosHashRemove(pOutput->pSub->consumerHash, pId, sizeof(int64_t)));
      MND_TMQ_NULL_CHECK(taosArrayPush(pOutput->removedConsumers, pId));
      removedCnt++;
    }
  }

  if (requestedCnt == removedCnt) {
    mInfo("[rebalance] sub:%s removed %d consumers", pOutput->pSub->key, requestedCnt);
  } else {
    mError("[rebalance] sub:%s mq rebalance removedNum:%d not matched with actual:%d", pOutput->pSub->key, requestedCnt,
           removedCnt);
  }

END:
  return code;
}
294

295
// Add every consumer listed in pInput->pRebInfo->newConsumers to the output
// subscription with an empty vgroup list, and record its id in
// pOutput->newConsumers.
//
// Returns 0 on success or the first error encountered. If inserting the
// consumer into the hash fails, the freshly created vg array is destroyed so
// it does not leak.
static int32_t processNewConsumers(SMqRebOutputObj *pOutput, const SMqRebInputObj *pInput) {
  if (pOutput == NULL || pInput == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  int32_t code = 0;
  int32_t numOfNewConsumers = taosArrayGetSize(pInput->pRebInfo->newConsumers);

  for (int32_t i = 0; i < numOfNewConsumers; i++) {
    int64_t* consumerId = (int64_t *)taosArrayGet(pInput->pRebInfo->newConsumers, i);
    MND_TMQ_NULL_CHECK(consumerId);
    SMqConsumerEp newConsumerEp = {0};
    newConsumerEp.consumerId = *consumerId;
    newConsumerEp.vgs = taosArrayInit(0, sizeof(void *));
    MND_TMQ_NULL_CHECK(newConsumerEp.vgs);

    code = taosHashPut(pOutput->pSub->consumerHash, consumerId, sizeof(int64_t), &newConsumerEp, sizeof(SMqConsumerEp));
    if (code != 0) {
      // The hash did not take the struct, so the array is still ours to free.
      taosArrayDestroy(newConsumerEp.vgs);
      goto END;
    }
    MND_TMQ_NULL_CHECK(taosArrayPush(pOutput->newConsumers, consumerId));
    mInfo("[rebalance] sub:%s mq rebalance add new consumer:0x%" PRIx64, pOutput->pSub->key, *consumerId);
  }
END:
  return code;
}
316

317
// Move every vgroup currently in pOutput->pSub->unassignedVgs into pHash as a
// pending rebalance entry whose previous consumer id is -1.
static int32_t processUnassignedVgroups(SMqRebOutputObj *pOutput, SHashObj *pHash) {
  if (pOutput == NULL || pHash == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t code = 0;
  // Each call pops one element, so the initial size is the iteration count.
  int32_t remaining = taosArrayGetSize(pOutput->pSub->unassignedVgs);
  while (remaining > 0) {
    MND_TMQ_RETURN_CHECK(pushVgDataToHash(pOutput->pSub->unassignedVgs, pHash, -1, pOutput->pSub->key));
    remaining--;
  }

END:
  return code;
}
329

330
// Trim consumers that hold more vgroups than their fair share.
//
// Every consumer in the output subscription is appended to
// pOutput->modifyConsumers. A consumer holding more than minVgCnt vgroups
// gives the surplus back to pHash: the first remainderVgCnt such consumers
// keep minVgCnt + 1 vgroups, the rest are cut down to minVgCnt.
//
// Returns 0 on success or the first error. On error the in-progress hash
// iteration is cancelled before returning.
static int32_t processModifiedConsumers(SMqRebOutputObj *pOutput, SHashObj *pHash, int32_t minVgCnt,
                                     int32_t remainderVgCnt) {
  if (pOutput == NULL || pHash == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  int32_t code = 0;
  int32_t cnt = 0;
  void   *pIter = NULL;

  while (1) {
    pIter = taosHashIterate(pOutput->pSub->consumerHash, pIter);
    if (pIter == NULL) {
      break;
    }

    SMqConsumerEp *pConsumerEp = (SMqConsumerEp *)pIter;
    int32_t        consumerVgNum = taosArrayGetSize(pConsumerEp->vgs);

    MND_TMQ_NULL_CHECK(taosArrayPush(pOutput->modifyConsumers, &pConsumerEp->consumerId));
    if (consumerVgNum > minVgCnt) {
      if (cnt < remainderVgCnt) {
        while (taosArrayGetSize(pConsumerEp->vgs) > minVgCnt + 1) {  // pop until equal minVg + 1
          MND_TMQ_RETURN_CHECK(pushVgDataToHash(pConsumerEp->vgs, pHash, pConsumerEp->consumerId, pOutput->pSub->key));
        }
        cnt++;
      } else {
        while (taosArrayGetSize(pConsumerEp->vgs) > minVgCnt) {
          MND_TMQ_RETURN_CHECK(pushVgDataToHash(pConsumerEp->vgs, pHash, pConsumerEp->consumerId, pOutput->pSub->key));
        }
      }
    }
  }
END:
  // pIter is non-NULL only when the loop was left through an error jump.
  if (pIter != NULL) {
    taosHashCancelIterate(pOutput->pSub->consumerHash, pIter);
  }
  return code;
}
365

366
// Reconcile the subscription's vgroup set with the vgroups that currently
// exist in its database.
//
//  1. Collect an SMqVgEp for every vgroup in SDB that belongs to
//     pOutput->pSub->dbUid.
//  2. For every vgroup held by a consumer: if it still exists, drop the
//     duplicate from the collected list; if not, delete it from the consumer.
//  3. What remains in the collected list are new vgroups. They are appended
//     to unassignedVgs only when unassignedVgs is currently empty; otherwise
//     they are discarded.
//
// Returns the number of vgroups found in the database on success, or an
// error code on failure (the caller treats negative values as errors).
static int32_t processRemoveAddVgs(SMnode *pMnode, SMqRebOutputObj *pOutput) {
  if (pMnode == NULL || pOutput == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  int32_t  code = 0;
  int32_t  totalVgNum = 0;
  SVgObj  *pVgroup = NULL;
  SMqVgEp *pVgEp = NULL;
  void    *pIter = NULL;      // SDB vgroup iterator
  void    *pHashIter = NULL;  // consumer hash iterator
  SArray  *newVgs = taosArrayInit(0, POINTER_BYTES);
  MND_TMQ_NULL_CHECK(newVgs);
  while (1) {
    pIter = sdbFetch(pMnode->pSdb, SDB_VGROUP, pIter, (void **)&pVgroup);
    if (pIter == NULL) {
      break;
    }

    if (!mndVgroupInDb(pVgroup, pOutput->pSub->dbUid)) {
      sdbRelease(pMnode->pSdb, pVgroup);
      pVgroup = NULL;
      continue;
    }

    totalVgNum++;
    pVgEp = taosMemoryMalloc(sizeof(SMqVgEp));
    MND_TMQ_NULL_CHECK(pVgEp);
    pVgEp->epSet = mndGetVgroupEpset(pMnode, pVgroup);
    pVgEp->vgId = pVgroup->vgId;
    MND_TMQ_NULL_CHECK(taosArrayPush(newVgs, &pVgEp));
    pVgEp = NULL;  // now owned by newVgs
    sdbRelease(pMnode->pSdb, pVgroup);
    // Drop the reference so the END path can never release this row twice.
    pVgroup = NULL;
  }

  while (1) {
    pHashIter = taosHashIterate(pOutput->pSub->consumerHash, pHashIter);
    if (pHashIter == NULL) break;
    SMqConsumerEp *pConsumerEp = (SMqConsumerEp *)pHashIter;
    int32_t j = 0;
    while (j < taosArrayGetSize(pConsumerEp->vgs)) {
      SMqVgEp *pVgEpTmp = taosArrayGetP(pConsumerEp->vgs, j);
      MND_TMQ_NULL_CHECK(pVgEpTmp);
      bool     find = false;
      for (int32_t k = 0; k < taosArrayGetSize(newVgs); k++) {
        SMqVgEp *pnewVgEp = taosArrayGetP(newVgs, k);
        MND_TMQ_NULL_CHECK(pnewVgEp);
        if (pVgEpTmp->vgId == pnewVgEp->vgId) {
          // Already assigned to this consumer: the freshly built copy is
          // redundant.
          tDeleteSMqVgEp(pnewVgEp);
          taosArrayRemove(newVgs, k);
          find = true;
          break;
        }
      }
      if (!find) {
        // The vgroup no longer exists in the database; j is not advanced
        // because the removal shifts the next element into slot j.
        mInfo("[rebalance] processRemoveAddVgs old vgId:%d", pVgEpTmp->vgId);
        tDeleteSMqVgEp(pVgEpTmp);
        taosArrayRemove(pConsumerEp->vgs, j);
        continue;
      }
      j++;
    }
  }

  if (taosArrayGetSize(pOutput->pSub->unassignedVgs) == 0 && taosArrayGetSize(newVgs) != 0) {
    MND_TMQ_NULL_CHECK(taosArrayAddAll(pOutput->pSub->unassignedVgs, newVgs));
    mInfo("[rebalance] processRemoveAddVgs add new vg num:%d", (int)taosArrayGetSize(newVgs));
    taosArrayDestroy(newVgs);  // elements now belong to unassignedVgs
  } else {
    taosArrayDestroyP(newVgs, (FDelete)tDeleteSMqVgEp);
  }
  return totalVgNum;

END:
  // NOTE(review): an error inside the first loop leaves the SDB iterator
  // (pIter) open; it presumably needs the SDB cancel-fetch call - confirm
  // against the sdb API before adding it.
  if (pHashIter != NULL) {
    taosHashCancelIterate(pOutput->pSub->consumerHash, pHashIter);
  }
  sdbRelease(pMnode->pSdb, pVgroup);
  taosMemoryFree(pVgEp);
  taosArrayDestroyP(newVgs, (FDelete)tDeleteSMqVgEp);
  return code;
}
443

444
// Merge the per-consumer offset rows of the currently stored subscription
// into pOutput->pSub->offsetRows.
//
// For every offset row of every consumer in the stored subscription:
//  - it is skipped when the same consumer still owns that vgroup in the
//    output subscription (nothing changed for it);
//  - otherwise it is merged into the output's offsetRows: rows are summed and
//    offset/ever overwritten when the vgId already exists, else the row is
//    appended.
//
// Returns 0 when the stored subscription cannot be acquired (nothing to
// merge) or on success; otherwise the first error. The read latch, the
// subscription reference and any open hash iteration are released on every
// path after acquisition.
static int32_t processSubOffsetRows(SMnode *pMnode, const SMqRebInputObj *pInput, SMqRebOutputObj *pOutput) {
  if (pMnode == NULL || pInput == NULL || pOutput == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  SMqSubscribeObj *pSub = NULL;
  void            *pIter = NULL;
  int32_t          code = mndAcquireSubscribeByKey(pMnode, pInput->pRebInfo->key, &pSub);  // put all offset rows
  if( code != 0){
    return 0;
  }
  taosRLockLatch(&pSub->lock);
  if (pOutput->pSub->offsetRows == NULL) {
    pOutput->pSub->offsetRows = taosArrayInit(4, sizeof(OffsetRows));
    if(pOutput->pSub->offsetRows == NULL) {
      code = terrno;
      goto END;
    }
  }
  while (1) {
    pIter = taosHashIterate(pSub->consumerHash, pIter);
    if (pIter == NULL) break;
    SMqConsumerEp *pConsumerEp = (SMqConsumerEp *)pIter;
    SMqConsumerEp *pConsumerEpNew = taosHashGet(pOutput->pSub->consumerHash, &pConsumerEp->consumerId, sizeof(int64_t));

    for (int j = 0; j < taosArrayGetSize(pConsumerEp->offsetRows); j++) {
      OffsetRows *d1 = taosArrayGet(pConsumerEp->offsetRows, j);
      MND_TMQ_NULL_CHECK(d1);
      bool        jump = false;
      for (int i = 0; pConsumerEpNew && i < taosArrayGetSize(pConsumerEpNew->vgs); i++) {
        SMqVgEp *pVgEp = taosArrayGetP(pConsumerEpNew->vgs, i);
        MND_TMQ_NULL_CHECK(pVgEp);
        if (pVgEp->vgId == d1->vgId) {
          jump = true;
          mInfo("pSub->offsetRows jump, because consumer id:0x%" PRIx64 " and vgId:%d not change",
                pConsumerEp->consumerId, pVgEp->vgId);
          break;
        }
      }
      if (jump) continue;
      bool find = false;
      for (int i = 0; i < taosArrayGetSize(pOutput->pSub->offsetRows); i++) {
        OffsetRows *d2 = taosArrayGet(pOutput->pSub->offsetRows, i);
        MND_TMQ_NULL_CHECK(d2);
        if (d1->vgId == d2->vgId) {
          d2->rows += d1->rows;
          d2->offset = d1->offset;
          d2->ever = d1->ever;
          find = true;
          mInfo("pSub->offsetRows add vgId:%d, after:%" PRId64 ", before:%" PRId64, d2->vgId, d2->rows, d1->rows);
          break;
        }
      }
      if (!find) {
        MND_TMQ_NULL_CHECK(taosArrayPush(pOutput->pSub->offsetRows, d1));
      }
    }
  }

END:
  // Reached only after pSub was acquired and read-locked. pIter is non-NULL
  // only when the loop above was abandoned through an error jump.
  if (pIter != NULL) {
    taosHashCancelIterate(pSub->consumerHash, pIter);
  }
  taosRUnLockLatch(&pSub->lock);
  mndReleaseSubscribe(pMnode, pSub);
  return code;
}
508

509
// Log the outcome of a rebalance: every moved vgroup with its old and new
// consumer, then the final vgroup list of every consumer. Logging only; the
// output object is not modified.
static void printRebalanceLog(SMqRebOutputObj *pOutput) {
  if (pOutput == NULL) {
    return;
  }

  const char *subKey = pOutput->pSub->key;
  mInfo("sub:%s mq rebalance calculation completed, re-balanced vg", subKey);

  int32_t movedCnt = taosArrayGetSize(pOutput->rebVgs);
  for (int32_t idx = 0; idx < movedCnt; idx++) {
    SMqRebOutputVg *pMoved = taosArrayGet(pOutput->rebVgs, idx);
    if (pMoved != NULL) {
      mInfo("sub:%s mq rebalance vgId:%d, moved from consumer:0x%" PRIx64 ", to consumer:0x%" PRIx64, subKey,
            pMoved->pVgEp->vgId, pMoved->oldConsumerId, pMoved->newConsumerId);
    }
  }

  void *pCursor = taosHashIterate(pOutput->pSub->consumerHash, NULL);
  while (pCursor != NULL) {
    SMqConsumerEp *pEp = (SMqConsumerEp *)pCursor;
    int32_t        vgCnt = taosArrayGetSize(pEp->vgs);
    mInfo("sub:%s mq rebalance final cfg: consumer:0x%" PRIx64 " has %d vg", subKey,
          pEp->consumerId, vgCnt);

    for (int32_t v = 0; v < vgCnt; v++) {
      SMqVgEp *pVg = taosArrayGetP(pEp->vgs, v);
      if (pVg != NULL) {
        mInfo("sub:%s mq rebalance final cfg: vg %d to consumer:0x%" PRIx64, subKey, pVg->vgId,
              pEp->consumerId);
      }
    }
    pCursor = taosHashIterate(pOutput->pSub->consumerHash, pCursor);
  }
}
535

536
static void calcVgroupsCnt(const SMqRebInputObj *pInput, int32_t totalVgNum, const char *pSubKey, int32_t *minVgCnt,
1,292✔
537
                           int32_t *remainderVgCnt) {
538
  if (pInput == NULL || pSubKey == NULL || minVgCnt == NULL || remainderVgCnt == NULL) {
1,292!
539
    return;
×
540
  }
541
  int32_t numOfRemoved = taosArrayGetSize(pInput->pRebInfo->removedConsumers);
1,292✔
542
  int32_t numOfAdded = taosArrayGetSize(pInput->pRebInfo->newConsumers);
1,292✔
543
  int32_t numOfFinal = pInput->oldConsumerNum + numOfAdded - numOfRemoved;
1,292✔
544

545
  // calc num
546
  if (numOfFinal != 0) {
1,292✔
547
    *minVgCnt = totalVgNum / numOfFinal;
818✔
548
    *remainderVgCnt = totalVgNum % numOfFinal;
818✔
549
  } else {
550
    mInfo("[rebalance] sub:%s no consumer subscribe this topic", pSubKey);
474!
551
  }
552
  mInfo(
1,292!
553
      "[rebalance] sub:%s mq rebalance %d vgroups, existed consumers:%d, added:%d, removed:%d, minVg:%d remainderVg:%d",
554
      pSubKey, totalVgNum, pInput->oldConsumerNum, numOfAdded, numOfRemoved, *minVgCnt, *remainderVgCnt);
555
}
556

557
// Hand the pending vgroups collected in pHash out to the consumers of the
// output subscription.
//
//  Pass 1: every consumer is filled up to minVgCnt vgroups.
//  Pass 2: consumers holding exactly minVgCnt receive one more vgroup each
//          until the pending entries are used up.
//  Pass 3: every entry of pHash is appended to pOutput->rebVgs; when the
//          subscription has no consumer at all, the vgroup is also put back
//          into unassignedVgs.
//
// A single cursor (pAssignIter) walks pHash across passes 1 and 2, so each
// pending entry is handed out at most once. Returns 0 on success,
// TSDB_CODE_PAR_INTERNAL_ERROR when pending entries are left over after pass
// 2, or the first allocation error. Any iteration still open when an error
// occurs is cancelled before returning.
static int32_t assignVgroups(SMqRebOutputObj *pOutput, SHashObj *pHash, int32_t minVgCnt) {
  if (pOutput == NULL || pHash == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  SMqRebOutputVg *pRebVg = NULL;
  void           *pAssignIter = NULL;
  void           *pIter = NULL;
  int32_t         code = 0;

  while (1) {
    pIter = taosHashIterate(pOutput->pSub->consumerHash, pIter);
    if (pIter == NULL) {
      break;
    }
    SMqConsumerEp *pConsumerEp = (SMqConsumerEp *)pIter;
    while (taosArrayGetSize(pConsumerEp->vgs) < minVgCnt) {
      pAssignIter = taosHashIterate(pHash, pAssignIter);
      if (pAssignIter == NULL) {
        mError("[rebalance] sub:%s assign iter is NULL, never should reach here", pOutput->pSub->key);
        break;
      }

      pRebVg = (SMqRebOutputVg *)pAssignIter;
      pRebVg->newConsumerId = pConsumerEp->consumerId;
      MND_TMQ_NULL_CHECK(taosArrayPush(pConsumerEp->vgs, &pRebVg->pVgEp));
      mInfo("[rebalance] mq rebalance: add vgId:%d to consumer:0x%" PRIx64 " for average", pRebVg->pVgEp->vgId,
            pConsumerEp->consumerId);
    }
  }

  while (1) {
    pIter = taosHashIterate(pOutput->pSub->consumerHash, pIter);
    if (pIter == NULL) {
      break;
    }
    SMqConsumerEp *pConsumerEp = (SMqConsumerEp *)pIter;
    if (taosArrayGetSize(pConsumerEp->vgs) == minVgCnt) {
      pAssignIter = taosHashIterate(pHash, pAssignIter);
      if (pAssignIter == NULL) {
        mInfo("[rebalance] sub:%s assign iter is used up", pOutput->pSub->key);
        break;
      }

      pRebVg = (SMqRebOutputVg *)pAssignIter;
      pRebVg->newConsumerId = pConsumerEp->consumerId;
      MND_TMQ_NULL_CHECK(taosArrayPush(pConsumerEp->vgs, &pRebVg->pVgEp));
      mInfo("[rebalance] mq rebalance: add vgId:%d to consumer:0x%" PRIx64 " for average + 1", pRebVg->pVgEp->vgId,
            pConsumerEp->consumerId);
    }
  }

  // Pass 2 may stop in the middle of the consumer hash; close that iteration
  // and forget the cursor so END does not cancel it a second time.
  taosHashCancelIterate(pOutput->pSub->consumerHash, pIter);
  pIter = NULL;
  if (pAssignIter != NULL) {
    mError("[rebalance]sub:%s assign iter is not NULL, never should reach here", pOutput->pSub->key);
    code = TSDB_CODE_PAR_INTERNAL_ERROR;
    goto END;
  }
  while (1) {
    pAssignIter = taosHashIterate(pHash, pAssignIter);
    if (pAssignIter == NULL) {
      break;
    }

    SMqRebOutputVg *pRebOutput = (SMqRebOutputVg *)pAssignIter;
    MND_TMQ_NULL_CHECK(taosArrayPush(pOutput->rebVgs, pRebOutput));
    if (taosHashGetSize(pOutput->pSub->consumerHash) == 0) {            // if all consumer is removed
      MND_TMQ_NULL_CHECK(taosArrayPush(pOutput->pSub->unassignedVgs, &pRebOutput->pVgEp));  // put all vg into unassigned
    }
  }

END:
  // On success both cursors are NULL here; they are non-NULL only when a
  // loop was left through an error jump.
  if (pIter != NULL) {
    taosHashCancelIterate(pOutput->pSub->consumerHash, pIter);
  }
  if (pAssignIter != NULL) {
    taosHashCancelIterate(pHash, pAssignIter);
  }
  return code;
}
630

631
// Run one full rebalance calculation for a subscription.
//
// Steps, in order: reconcile vgroups with the database, release the vgroups
// of removed consumers, collect unassigned vgroups, compute the per-consumer
// quota, trim over-loaded consumers, add new consumers, assign the pending
// vgroups, merge offset rows and finally log the result.
//
// Returns 0 on success, a negative value from processRemoveAddVgs(), or the
// first error of a later step. The temporary vgId -> pending-vgroup hash is
// released on every path.
static int32_t mndDoRebalance(SMnode *pMnode, const SMqRebInputObj *pInput, SMqRebOutputObj *pOutput) {
  if (pMnode == NULL || pInput == NULL || pOutput == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  int32_t     totalVgNum = processRemoveAddVgs(pMnode, pOutput);
  if (totalVgNum < 0){
    return totalVgNum;
  }
  const char *pSubKey = pOutput->pSub->key;
  int32_t     minVgCnt = 0;
  int32_t     remainderVgCnt = 0;
  int32_t     code = 0;
  SHashObj   *pHash = taosHashInit(64, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT), false, HASH_NO_LOCK);
  MND_TMQ_NULL_CHECK(pHash);
  MND_TMQ_RETURN_CHECK(processRemovedConsumers(pOutput, pHash, pInput));
  MND_TMQ_RETURN_CHECK(processUnassignedVgroups(pOutput, pHash));
  calcVgroupsCnt(pInput, totalVgNum, pSubKey, &minVgCnt, &remainderVgCnt);
  MND_TMQ_RETURN_CHECK(processModifiedConsumers(pOutput, pHash, minVgCnt, remainderVgCnt));
  MND_TMQ_RETURN_CHECK(processNewConsumers(pOutput, pInput));
  MND_TMQ_RETURN_CHECK(assignVgroups(pOutput, pHash, minVgCnt));
  MND_TMQ_RETURN_CHECK(processSubOffsetRows(pMnode, pInput, pOutput));
  printRebalanceLog(pOutput);

END:
  // Cleanup lives on the shared exit so failed steps do not leak the hash.
  if (pHash != NULL) {
    taosHashCleanup(pHash);
  }
  return code;
}
658

659
// Append one consumer commit log of the given update type to the transaction
// for every consumer id in consumers.
//
// type    consumer update type passed to tNewSMqConsumerObj().
// cgroup  consumer group name.
// topic   topic name, may be NULL (not validated here).
//
// Returns 0 on success or the first error. The temporary consumer object is
// destroyed after each iteration and the pointer cleared, so a failure in a
// later iteration cannot destroy an already released object again.
static int32_t presistConsumerByType(STrans *pTrans, SArray *consumers, int8_t type, char *cgroup, char *topic) {
  if (pTrans == NULL || consumers == NULL || cgroup == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  int32_t         code = 0;
  SMqConsumerObj *pConsumerNew = NULL;
  int32_t         consumerNum = taosArrayGetSize(consumers);
  for (int32_t i = 0; i < consumerNum; i++) {
    int64_t* consumerId = (int64_t *)taosArrayGet(consumers, i);
    MND_TMQ_NULL_CHECK(consumerId);
    MND_TMQ_RETURN_CHECK(tNewSMqConsumerObj(*consumerId, cgroup, type, topic, NULL, &pConsumerNew));
    MND_TMQ_RETURN_CHECK(mndSetConsumerCommitLogs(pTrans, pConsumerNew));
    tDeleteSMqConsumerObj(pConsumerNew);
    // Clear immediately: if the next tNewSMqConsumerObj() fails without
    // writing its out-parameter, END must not see the stale pointer.
    pConsumerNew = NULL;
  }

END:
  tDeleteSMqConsumerObj(pConsumerNew);
  return code;
}
679

680
// Append consumer commit logs for all three consumer lists of a rebalance
// result, in this order: modified consumers (CONSUMER_UPDATE_REB, no topic),
// new consumers (CONSUMER_ADD_REB) and removed consumers
// (CONSUMER_REMOVE_REB). Stops at the first failing list.
static int32_t mndPresistConsumer(STrans *pTrans, const SMqRebOutputObj *pOutput, char *cgroup, char *topic) {
  if (pTrans == NULL || pOutput == NULL || cgroup == NULL || topic == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t code = 0;
  const struct {
    SArray *consumers;
    int8_t  type;
    char   *topic;
  } steps[] = {
      {pOutput->modifyConsumers, CONSUMER_UPDATE_REB, NULL},
      {pOutput->newConsumers, CONSUMER_ADD_REB, topic},
      {pOutput->removedConsumers, CONSUMER_REMOVE_REB, topic},
  };

  for (size_t s = 0; s < sizeof(steps) / sizeof(steps[0]); s++) {
    MND_TMQ_RETURN_CHECK(presistConsumerByType(pTrans, steps[s].consumers, steps[s].type, cgroup, steps[s].topic));
  }

END:
  return code;
}
691

692
// Persist a computed rebalance result through a "tmq-reb" transaction.
//
// The transaction carries, in order: one redo action per moved vgroup, the
// subscription commit log, the consumer commit logs, and the rebalance
// start/stop callbacks; it is then prepared for execution. The parsed sub
// plan (if the subscription has a non-empty qmsg) and the transaction handle
// are released on every path.
static int32_t mndPersistRebResult(SMnode *pMnode, SRpcMsg *pMsg, const SMqRebOutputObj *pOutput) {
  if (pMnode == NULL || pMsg == NULL || pOutput == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t          code = 0;
  STrans          *pTrans = NULL;
  struct SSubplan *pPlan = NULL;
  char             topic[TSDB_TOPIC_FNAME_LEN] = {0};
  char             cgroup[TSDB_CGROUP_LEN] = {0};

  // An empty qmsg means there is no plan to parse.
  if (pOutput->pSub->qmsg[0] != '\0') {
    MND_TMQ_RETURN_CHECK(qStringToSubplan(pOutput->pSub->qmsg, &pPlan));
  }

  mndSplitSubscribeKey(pOutput->pSub->key, topic, cgroup, true);

  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_DB_INSIDE, pMsg, "tmq-reb");
  if (pTrans == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    goto END;
  }

  mndTransSetDbName(pTrans, pOutput->pSub->dbName, pOutput->pSub->key);
  MND_TMQ_RETURN_CHECK(mndTransCheckConflict(pMnode, pTrans));

  // 1. redo actions: one subscribe-change request per moved vgroup
  int32_t movedCnt = taosArrayGetSize(pOutput->rebVgs);
  for (int32_t idx = 0; idx < movedCnt; idx++) {
    SMqRebOutputVg *pMoved = taosArrayGet(pOutput->rebVgs, idx);
    MND_TMQ_NULL_CHECK(pMoved);
    MND_TMQ_RETURN_CHECK(mndPersistSubChangeVgReq(pMnode, pTrans, pOutput->pSub, pMoved, pPlan));
  }

  // 2. commit log: the subscription with its new vgroup assignment
  MND_TMQ_RETURN_CHECK(mndSetSubCommitLogs(pTrans, pOutput->pSub));

  // 3. commit logs: the affected consumers
  MND_TMQ_RETURN_CHECK(mndPresistConsumer(pTrans, pOutput, cgroup, topic));

  // 4. rebalance start/stop callbacks
  mndTransSetCb(pTrans, TRANS_START_FUNC_MQ_REB, TRANS_STOP_FUNC_MQ_REB, NULL, 0);

  // 5. hand the transaction over for execution
  MND_TMQ_RETURN_CHECK(mndTransPrepare(pMnode, pTrans));

END:
  nodesDestroyNode((SNode *)pPlan);
  mndTransDrop(pTrans);
  TAOS_RETURN(code);
}
744

745
static void freeRebalanceItem(void *param) {
1,292✔
746
  if (param == NULL) return;
1,292!
747
  SMqRebInfo *pInfo = param;
1,292✔
748
  taosArrayDestroy(pInfo->newConsumers);
1,292✔
749
  taosArrayDestroy(pInfo->removedConsumers);
1,292✔
750
}
751

752
// type = 0 remove  type = 1 add
753
// For every topic in topicList, look up (or create) the rebalance entry keyed
// by "<group><TMQ_SEPARATOR><topic>" and record consumerId in it.
//   type == 0: the consumer is appended to the entry's removedConsumers.
//   type == 1: the consumer is appended to the entry's newConsumers.
//   any other type: the entry is still looked up/created, nothing is appended.
// Returns 0 on success, TSDB_CODE_INVALID_PARA when rebSubHash, topicList or
// group is NULL, otherwise the code set by the failing check.
static int32_t buildRebInfo(SHashObj *rebSubHash, SArray *topicList, int8_t type, char *group, int64_t consumerId) {
  if (rebSubHash == NULL || topicList == NULL || group == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t code = 0;
  int32_t numOfTopics = taosArrayGetSize(topicList);
  for (int32_t idx = 0; idx < numOfTopics; idx++) {
    char *topicName = taosArrayGetP(topicList, idx);
    MND_TMQ_NULL_CHECK(topicName);

    char subKey[TSDB_SUBSCRIBE_KEY_LEN] = {0};
    (void)snprintf(subKey, TSDB_SUBSCRIBE_KEY_LEN, "%s%s%s", group, TMQ_SEPARATOR, topicName);

    SMqRebInfo *pRebInfo = NULL;
    MND_TMQ_RETURN_CHECK(mndGetOrCreateRebSub(rebSubHash, subKey, &pRebInfo));

    if (type == 0) {
      MND_TMQ_NULL_CHECK(taosArrayPush(pRebInfo->removedConsumers, &consumerId));
    } else if (type == 1) {
      MND_TMQ_NULL_CHECK(taosArrayPush(pRebInfo->newConsumers, &consumerId));
    }
  }

END:
  return code;
}
775

776
// For each topic the consumer currently subscribes to, walk the vgroups
// assigned to this consumer in the matching subscription. When a vgroup can no
// longer be acquired, make sure a rebalance entry exists for the subscription
// key so that a rebalance is triggered. Topics or subscriptions that cannot be
// resolved are skipped; nothing is reported to the caller.
static void checkForVgroupSplit(SMnode *pMnode, SMqConsumerObj *pConsumer, SHashObj *rebSubHash) {
  if (pMnode == NULL || pConsumer == NULL || rebSubHash == NULL) {
    return;
  }

  int32_t numOfTopics = taosArrayGetSize(pConsumer->currentTopics);
  for (int32_t t = 0; t < numOfTopics; t++) {
    char *topicName = taosArrayGetP(pConsumer->currentTopics, t);
    if (topicName == NULL) {
      continue;
    }

    char subKey[TSDB_SUBSCRIBE_KEY_LEN] = {0};
    (void)snprintf(subKey, TSDB_SUBSCRIBE_KEY_LEN, "%s%s%s", pConsumer->cgroup, TMQ_SEPARATOR, topicName);

    SMqSubscribeObj *pSub = NULL;
    int32_t          code = mndAcquireSubscribeByKey(pMnode, subKey, &pSub);
    if (code != 0) {
      continue;
    }

    taosRLockLatch(&pSub->lock);

    // Only the vgroups assigned to this consumer for this topic are inspected.
    SMqConsumerEp *pEp = taosHashGet(pSub->consumerHash, &pConsumer->consumerId, sizeof(int64_t));
    if (pEp != NULL) {
      int32_t numOfVgs = taosArrayGetSize(pEp->vgs);
      for (int32_t v = 0; v < numOfVgs; v++) {
        SMqVgEp *pVgEp = taosArrayGetP(pEp->vgs, v);
        if (pVgEp == NULL) {
          continue;
        }

        SVgObj *pVgroup = mndAcquireVgroup(pMnode, pVgEp->vgId);
        if (pVgroup == NULL) {
          code = mndGetOrCreateRebSub(rebSubHash, subKey, NULL);
          if (code == 0) {
            mInfo("vnode splitted, vgId:%d rebalance will be triggered", pVgEp->vgId);
          } else {
            mError("failed to mndGetOrCreateRebSub vgroup:%d, error:%s", pVgEp->vgId, tstrerror(code));
          }
        }
        mndReleaseVgroup(pMnode, pVgroup);
      }
    }

    taosRUnLockLatch(&pSub->lock);
    mndReleaseSubscribe(pMnode, pSub);
  }
}
823

824
// Iterates over all consumers in the sdb and collects, into rebSubHash, the
// subscriptions that need a rebalance.
//
// Each visit increments the consumer's hbStatus and pollStatus counters, then:
//   - READY with no current topics: a TDMT_MND_TMQ_LOST_CONSUMER_CLEAR message
//     is sent for the consumer.
//   - READY and either counter, scaled by tsMqRebalanceInterval * 1000, has
//     reached sessionTimeoutMs / maxPollIntervalMs: the consumer is recorded
//     as removed from all of its current topics.
//   - READY otherwise: its vgroups are checked via checkForVgroupSplit().
//   - REBALANCE: rebNewTopics / rebRemovedTopics are recorded as add / remove.
//   - any other status: TDMT_MND_TMQ_LOST_CONSUMER_CLEAR is sent.
//
// Returns 0 on success, TSDB_CODE_INVALID_PARA for NULL arguments, or the
// first non-zero code returned by a helper. On failure the scan stops; the
// consumer latch is always unlocked, the consumer reference released and the
// sdb fetch iterator cancelled before returning.
static int32_t mndCheckConsumer(SRpcMsg *pMsg, SHashObj *rebSubHash) {
  if (pMsg == NULL || rebSubHash == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  SMnode         *pMnode = pMsg->info.node;
  SSdb           *pSdb = pMnode->pSdb;
  SMqConsumerObj *pConsumer = NULL;
  void           *pIter = NULL;
  int32_t         code = 0;

  // iterate all consumers, find all modification
  while (1) {
    pIter = sdbFetch(pSdb, SDB_CONSUMER, pIter, (void **)&pConsumer);
    if (pIter == NULL) {
      break;
    }

    int32_t hbStatus = atomic_add_fetch_32(&pConsumer->hbStatus, 1);
    int32_t pollStatus = atomic_add_fetch_32(&pConsumer->pollStatus, 1);
    int32_t status = atomic_load_32(&pConsumer->status);

    mDebug("[rebalance] check for consumer:0x%" PRIx64 " status:%d(%s), sub-time:%" PRId64 ", createTime:%" PRId64
           ", hbstatus:%d, pollStatus:%d",
           pConsumer->consumerId, status, mndConsumerStatusName(status), pConsumer->subscribeTime,
           pConsumer->createTime, hbStatus, pollStatus);

    if (status == MQ_CONSUMER_STATUS_READY) {
      if (taosArrayGetSize(pConsumer->currentTopics) == 0) {  // unsubscribe or close
        code = mndSendConsumerMsg(pMnode, pConsumer->consumerId, TDMT_MND_TMQ_LOST_CONSUMER_CLEAR, &pMsg->info);
      } else if (hbStatus * tsMqRebalanceInterval * 1000 >= pConsumer->sessionTimeoutMs ||
                 pollStatus * tsMqRebalanceInterval * 1000 >= pConsumer->maxPollIntervalMs) {
        // The latch is released unconditionally, before the result is examined.
        taosRLockLatch(&pConsumer->lock);
        code = buildRebInfo(rebSubHash, pConsumer->currentTopics, 0, pConsumer->cgroup, pConsumer->consumerId);
        taosRUnLockLatch(&pConsumer->lock);
      } else {
        checkForVgroupSplit(pMnode, pConsumer, rebSubHash);
      }
    } else if (status == MQ_CONSUMER_STATUS_REBALANCE) {
      taosRLockLatch(&pConsumer->lock);
      code = buildRebInfo(rebSubHash, pConsumer->rebNewTopics, 1, pConsumer->cgroup, pConsumer->consumerId);
      if (code == 0) {
        code = buildRebInfo(rebSubHash, pConsumer->rebRemovedTopics, 0, pConsumer->cgroup, pConsumer->consumerId);
      }
      taosRUnLockLatch(&pConsumer->lock);
    } else {
      code = mndSendConsumerMsg(pMnode, pConsumer->consumerId, TDMT_MND_TMQ_LOST_CONSUMER_CLEAR, &pMsg->info);
    }

    mndReleaseConsumer(pMnode, pConsumer);

    if (code != 0) {
      // Leaving the loop before the iterator is exhausted: cancel the fetch.
      sdbCancelFetch(pSdb, pIter);
      break;
    }
  }

  return code;
}
875

876
bool mndRebTryStart() {
28,717✔
877
  int32_t old = atomic_val_compare_exchange_32(&mqRebInExecCnt, 0, 1);
28,717✔
878
  if (old > 0) mInfo("[rebalance] counter old val:%d", old) return old == 0;
28,717!
879
}
880

881
void mndRebCntInc() {
1,015✔
882
  int32_t val = atomic_add_fetch_32(&mqRebInExecCnt, 1);
1,015✔
883
  if (val > 0) mInfo("[rebalance] cnt inc, value:%d", val)
1,015!
884
}
1,015✔
885

886
void mndRebCntDec() {
29,730✔
887
  int32_t val = atomic_sub_fetch_32(&mqRebInExecCnt, 1);
29,730✔
888
  if (val > 0) mInfo("[rebalance] cnt sub, value:%d", val)
29,730!
889
}
29,730✔
890

891
// Releases everything owned by a rebalance output: the four arrays and the
// subscribe object (its contents first, then the object itself). The fields
// are not reset afterwards. A NULL rebOutput is ignored.
static void clearRebOutput(SMqRebOutputObj *rebOutput) {
  if (rebOutput != NULL) {
    taosArrayDestroy(rebOutput->newConsumers);
    taosArrayDestroy(rebOutput->modifyConsumers);
    taosArrayDestroy(rebOutput->removedConsumers);
    taosArrayDestroy(rebOutput->rebVgs);

    tDeleteSubscribeObj(rebOutput->pSub);
    taosMemoryFree(rebOutput->pSub);
  }
}
902

903
// Allocates the four (initially empty) arrays of a rebalance output:
// newConsumers, removedConsumers and modifyConsumers hold int64_t ids, rebVgs
// holds SMqRebOutputVg items.
// Returns 0 on success and TSDB_CODE_INVALID_PARA for a NULL argument. When an
// allocation fails, clearRebOutput() is run on the object and the code set by
// the failing check is returned.
static int32_t initRebOutput(SMqRebOutputObj *rebOutput) {
  if (rebOutput == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t code = 0;

  rebOutput->newConsumers = taosArrayInit(0, sizeof(int64_t));
  MND_TMQ_NULL_CHECK(rebOutput->newConsumers);

  rebOutput->removedConsumers = taosArrayInit(0, sizeof(int64_t));
  MND_TMQ_NULL_CHECK(rebOutput->removedConsumers);

  rebOutput->modifyConsumers = taosArrayInit(0, sizeof(int64_t));
  MND_TMQ_NULL_CHECK(rebOutput->modifyConsumers);

  rebOutput->rebVgs = taosArrayInit(0, sizeof(SMqRebOutputVg));
  MND_TMQ_NULL_CHECK(rebOutput->rebVgs);

  return code;

END:
  // Partial initialisation: free whatever has been allocated so far.
  clearRebOutput(rebOutput);
  return code;
}
922

923
// This function only works when there are dirty consumers
924
// Drops "dirty" consumers from a subscription: every entry of
// pSub->consumerHash whose consumer can no longer be acquired from the sdb has
// its vgroups appended to pSub->unassignedVgs, its vgs array destroyed, and
// its entry removed from the hash.
// Returns 0 on success, TSDB_CODE_INVALID_PARA for NULL arguments, or the code
// of the failing step. When the walk stops early the hash iterator is
// cancelled before returning.
static int32_t checkConsumer(SMnode *pMnode, SMqSubscribeObj *pSub) {
  if (pMnode == NULL || pSub == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  int32_t code = 0;
  void   *pIter = NULL;
  while (1) {
    pIter = taosHashIterate(pSub->consumerHash, pIter);
    if (pIter == NULL) {
      break;
    }

    SMqConsumerEp  *pConsumerEp = (SMqConsumerEp *)pIter;
    SMqConsumerObj *pConsumer = NULL;
    code = mndAcquireConsumer(pMnode, pConsumerEp->consumerId, &pConsumer);
    if (code == 0) {
      // Consumer still exists; only the reference taken above is dropped.
      mndReleaseConsumer(pMnode, pConsumer);
      continue;
    }
    mError("consumer:0x%" PRIx64 " not exists in sdb for exception", pConsumerEp->consumerId);
    MND_TMQ_NULL_CHECK(taosArrayAddAll(pSub->unassignedVgs, pConsumerEp->vgs));

    taosArrayDestroy(pConsumerEp->vgs);
    MND_TMQ_RETURN_CHECK(taosHashRemove(pSub->consumerHash, &pConsumerEp->consumerId, sizeof(int64_t)));
  }

END:
  // pIter is NULL after a complete walk and non-NULL only on an early exit.
  taosHashCancelIterate(pSub->consumerHash, pIter);
  return code;
}
952

953
// Prepares rebOutput->pSub, the working copy of the subscription that the
// rebalance will modify, for the key in rebInput->pRebInfo.
//   - Subscription not found: a new one is created from the topic named in
//     the key, its dbName is copied from the topic, and
//     rebInput->oldConsumerNum is set to 0.
//   - Subscription found: it is cloned under its read latch, the clone is
//     passed through checkConsumer(), and rebInput->oldConsumerNum is set to
//     the size of the clone's consumer hash.
// Returns 0 on success, TSDB_CODE_INVALID_PARA for NULL arguments, or the code
// of the failing step. The acquired topic / subscription reference is released
// on every path.
static int32_t buildRebOutput(SMnode *pMnode, SMqRebInputObj *rebInput, SMqRebOutputObj *rebOutput) {
  if (pMnode == NULL || rebInput == NULL || rebOutput == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  const char      *key = rebInput->pRebInfo->key;
  SMqSubscribeObj *pSub = NULL;
  int32_t          code = mndAcquireSubscribeByKey(pMnode, key, &pSub);

  if (code != 0) {
    // split sub key and extract topic
    char topic[TSDB_TOPIC_FNAME_LEN] = {0};
    char cgroup[TSDB_CGROUP_LEN] = {0};
    mndSplitSubscribeKey(key, topic, cgroup, true);

    SMqTopicObj *pTopic = NULL;
    code = mndAcquireTopic(pMnode, topic, &pTopic);
    if (code != 0) {
      return code;
    }
    taosRLockLatch(&pTopic->lock);

    rebInput->oldConsumerNum = 0;
    code = mndCreateSubscription(pMnode, pTopic, key, &rebOutput->pSub);
    if (code != 0) {
      mError("[rebalance] mq rebalance %s failed create sub since %s, ignore", key, tstrerror(code));
      taosRUnLockLatch(&pTopic->lock);
      mndReleaseTopic(pMnode, pTopic);
      return code;
    }

    (void)memcpy(rebOutput->pSub->dbName, pTopic->db, TSDB_DB_FNAME_LEN);
    taosRUnLockLatch(&pTopic->lock);
    mndReleaseTopic(pMnode, pTopic);

    mInfo("[rebalance] sub topic:%s has no consumers sub yet", key);
    return code;
  }

  taosRLockLatch(&pSub->lock);
  code = tCloneSubscribeObj(pSub, &rebOutput->pSub);
  if (code == 0) {
    code = checkConsumer(pMnode, rebOutput->pSub);
  }
  if (code == 0) {
    rebInput->oldConsumerNum = taosHashGetSize(rebOutput->pSub->consumerHash);
  }
  taosRUnLockLatch(&pSub->lock);

  if (code == 0) {
    mInfo("[rebalance] sub topic:%s has %d consumers sub till now", key, rebInput->oldConsumerNum);
  }

  // Release the reference on failure as well as on success.
  mndReleaseSubscribe(pMnode, pSub);
  return code;
}
1006

1007
// Handler for the rebalance request.
// If another rebalance is already running (mndRebTryStart() fails) it returns
// 0 without doing anything. Otherwise it collects the subscriptions that need
// rebalancing via mndCheckConsumer() and, for each of them, builds the
// rebalance output, runs the rebalance and persists the result; a failure in
// one subscription is logged and the loop moves on to the next one.
// The hash is cleaned up and the in-execution counter decremented on exit.
// Returns TSDB_CODE_INVALID_PARA for a NULL message, otherwise the last code
// produced (via TAOS_RETURN).
static int32_t mndProcessRebalanceReq(SRpcMsg *pMsg) {
  if (pMsg == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int     code = 0;
  void   *pIter = NULL;
  SMnode *pMnode = pMsg->info.node;

  mDebug("[rebalance] start to process mq timer");
  if (!mndRebTryStart()) {
    mInfo("[rebalance] mq rebalance already in progress, do nothing");
    return code;
  }

  SHashObj *rebSubHash = taosHashInit(64, MurmurHash3_32, true, HASH_NO_LOCK);
  MND_TMQ_NULL_CHECK(rebSubHash);

  taosHashSetFreeFp(rebSubHash, freeRebalanceItem);

  MND_TMQ_RETURN_CHECK(mndCheckConsumer(pMsg, rebSubHash));
  if (taosHashGetSize(rebSubHash) > 0) {
    mInfo("[rebalance] mq rebalance start, total required re-balanced trans:%d", taosHashGetSize(rebSubHash));
  }

  for (;;) {
    pIter = taosHashIterate(rebSubHash, pIter);
    if (pIter == NULL) {
      break;
    }

    SMqRebInputObj  rebInput = {0};
    SMqRebOutputObj rebOutput = {0};
    MND_TMQ_RETURN_CHECK(initRebOutput(&rebOutput));
    rebInput.pRebInfo = (SMqRebInfo *)pIter;

    // Three stages; each one runs only if the previous one succeeded.
    code = buildRebOutput(pMnode, &rebInput, &rebOutput);
    if (code != 0) {
      mError("mq rebalance buildRebOutput, msg:%s", tstrerror(code));
    } else if ((code = mndDoRebalance(pMnode, &rebInput, &rebOutput)) != 0) {
      mError("mq rebalance do rebalance error, msg:%s", tstrerror(code));
    } else if ((code = mndPersistRebResult(pMnode, pMsg, &rebOutput)) != 0) {
      mError("mq rebalance persist output error, possibly vnode splitted or dropped,msg:%s", tstrerror(code));
    }

    clearRebOutput(&rebOutput);
  }

  if (taosHashGetSize(rebSubHash) > 0) {
    mInfo("[rebalance] mq rebalance completed successfully, wait trans finish");
  }

END:
  taosHashCancelIterate(rebSubHash, pIter);
  taosHashCleanup(rebSubHash);
  mndRebCntDec();

  TAOS_RETURN(code);
}
1073

1074
// Appends one TDMT_VND_TMQ_DELETE_SUB redo action to pTrans for every vgroup
// that belongs to the subscription's database (pSub->dbUid). Each request
// carries the vgroup id, consumerId -1 and the subscription key;
// TSDB_CODE_MND_VGROUP_NOT_EXIST is set as the acceptable response code.
// Returns 0 on success, TSDB_CODE_INVALID_PARA for NULL arguments, or the code
// of the failing step. On failure the unqueued request is freed, and the
// vgroup reference is released exactly once.
static int32_t sendDeleteSubToVnode(SMnode *pMnode, SMqSubscribeObj *pSub, STrans *pTrans) {
  if (pMnode == NULL || pSub == NULL || pTrans == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  void   *pIter = NULL;
  SVgObj *pVgObj = NULL;
  int32_t code = 0;
  while (1) {
    pIter = sdbFetch(pMnode->pSdb, SDB_VGROUP, pIter, (void **)&pVgObj);
    if (pIter == NULL) {
      break;
    }

    if (!mndVgroupInDb(pVgObj, pSub->dbUid)) {
      sdbRelease(pMnode->pSdb, pVgObj);
      continue;
    }
    SMqVDeleteReq *pReq = taosMemoryCalloc(1, sizeof(SMqVDeleteReq));
    MND_TMQ_NULL_CHECK(pReq);
    pReq->head.vgId = htonl(pVgObj->vgId);
    pReq->vgId = pVgObj->vgId;
    pReq->consumerId = -1;
    (void)memcpy(pReq->subKey, pSub->key, TSDB_SUBSCRIBE_KEY_LEN);

    STransAction action = {0};
    action.epSet = mndGetVgroupEpset(pMnode, pVgObj);
    action.pCont = pReq;
    action.contLen = sizeof(SMqVDeleteReq);
    action.msgType = TDMT_VND_TMQ_DELETE_SUB;
    action.acceptableCode = TSDB_CODE_MND_VGROUP_NOT_EXIST;

    sdbRelease(pMnode->pSdb, pVgObj);
    pVgObj = NULL;  // already released; keep END from releasing it again

    code = mndTransAppendRedoAction(pTrans, &action);
    if (code != 0) {
      // The action was not queued, so the request buffer is still ours.
      taosMemoryFree(pReq);
      goto END;
    }
  }

END:
  sdbRelease(pMnode->pSdb, pVgObj);
  sdbCancelFetch(pMnode->pSdb, pIter);
  return code;
}
1114

1115
// Scans all consumers and fails with TSDB_CODE_MND_CGROUP_USED as soon as one
// consumer of the given group has `topic` among its assignedTopics.
// Returns 0 when no such consumer exists and TSDB_CODE_INVALID_PARA when any
// argument is NULL. pTrans is only NULL-checked here.
static int32_t mndCheckConsumerByGroup(SMnode *pMnode, STrans *pTrans, char *cgroup, char *topic) {
  if (pMnode == NULL || pTrans == NULL || cgroup == NULL || topic == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int             code = 0;
  void           *pIter = NULL;
  SMqConsumerObj *pConsumer = NULL;

  for (;;) {
    pIter = sdbFetch(pMnode->pSdb, SDB_CONSUMER, pIter, (void **)&pConsumer);
    if (pIter == NULL) {
      break;
    }

    // Consumers of other groups are skipped without looking at their topics.
    if (strcmp(cgroup, pConsumer->cgroup) == 0 && checkTopic(pConsumer->assignedTopics, topic)) {
      mError("topic:%s, failed to drop since subscribed by consumer:0x%" PRIx64 ", in consumer group %s",
             topic, pConsumer->consumerId, pConsumer->cgroup);
      code = TSDB_CODE_MND_CGROUP_USED;
      goto END;
    }

    sdbRelease(pMnode->pSdb, pConsumer);
  }

END:
  sdbRelease(pMnode->pSdb, pConsumer);
  sdbCancelFetch(pMnode->pSdb, pIter);
  return code;
}
1149

1150
// Handler for the "drop consumer group" request.
// The subscription for "<cgroup><TMQ_SEPARATOR><topic>" must exist (unless
// igNotExists is set, in which case 0 is returned) and must have no consumers.
// A "drop-cgroup" transaction is then built that sends the delete-sub request
// to the vnodes, checks that no consumer of the group is still assigned the
// topic, appends the drop commit log for the subscription and is prepared.
// Returns TSDB_CODE_ACTION_IN_PROGRESS once the transaction has been prepared,
// TSDB_CODE_INVALID_PARA for a NULL message, or the code of the failing step.
static int32_t mndProcessDropCgroupReq(SRpcMsg *pMsg) {
  if (pMsg == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  SMnode          *pMnode = pMsg->info.node;
  SMDropCgroupReq  dropReq = {0};
  STrans          *pTrans = NULL;
  int32_t          code = 0;
  SMqSubscribeObj *pSub = NULL;

  // Nothing has been acquired or locked yet, so a bad request must return
  // directly rather than go through END, which unlocks and releases pSub.
  code = tDeserializeSMDropCgroupReq(pMsg->pCont, pMsg->contLen, &dropReq);
  if (code != 0) {
    mError("failed to deserialize drop cgroup request since %s", tstrerror(code));
    TAOS_RETURN(code);
  }

  char key[TSDB_SUBSCRIBE_KEY_LEN] = {0};
  (void)snprintf(key, TSDB_SUBSCRIBE_KEY_LEN, "%s%s%s", dropReq.cgroup, TMQ_SEPARATOR, dropReq.topic);
  code = mndAcquireSubscribeByKey(pMnode, key, &pSub);
  if (code != 0) {
    if (dropReq.igNotExists) {
      mInfo("cgroup:%s on topic:%s, not exist, ignore not exist is set", dropReq.cgroup, dropReq.topic);
      return 0;
    } else {
      code = TSDB_CODE_MND_SUBSCRIBE_NOT_EXIST;
      mError("topic:%s, cgroup:%s, failed to drop since %s", dropReq.topic, dropReq.cgroup, tstrerror(code));
      return code;
    }
  }

  taosWLockLatch(&pSub->lock);
  if (taosHashGetSize(pSub->consumerHash) != 0) {
    code = TSDB_CODE_MND_CGROUP_USED;
    mError("cgroup:%s on topic:%s, failed to drop since %s", dropReq.cgroup, dropReq.topic, tstrerror(code));
    goto END;
  }

  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_DB, pMsg, "drop-cgroup");
  MND_TMQ_NULL_CHECK(pTrans);
  mInfo("trans:%d, used to drop cgroup:%s on topic %s", pTrans->id, dropReq.cgroup, dropReq.topic);
  mndTransSetDbName(pTrans, pSub->dbName, NULL);
  MND_TMQ_RETURN_CHECK(mndTransCheckConflict(pMnode, pTrans));
  MND_TMQ_RETURN_CHECK(sendDeleteSubToVnode(pMnode, pSub, pTrans));
  MND_TMQ_RETURN_CHECK(mndCheckConsumerByGroup(pMnode, pTrans, dropReq.cgroup, dropReq.topic));
  MND_TMQ_RETURN_CHECK(mndSetDropSubCommitLogs(pMnode, pTrans, pSub));
  MND_TMQ_RETURN_CHECK(mndTransPrepare(pMnode, pTrans));

END:
  taosWUnLockLatch(&pSub->lock);
  mndReleaseSubscribe(pMnode, pSub);
  mndTransDrop(pTrans);

  if (code != 0) {
    mError("cgroup %s on topic:%s, failed to drop", dropReq.cgroup, dropReq.topic);
    TAOS_RETURN(code);
  }
  TAOS_RETURN(TSDB_CODE_ACTION_IN_PROGRESS);
}
1203

1204
// Cleanup hook for the subscribe module. The body is empty: nothing is
// released here and pMnode is not used.
void mndCleanupSubscribe(SMnode *pMnode) {}
1,777✔
1205

1206
// Serialises a subscribe object into a newly allocated sdb raw record.
// Record layout: int32 payload length, the encoded payload, then
// MND_SUBSCRIBE_RESERVE_SIZE reserved bytes.
// Returns the raw record on success. Returns NULL when pSub is NULL, or on
// failure with terrno left non-zero (it is preset to TSDB_CODE_OUT_OF_MEMORY
// and only cleared on success); any partially built raw is freed.
static SSdbRaw *mndSubActionEncode(SMqSubscribeObj *pSub) {
  if (pSub == NULL) {
    return NULL;
  }
  int32_t code = 0;
  int32_t lino = 0;
  terrno = TSDB_CODE_OUT_OF_MEMORY;
  void *buf = NULL;
  // Initialised up front: the first goto below happens before the raw is
  // allocated, and the error path both prints and frees this pointer.
  SSdbRaw *pRaw = NULL;

  // First pass with a NULL buffer only computes the encoded length.
  int32_t tlen = tEncodeSubscribeObj(NULL, pSub);
  if (tlen <= 0) goto SUB_ENCODE_OVER;
  int32_t size = sizeof(int32_t) + tlen + MND_SUBSCRIBE_RESERVE_SIZE;

  pRaw = sdbAllocRaw(SDB_SUBSCRIBE, MND_SUBSCRIBE_VER_NUMBER, size);
  if (pRaw == NULL) goto SUB_ENCODE_OVER;

  buf = taosMemoryMalloc(tlen);
  if (buf == NULL) goto SUB_ENCODE_OVER;

  void *abuf = buf;
  if (tEncodeSubscribeObj(&abuf, pSub) < 0) {
    goto SUB_ENCODE_OVER;
  }

  int32_t dataPos = 0;
  SDB_SET_INT32(pRaw, dataPos, tlen, SUB_ENCODE_OVER);
  SDB_SET_BINARY(pRaw, dataPos, buf, tlen, SUB_ENCODE_OVER);
  SDB_SET_RESERVE(pRaw, dataPos, MND_SUBSCRIBE_RESERVE_SIZE, SUB_ENCODE_OVER);
  SDB_SET_DATALEN(pRaw, dataPos, SUB_ENCODE_OVER);

  terrno = TSDB_CODE_SUCCESS;

SUB_ENCODE_OVER:
  taosMemoryFreeClear(buf);
  if (terrno != TSDB_CODE_SUCCESS) {
    mError("subscribe:%s, failed to encode to raw:%p since %s", pSub->key, pRaw, terrstr());
    sdbFreeRaw(pRaw);
    return NULL;
  }

  mTrace("subscribe:%s, encode to raw:%p, row:%p", pSub->key, pRaw, pSub);
  return pRaw;
}
1248

1249
// Rebuilds a subscribe object from an sdb raw record.
// Records whose soft version is outside [1, MND_SUBSCRIBE_VER_NUMBER] are
// rejected with TSDB_CODE_SDB_INVALID_DATA_VER. After decoding, the endpoint
// set of every vgroup (unassigned and per consumer) is passed to
// tmsgUpdateDnodeEpSet().
// Returns the new row on success. Returns NULL when pRaw is NULL, or on
// failure with terrno left non-zero; the row allocated here is freed.
static SSdbRow *mndSubActionDecode(SSdbRaw *pRaw) {
  if (pRaw == NULL) {
    return NULL;
  }

  int32_t          code = 0;
  int32_t          lino = 0;
  SSdbRow         *pRow = NULL;
  SMqSubscribeObj *pSub = NULL;
  void            *buf = NULL;
  int8_t           sver = 0;

  // Assume failure until the whole record has been decoded.
  terrno = TSDB_CODE_OUT_OF_MEMORY;

  if (sdbGetRawSoftVer(pRaw, &sver) != 0) {
    goto SUB_DECODE_OVER;
  }

  if (sver < 1 || sver > MND_SUBSCRIBE_VER_NUMBER) {
    terrno = TSDB_CODE_SDB_INVALID_DATA_VER;
    goto SUB_DECODE_OVER;
  }

  pRow = sdbAllocRow(sizeof(SMqSubscribeObj));
  if (pRow == NULL) {
    goto SUB_DECODE_OVER;
  }

  pSub = sdbGetRowObj(pRow);
  if (pSub == NULL) {
    goto SUB_DECODE_OVER;
  }

  int32_t dataPos = 0;
  int32_t tlen;
  SDB_GET_INT32(pRaw, dataPos, &tlen, SUB_DECODE_OVER);
  buf = taosMemoryMalloc(tlen);
  if (buf == NULL) {
    goto SUB_DECODE_OVER;
  }
  SDB_GET_BINARY(pRaw, dataPos, buf, tlen, SUB_DECODE_OVER);
  SDB_GET_RESERVE(pRaw, dataPos, MND_SUBSCRIBE_RESERVE_SIZE, SUB_DECODE_OVER);

  if (tDecodeSubscribeObj(buf, pSub, sver) == NULL) {
    goto SUB_DECODE_OVER;
  }

  // update epset saved in mnode
  if (pSub->unassignedVgs != NULL) {
    int32_t numOfVgs = (int32_t)taosArrayGetSize(pSub->unassignedVgs);
    for (int32_t v = 0; v < numOfVgs; ++v) {
      SMqVgEp *pVgEp = (SMqVgEp *)taosArrayGetP(pSub->unassignedVgs, v);
      tmsgUpdateDnodeEpSet(&pVgEp->epSet);
    }
  }
  if (pSub->consumerHash != NULL) {
    for (void *pIter = taosHashIterate(pSub->consumerHash, NULL); pIter != NULL;
         pIter = taosHashIterate(pSub->consumerHash, pIter)) {
      SMqConsumerEp *pEp = pIter;
      int32_t        numOfVgs = (int32_t)taosArrayGetSize(pEp->vgs);
      for (int32_t v = 0; v < numOfVgs; ++v) {
        SMqVgEp *pVgEp = (SMqVgEp *)taosArrayGetP(pEp->vgs, v);
        tmsgUpdateDnodeEpSet(&pVgEp->epSet);
      }
    }
  }

  terrno = TSDB_CODE_SUCCESS;

SUB_DECODE_OVER:
  taosMemoryFreeClear(buf);
  if (terrno != TSDB_CODE_SUCCESS) {
    mError("subscribe:%s, failed to decode from raw:%p since %s", pSub == NULL ? "null" : pSub->key, pRaw, terrstr());
    taosMemoryFreeClear(pRow);
    return NULL;
  }

  mTrace("subscribe:%s, decode from raw:%p, row:%p", pSub->key, pRaw, pSub);
  return pRow;
}
1320

1321
// sdb insert hook for subscribe objects: only emits a trace line and always
// returns 0. pSdb is not used.
static int32_t mndSubActionInsert(SSdb *pSdb, SMqSubscribeObj *pSub) {
  const char *subKey = (pSub != NULL) ? pSub->key : "null";
  mTrace("subscribe:%s, perform insert action", subKey);
  return 0;
}
1325

1326
// sdb delete hook for subscribe objects: traces the action, then hands the
// object to tDeleteSubscribeObj(). Always returns 0. pSdb is not used.
static int32_t mndSubActionDelete(SSdb *pSdb, SMqSubscribeObj *pSub) {
  const char *subKey = (pSub != NULL) ? pSub->key : "null";
  mTrace("subscribe:%s, perform delete action", subKey);
  tDeleteSubscribeObj(pSub);
  return 0;
}
1331

1332
// sdb update hook for subscribe objects: under the old object's write latch,
// swaps consumerHash, unassignedVgs and offsetRows between the old and the new
// object, so the old object ends up with the new contents and the new object
// holds the previous ones.
// Returns 0 on success, -1 when either object is NULL. pSdb is not used.
static int32_t mndSubActionUpdate(SSdb *pSdb, SMqSubscribeObj *pOldSub, SMqSubscribeObj *pNewSub) {
  if (pOldSub == NULL || pNewSub == NULL) {
    return -1;
  }
  mTrace("subscribe:%s, perform update action", pOldSub->key);

  taosWLockLatch(&pOldSub->lock);
  {
    SHashObj *prevConsumers = pOldSub->consumerHash;
    pOldSub->consumerHash = pNewSub->consumerHash;
    pNewSub->consumerHash = prevConsumers;
  }
  {
    SArray *prevUnassigned = pOldSub->unassignedVgs;
    pOldSub->unassignedVgs = pNewSub->unassignedVgs;
    pNewSub->unassignedVgs = prevUnassigned;
  }
  {
    SArray *prevOffsets = pOldSub->offsetRows;
    pOldSub->offsetRows = pNewSub->offsetRows;
    pNewSub->offsetRows = prevOffsets;
  }
  taosWUnLockLatch(&pOldSub->lock);

  return 0;
}
1352

1353
// Looks up the subscribe object stored under `key` and stores it in *pSub.
// Returns 0 when found, TSDB_CODE_MND_SUBSCRIBE_NOT_EXIST when the lookup
// yields NULL (*pSub is then NULL), and TSDB_CODE_INVALID_PARA when any
// argument is NULL. A successful acquire is paired with mndReleaseSubscribe()
// by the callers in this file.
int32_t mndAcquireSubscribeByKey(SMnode *pMnode, const char *key, SMqSubscribeObj** pSub) {
  if (pMnode == NULL || key == NULL || pSub == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  *pSub = sdbAcquire(pMnode->pSdb, SDB_SUBSCRIBE, key);
  return (*pSub != NULL) ? 0 : TSDB_CODE_MND_SUBSCRIBE_NOT_EXIST;
}
1364

1365
// Counts the subscriptions whose key resolves to the given topic name.
// Returns 0 when pMnode or topicName is NULL.
int32_t mndGetGroupNumByTopic(SMnode *pMnode, const char *topicName) {
  if (pMnode == NULL || topicName == NULL) {
    return 0;
  }

  SSdb            *pSdb = pMnode->pSdb;
  int32_t          matched = 0;
  void            *pIter = NULL;
  SMqSubscribeObj *pSub = NULL;

  while ((pIter = sdbFetch(pSdb, SDB_SUBSCRIBE, pIter, (void **)&pSub)) != NULL) {
    char topic[TSDB_TOPIC_FNAME_LEN] = {0};
    char cgroup[TSDB_CGROUP_LEN] = {0};
    mndSplitSubscribeKey(pSub->key, topic, cgroup, true);

    if (strcmp(topic, topicName) == 0) {
      matched++;
    }
    // Every fetched object is released, whether it matched or not.
    sdbRelease(pSdb, pSub);
  }

  return matched;
}
1390

1391
// Releases a subscribe object back to the sdb. Does nothing when either
// argument is NULL.
void mndReleaseSubscribe(SMnode *pMnode, SMqSubscribeObj *pSub) {
  if (pMnode != NULL && pSub != NULL) {
    sdbRelease(pMnode->pSdb, pSub);
  }
}
1396

1397
// Encodes pSub, appends the raw record to the transaction's commit log and
// marks it SDB_STATUS_DROPPED.
// Returns 0 on success, TSDB_CODE_INVALID_PARA for NULL arguments, or the code
// of the failing step. The raw record is freed here only when appending it to
// the transaction fails.
int32_t mndSetDropSubCommitLogs(SMnode *pMnode, STrans *pTrans, SMqSubscribeObj *pSub) {
  if (pMnode == NULL || pTrans == NULL || pSub == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t  code = 0;
  SSdbRaw *pRaw = mndSubActionEncode(pSub);
  MND_TMQ_NULL_CHECK(pRaw);

  code = mndTransAppendCommitlog(pTrans, pRaw);
  if (code == 0) {
    code = sdbSetRawStatus(pRaw, SDB_STATUS_DROPPED);
  } else {
    sdbFreeRaw(pRaw);
  }

END:
  return code;
}
1411

1412
// For every subscription on `topicName`, appends the vnode delete-sub actions
// and the drop commit log to pTrans.
// Fails with TSDB_CODE_MND_IN_REBALANCE as soon as a matching subscription
// still has entries in its consumer hash. Returns 0 on success,
// TSDB_CODE_INVALID_PARA for NULL arguments, or the code of the failing step
// (via TAOS_RETURN).
int32_t mndDropSubByTopic(SMnode *pMnode, STrans *pTrans, const char *topicName) {
  if (pMnode == NULL || pTrans == NULL || topicName == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  SSdb            *pSdb = pMnode->pSdb;
  int32_t          code = 0;
  void            *pIter = NULL;
  SMqSubscribeObj *pSub = NULL;

  for (;;) {
    // Drop the object fetched by the previous round (NULL on the first one).
    sdbRelease(pSdb, pSub);
    pIter = sdbFetch(pSdb, SDB_SUBSCRIBE, pIter, (void **)&pSub);
    if (pIter == NULL) {
      break;
    }

    char topic[TSDB_TOPIC_FNAME_LEN] = {0};
    char cgroup[TSDB_CGROUP_LEN] = {0};
    mndSplitSubscribeKey(pSub->key, topic, cgroup, true);

    if (strcmp(topic, topicName) == 0) {
      if (taosHashGetSize(pSub->consumerHash) != 0) {
        code = TSDB_CODE_MND_IN_REBALANCE;
        goto END;
      }

      // iter all vnode to delete handle
      MND_TMQ_RETURN_CHECK(sendDeleteSubToVnode(pMnode, pSub, pTrans));
      MND_TMQ_RETURN_CHECK(mndSetDropSubCommitLogs(pMnode, pTrans, pSub));
    }
  }

END:
  sdbRelease(pSdb, pSub);
  sdbCancelFetch(pSdb, pIter);

  TAOS_RETURN(code);
}
1446

1447
/*
 * Emit one result row per vgroup in `vgs` into the "show subscriptions" block.
 *
 * Columns are written in this order: topic, consumer group, vgroup id,
 * consumer id (hex string), user, fqdn, offset, rows. The last two columns
 * are NULL when `offsetRows` has no entry for the vgroup.
 *
 * @param pBlock      output data block
 * @param numOfRows   in/out row cursor; incremented once per emitted row
 * @param consumerId  consumer id; when it is -1 the consumer id column is NULL
 * @param user        consumer user name, or NULL to write a NULL column
 * @param fqdn        consumer fqdn, or NULL to write a NULL column
 * @param topic       topic name, passed to colDataSetVal as-is and read through
 *                    varDataVal for logging
 * @param cgroup      consumer group, handled the same way as `topic`
 * @param vgs         array of SMqVgEp pointers to report
 * @param offsetRows  array of OffsetRows searched by vgroup id
 * @return 0 on success, TSDB_CODE_INVALID_PARA on NULL required arguments,
 *         otherwise the error of the failing step
 */
static int32_t buildResult(SSDataBlock *pBlock, int32_t *numOfRows, int64_t consumerId, const char* user, const char* fqdn,
                           const char *topic, const char *cgroup, SArray *vgs, SArray *offsetRows) {
  if (pBlock == NULL || numOfRows == NULL || topic == NULL || cgroup == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t code = 0;
  int32_t vgCount = taosArrayGetSize(vgs);

  for (int32_t vgIdx = 0; vgIdx < vgCount; vgIdx++) {
    SMqVgEp *pVgEp = taosArrayGetP(vgs, vgIdx);
    MND_TMQ_NULL_CHECK(pVgEp);

    int32_t          colIdx = 0;
    SColumnInfoData *pCol = NULL;

    // topic
    pCol = taosArrayGet(pBlock->pDataBlock, colIdx++);
    MND_TMQ_NULL_CHECK(pCol);
    MND_TMQ_RETURN_CHECK(colDataSetVal(pCol, *numOfRows, (const char *)topic, false));

    // consumer group
    pCol = taosArrayGet(pBlock->pDataBlock, colIdx++);
    MND_TMQ_NULL_CHECK(pCol);
    MND_TMQ_RETURN_CHECK(colDataSetVal(pCol, *numOfRows, (const char *)cgroup, false));

    // vg id
    pCol = taosArrayGet(pBlock->pDataBlock, colIdx++);
    MND_TMQ_NULL_CHECK(pCol);
    MND_TMQ_RETURN_CHECK(colDataSetVal(pCol, *numOfRows, (const char *)&pVgEp->vgId, false));

    // consumer id, rendered as a hex string
    char consumerIdHex[TSDB_CONSUMER_ID_LEN] = {0};
    (void)snprintf(varDataVal(consumerIdHex), TSDB_CONSUMER_ID_LEN - VARSTR_HEADER_SIZE, "0x%" PRIx64, consumerId);
    varDataSetLen(consumerIdHex, strlen(varDataVal(consumerIdHex)));

    pCol = taosArrayGet(pBlock->pDataBlock, colIdx++);
    MND_TMQ_NULL_CHECK(pCol);
    MND_TMQ_RETURN_CHECK(colDataSetVal(pCol, *numOfRows, (const char *)consumerIdHex, consumerId == -1));

    // user (NULL column when the caller has no user)
    char userStr[TSDB_USER_LEN + VARSTR_HEADER_SIZE] = {0};
    if (user) STR_TO_VARSTR(userStr, user);
    pCol = taosArrayGet(pBlock->pDataBlock, colIdx++);
    MND_TMQ_NULL_CHECK(pCol);
    MND_TMQ_RETURN_CHECK(colDataSetVal(pCol, *numOfRows, userStr, user == NULL));

    // fqdn (NULL column when the caller has no fqdn)
    char fqdnStr[TSDB_FQDN_LEN + VARSTR_HEADER_SIZE] = {0};
    if (fqdn) STR_TO_VARSTR(fqdnStr, fqdn);
    pCol = taosArrayGet(pBlock->pDataBlock, colIdx++);
    MND_TMQ_NULL_CHECK(pCol);
    MND_TMQ_RETURN_CHECK(colDataSetVal(pCol, *numOfRows, fqdnStr, fqdn == NULL));

    mInfo("mnd show subscriptions: topic %s, consumer:0x%" PRIx64 " cgroup %s vgid %d", varDataVal(topic), consumerId,
          varDataVal(cgroup), pVgEp->vgId);

    // offset: scan every entry; the last entry with a matching vgId wins
    OffsetRows *pMatched = NULL;
    for (int i = 0; i < taosArrayGetSize(offsetRows); i++) {
      OffsetRows *pRow = taosArrayGet(offsetRows, i);
      MND_TMQ_NULL_CHECK(pRow);
      if (pRow->vgId == pVgEp->vgId) {
        pMatched = pRow;
      } else {
        mInfo("mnd show subscriptions: do not find vgId:%d, %d in offsetRows", pRow->vgId, pVgEp->vgId);
      }
    }

    if (pMatched == NULL) {
      // no offset entry for this vgroup: offset and rows columns are NULL
      pCol = taosArrayGet(pBlock->pDataBlock, colIdx++);
      MND_TMQ_NULL_CHECK(pCol);
      colDataSetNULL(pCol, *numOfRows);
      pCol = taosArrayGet(pBlock->pDataBlock, colIdx++);
      MND_TMQ_NULL_CHECK(pCol);
      colDataSetNULL(pCol, *numOfRows);
      mInfo("mnd show subscriptions: do not find vgId:%d in offsetRows", pVgEp->vgId);
    } else {
      // offset column: formatted offset followed by "/<ever>"
      char offsetStr[TSDB_OFFSET_LEN * 2 + VARSTR_HEADER_SIZE] = {0};
      (void)tFormatOffset(varDataVal(offsetStr), TSDB_OFFSET_LEN, &pMatched->offset);
      (void)snprintf(varDataVal(offsetStr) + strlen(varDataVal(offsetStr)),
                     sizeof(offsetStr) - VARSTR_HEADER_SIZE - strlen(varDataVal(offsetStr)), "/%" PRId64,
                     pMatched->ever);
      varDataSetLen(offsetStr, strlen(varDataVal(offsetStr)));
      pCol = taosArrayGet(pBlock->pDataBlock, colIdx++);
      MND_TMQ_NULL_CHECK(pCol);
      MND_TMQ_RETURN_CHECK(colDataSetVal(pCol, *numOfRows, (const char *)offsetStr, false));

      // rows column
      pCol = taosArrayGet(pBlock->pDataBlock, colIdx++);
      MND_TMQ_NULL_CHECK(pCol);
      MND_TMQ_RETURN_CHECK(colDataSetVal(pCol, *numOfRows, (const char *)&pMatched->rows, false));
    }

    (*numOfRows)++;
  }
  return 0;

END:
  return code;
}
1537

1538
/*
 * Fill a result block for "show subscriptions".
 *
 * Iterates SDB_SUBSCRIBE objects starting from pShow->pIter. For each
 * subscription, under its read latch, emits rows for the vgroups of every
 * consumer in the consumer hash and then for the unassigned vgroups.
 *
 * @param pReq          request; pReq->info.node supplies the mnode
 * @param pShow         show state; pIter is advanced and numOfRows accumulated
 * @param pBlock        output data block; info.rows is updated per subscription
 * @param rowsCapacity  row budget; fetching stops once numOfRows reaches it
 * @return number of rows written on success, TSDB_CODE_INVALID_PARA on NULL
 *         arguments, otherwise the error code of the failing step
 */
int32_t mndRetrieveSubscribe(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rowsCapacity) {
  if (pReq == NULL || pShow == NULL || pBlock == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }
  SMnode          *pMnode = pReq->info.node;
  SSdb            *pSdb = pMnode->pSdb;
  int32_t          numOfRows = 0;
  SMqSubscribeObj *pSub = NULL;
  int32_t          code = 0;

  mInfo("mnd show subscriptions begin");

  while (numOfRows < rowsCapacity) {
    pShow->pIter = sdbFetch(pSdb, SDB_SUBSCRIBE, pShow->pIter, (void **)&pSub);
    if (pShow->pIter == NULL) {
      break;
    }

    taosRLockLatch(&pSub->lock);

    // one subscription can add up to vgNum rows; grow the block if that exceeds the budget
    if (numOfRows + pSub->vgNum > rowsCapacity) {
      MND_TMQ_RETURN_CHECK(blockDataEnsureCapacity(pBlock, numOfRows + pSub->vgNum));
    }

    // topic and cgroup
    char topic[TSDB_TOPIC_FNAME_LEN + VARSTR_HEADER_SIZE] = {0};
    char cgroup[TSDB_CGROUP_LEN + VARSTR_HEADER_SIZE] = {0};
    mndSplitSubscribeKey(pSub->key, varDataVal(topic), varDataVal(cgroup), false);
    varDataSetLen(topic, strlen(varDataVal(topic)));
    varDataSetLen(cgroup, strlen(varDataVal(cgroup)));

    SMqConsumerEp *pConsumerEp = NULL;
    void          *pIter = NULL;

    while (1) {
      pIter = taosHashIterate(pSub->consumerHash, pIter);
      if (pIter == NULL) break;
      pConsumerEp = (SMqConsumerEp *)pIter;

      char           *user = NULL;
      char           *fqdn = NULL;
      SMqConsumerObj *pConsumer = sdbAcquire(pSdb, SDB_CONSUMER, &pConsumerEp->consumerId);
      if (pConsumer != NULL) {
        user = pConsumer->user;
        fqdn = pConsumer->fqdn;
      }

      // user/fqdn point into pConsumer, so the reference is held until
      // buildResult has copied them into the block.
      code = buildResult(pBlock, &numOfRows, pConsumerEp->consumerId, user, fqdn, topic, cgroup, pConsumerEp->vgs,
                         pConsumerEp->offsetRows);
      if (pConsumer != NULL) {
        sdbRelease(pSdb, pConsumer);
      }
      if (code != 0) {
        // NOTE(review): this leaves the consumerHash iteration unfinished; if the
        // hash API requires an explicit cancel on early exit, add it here -- confirm.
        goto END;
      }
    }

    // vgroups not assigned to any consumer: consumer id -1, no user/fqdn
    MND_TMQ_RETURN_CHECK(buildResult(pBlock, &numOfRows, -1, NULL, NULL, topic, cgroup, pSub->unassignedVgs, pSub->offsetRows));

    pBlock->info.rows = numOfRows;

    taosRUnLockLatch(&pSub->lock);
    sdbRelease(pSdb, pSub);
  }

  mInfo("mnd end show subscriptions");

  pShow->numOfRows += numOfRows;
  return numOfRows;

END:
  // every jump to END happens while the subscription's read latch is held
  taosRUnLockLatch(&pSub->lock);
  sdbRelease(pSdb, pSub);

  return code;
}
1608

1609
/*
 * Cancel an in-progress SDB_SUBSCRIBE fetch.
 *
 * @param pMnode  mnode handle; the call does nothing when it is NULL
 * @param pIter   iterator to cancel, passed through to sdbCancelFetchByType
 */
void mndCancelGetNextSubscribe(SMnode *pMnode, void *pIter) {
  if (pMnode != NULL) {
    sdbCancelFetchByType(pMnode->pSdb, pIter, SDB_SUBSCRIBE);
  }
}
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc