• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #4180

27 May 2025 10:49AM UTC coverage: 63.267% (+0.4%) from 62.885%
#4180

push

travis-ci

web-flow
TD-35056 (#31227)

158426 of 318644 branches covered (49.72%)

Branch coverage included in aggregate %.

243945 of 317346 relevant lines covered (76.87%)

18276423.81 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

59.32
/source/dnode/mnode/impl/src/mndVgroup.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15

16
#define _DEFAULT_SOURCE
17
#include "audit.h"
18
#include "mndArbGroup.h"
19
#include "mndDb.h"
20
#include "mndDnode.h"
21
#include "mndMnode.h"
22
#include "mndPrivilege.h"
23
#include "mndShow.h"
24
#include "mndStb.h"
25
#include "mndStream.h"
26
#include "mndTopic.h"
27
#include "mndTrans.h"
28
#include "mndUser.h"
29
#include "mndVgroup.h"
30
#include "tmisce.h"
31

32
#define VGROUP_VER_NUMBER   1
33
#define VGROUP_RESERVE_SIZE 64
34

35
static int32_t mndVgroupActionInsert(SSdb *pSdb, SVgObj *pVgroup);
36
static int32_t mndVgroupActionDelete(SSdb *pSdb, SVgObj *pVgroup);
37
static int32_t mndVgroupActionUpdate(SSdb *pSdb, SVgObj *pOld, SVgObj *pNew);
38
static int32_t mndNewVgActionValidate(SMnode *pMnode, STrans *pTrans, SSdbRaw *pRaw);
39

40
static int32_t mndRetrieveVgroups(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows);
41
static void    mndCancelGetNextVgroup(SMnode *pMnode, void *pIter);
42
static int32_t mndRetrieveVnodes(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows);
43
static void    mndCancelGetNextVnode(SMnode *pMnode, void *pIter);
44

45
static int32_t mndProcessRedistributeVgroupMsg(SRpcMsg *pReq);
46
static int32_t mndProcessSplitVgroupMsg(SRpcMsg *pReq);
47
static int32_t mndProcessBalanceVgroupMsg(SRpcMsg *pReq);
48
static int32_t mndProcessVgroupBalanceLeaderMsg(SRpcMsg *pReq);
49

50
/**
 * Wire up the vgroup module of the mnode.
 *
 * Installs the message handlers for vnode/dnode responses (all forwarded to
 * the transaction response processor), the vgroup management requests, the
 * show-table retrieve/free-iterator callbacks, and finally registers the
 * SDB_VGROUP table with the sdb.
 *
 * @param pMnode mnode instance the handlers are installed on.
 * @return whatever sdbSetTable() returns for the vgroup table.
 */
int32_t mndInitVgroup(SMnode *pMnode) {
  /* Responses that are consumed by the transaction engine. */
  mndSetMsgHandle(pMnode, TDMT_DND_CREATE_VNODE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_ALTER_REPLICA_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_ALTER_CONFIG_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_ALTER_CONFIRM_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_ALTER_HASHRANGE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_DND_DROP_VNODE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_COMPACT_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_DISABLE_WRITE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_SYNC_FORCE_FOLLOWER_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_DND_ALTER_VNODE_TYPE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_DND_CHECK_VNODE_LEARNER_CATCHUP_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_SYNC_CONFIG_CHANGE_RSP, mndTransProcessRsp);

  /* Vgroup management requests handled in this file. */
  mndSetMsgHandle(pMnode, TDMT_MND_REDISTRIBUTE_VGROUP, mndProcessRedistributeVgroupMsg);
  mndSetMsgHandle(pMnode, TDMT_MND_SPLIT_VGROUP, mndProcessSplitVgroupMsg);
  mndSetMsgHandle(pMnode, TDMT_MND_BALANCE_VGROUP, mndProcessBalanceVgroupMsg);
  mndSetMsgHandle(pMnode, TDMT_MND_BALANCE_VGROUP_LEADER, mndProcessVgroupBalanceLeaderMsg);

  /* Show-table callbacks for vgroups and vnodes. */
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_VGROUP, mndRetrieveVgroups);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_VGROUP, mndCancelGetNextVgroup);
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_VNODES, mndRetrieveVnodes);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_VNODES, mndCancelGetNextVnode);

  /* Describe the vgroup table and hand it to the sdb last. */
  SSdbTable vgroupTable = {
      .sdbType = SDB_VGROUP,
      .keyType = SDB_KEY_INT32,
      .encodeFp = (SdbEncodeFp)mndVgroupActionEncode,
      .decodeFp = (SdbDecodeFp)mndVgroupActionDecode,
      .insertFp = (SdbInsertFp)mndVgroupActionInsert,
      .updateFp = (SdbUpdateFp)mndVgroupActionUpdate,
      .deleteFp = (SdbDeleteFp)mndVgroupActionDelete,
      .validateFp = (SdbValidateFp)mndNewVgActionValidate,
  };
  return sdbSetTable(pMnode->pSdb, vgroupTable);
}
88

89
/** Counterpart of mndInitVgroup(); currently there is nothing to release. */
void mndCleanupVgroup(SMnode *pMnode) {
}
2,279✔
90

91
/**
 * Serialize a vgroup object into a freshly allocated sdb raw record.
 *
 * Written fields, in order: vgId, createdTime, updateTime, version, hashBegin,
 * hashEnd, dbName, dbUid, isTsma, replica, one dnodeId per replica,
 * syncConfChangeVer, then VGROUP_RESERVE_SIZE reserved bytes.
 *
 * @param pVgroup vgroup to encode.
 * @return the raw record, or NULL on failure (terrno is left non-zero and the
 *         partially built record is freed).
 */
SSdbRaw *mndVgroupActionEncode(SVgObj *pVgroup) {
  int32_t  code = 0;
  int32_t  lino = 0;
  int32_t  dataPos = 0;
  SSdbRaw *pRaw = NULL;

  /* Pessimistic default: only cleared once every field has been written. */
  terrno = TSDB_CODE_OUT_OF_MEMORY;

  pRaw = sdbAllocRaw(SDB_VGROUP, VGROUP_VER_NUMBER, sizeof(SVgObj) + VGROUP_RESERVE_SIZE);
  if (pRaw == NULL) goto _OVER;

  SDB_SET_INT32(pRaw, dataPos, pVgroup->vgId, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pVgroup->createdTime, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pVgroup->updateTime, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pVgroup->version, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pVgroup->hashBegin, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pVgroup->hashEnd, _OVER)
  SDB_SET_BINARY(pRaw, dataPos, pVgroup->dbName, TSDB_DB_FNAME_LEN, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pVgroup->dbUid, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pVgroup->isTsma, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pVgroup->replica, _OVER)
  for (int8_t i = 0; i < pVgroup->replica; ++i) {
    /* Only the dnode id of each member is persisted. */
    SDB_SET_INT32(pRaw, dataPos, pVgroup->vnodeGid[i].dnodeId, _OVER)
  }
  SDB_SET_INT32(pRaw, dataPos, pVgroup->syncConfChangeVer, _OVER)
  SDB_SET_RESERVE(pRaw, dataPos, VGROUP_RESERVE_SIZE, _OVER)
  SDB_SET_DATALEN(pRaw, dataPos, _OVER)

  terrno = 0;

_OVER:
  if (terrno == 0) {
    mTrace("vgId:%d, encode to raw:%p, row:%p", pVgroup->vgId, pRaw, pVgroup);
    return pRaw;
  }

  mError("vgId:%d, failed to encode to raw:%p since %s", pVgroup->vgId, pRaw, terrstr());
  sdbFreeRaw(pRaw);
  return NULL;
}
130

131
/**
 * Rebuild a vgroup row from an sdb raw record.
 *
 * Reads the fields in the order written by mndVgroupActionEncode(). The
 * syncConfChangeVer field is only read when the record is long enough to
 * contain it in front of the reserved area, so shorter records still decode.
 * A single-replica vgroup has its only member marked as leader.
 *
 * The replica count comes from the raw data and is used to index
 * pVgroup->vnodeGid[], so it is range-checked before the member loop;
 * an out-of-range value is rejected with TSDB_CODE_APP_ERROR.
 *
 * @param pRaw raw record to decode.
 * @return the new row, or NULL on failure (terrno is non-zero and the row is
 *         freed).
 */
SSdbRow *mndVgroupActionDecode(SSdbRaw *pRaw) {
  int32_t code = 0;
  int32_t lino = 0;
  terrno = TSDB_CODE_OUT_OF_MEMORY;
  SSdbRow *pRow = NULL;
  SVgObj  *pVgroup = NULL;

  int8_t sver = 0;
  if (sdbGetRawSoftVer(pRaw, &sver) != 0) goto _OVER;

  if (sver < 1 || sver > VGROUP_VER_NUMBER) {
    terrno = TSDB_CODE_SDB_INVALID_DATA_VER;
    goto _OVER;
  }

  pRow = sdbAllocRow(sizeof(SVgObj));
  if (pRow == NULL) goto _OVER;

  pVgroup = sdbGetRowObj(pRow);
  if (pVgroup == NULL) goto _OVER;

  int32_t dataPos = 0;
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->vgId, _OVER)
  SDB_GET_INT64(pRaw, dataPos, &pVgroup->createdTime, _OVER)
  SDB_GET_INT64(pRaw, dataPos, &pVgroup->updateTime, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->version, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->hashBegin, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->hashEnd, _OVER)
  SDB_GET_BINARY(pRaw, dataPos, pVgroup->dbName, TSDB_DB_FNAME_LEN, _OVER)
  SDB_GET_INT64(pRaw, dataPos, &pVgroup->dbUid, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &pVgroup->isTsma, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &pVgroup->replica, _OVER)

  /* Never trust the persisted count as an array bound for vnodeGid[]. */
  if (pVgroup->replica < 0 || pVgroup->replica > TSDB_MAX_REPLICA + TSDB_MAX_LEARNER_REPLICA) {
    terrno = TSDB_CODE_APP_ERROR;
    goto _OVER;
  }

  for (int8_t i = 0; i < pVgroup->replica; ++i) {
    SVnodeGid *pVgid = &pVgroup->vnodeGid[i];
    SDB_GET_INT32(pRaw, dataPos, &pVgid->dnodeId, _OVER)
    if (pVgroup->replica == 1) {
      /* A lone member is treated as the leader right away. */
      pVgid->syncState = TAOS_SYNC_STATE_LEADER;
    }
  }

  /* Optional field: present only if it fits before the reserved bytes. */
  if (dataPos + sizeof(int32_t) + VGROUP_RESERVE_SIZE <= pRaw->dataLen) {
    SDB_GET_INT32(pRaw, dataPos, &pVgroup->syncConfChangeVer, _OVER)
  }

  SDB_GET_RESERVE(pRaw, dataPos, VGROUP_RESERVE_SIZE, _OVER)

  terrno = 0;

_OVER:
  if (terrno != 0) {
    mError("vgId:%d, failed to decode from raw:%p since %s", pVgroup == NULL ? 0 : pVgroup->vgId, pRaw, terrstr());
    taosMemoryFreeClear(pRow);
    return NULL;
  }

  mTrace("vgId:%d, decode from raw:%p, row:%p", pVgroup->vgId, pRaw, pVgroup);
  return pRow;
}
188

189
/**
 * Validate a raw record describing a new vgroup before it is applied.
 *
 * The record is decoded into a temporary row; validation fails with -1 when
 * the largest vgroup id already present in the sdb is greater than the id of
 * the decoded vgroup. The temporary row is always released before returning.
 *
 * @param pMnode mnode owning the sdb.
 * @param pTrans transaction the record belongs to (used for logging).
 * @param pRaw   raw record to check.
 * @return 0 when valid; terrno or TSDB_CODE_MND_RETURN_VALUE_NULL when the
 *         record cannot be decoded; -1 when the id is already in use.
 */
static int32_t mndNewVgActionValidate(SMnode *pMnode, STrans *pTrans, SSdbRaw *pRaw) {
  SSdb   *pSdb = pMnode->pSdb;
  SVgObj *pVgroup = NULL;
  int     code = -1;

  SSdbRow *pRow = mndVgroupActionDecode(pRaw);
  if (pRow != NULL) {
    pVgroup = sdbGetRowObj(pRow);
  }
  if (pRow == NULL || pVgroup == NULL) {
    /* Prefer the specific error left in terrno, if any. */
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    goto _OVER;
  }

  int32_t maxVgId = sdbGetMaxId(pSdb, SDB_VGROUP);
  if (maxVgId <= pVgroup->vgId) {
    code = 0;
  } else {
    mError("trans:%d, vgroup id %d already in use. maxVgId:%d", pTrans->id, pVgroup->vgId, maxVgId);
  }

_OVER:
  if (pVgroup != NULL) {
    mndVgroupActionDelete(pSdb, pVgroup);
  }
  taosMemoryFreeClear(pRow);
  TAOS_RETURN(code);
}
220

221
/**
 * sdb insert hook for vgroups: only traces the event.
 *
 * @return always 0.
 */
static int32_t mndVgroupActionInsert(SSdb *pSdb, SVgObj *pVgroup) {
  const int32_t rc = 0;
  mTrace("vgId:%d, perform insert action, row:%p", pVgroup->vgId, pVgroup);
  return rc;
}
225

226
/**
 * sdb delete hook for vgroups: only traces the event.
 *
 * @return always 0.
 */
static int32_t mndVgroupActionDelete(SSdb *pSdb, SVgObj *pVgroup) {
  const int32_t rc = 0;
  mTrace("vgId:%d, perform delete action, row:%p", pVgroup->vgId, pVgroup);
  return rc;
}
230

231
/**
 * sdb update hook: merge a new vgroup row into the existing one.
 *
 * Persisted attributes (update time, version, hash range, replica count,
 * tsma flag, member list, syncConfChangeVer) are taken from pNew. Runtime
 * state is carried over from pOld: for every member whose dnode id appears in
 * both rows the sync/buffer status is copied into pNew before the member
 * array is copied back, and the vgroup statistics are copied into pNew.
 *
 * @return always 0.
 */
static int32_t mndVgroupActionUpdate(SSdb *pSdb, SVgObj *pOld, SVgObj *pNew) {
  mTrace("vgId:%d, perform update action, old row:%p new row:%p", pOld->vgId, pOld, pNew);

  pOld->updateTime = pNew->updateTime;
  pOld->version = pNew->version;
  pOld->hashBegin = pNew->hashBegin;
  pOld->hashEnd = pNew->hashEnd;
  pOld->replica = pNew->replica;
  pOld->isTsma = pNew->isTsma;

  /* Preserve the runtime status of members that stay in the group. */
  for (int32_t n = 0; n < pNew->replica; ++n) {
    SVnodeGid *pDst = &pNew->vnodeGid[n];
    for (int32_t o = 0; o < pOld->replica; ++o) {
      SVnodeGid *pSrc = &pOld->vnodeGid[o];
      if (pDst->dnodeId != pSrc->dnodeId) {
        continue;
      }
      pDst->syncState = pSrc->syncState;
      pDst->syncRestore = pSrc->syncRestore;
      pDst->syncCanRead = pSrc->syncCanRead;
      pDst->syncAppliedIndex = pSrc->syncAppliedIndex;
      pDst->syncCommitIndex = pSrc->syncCommitIndex;
      pDst->bufferSegmentUsed = pSrc->bufferSegmentUsed;
      pDst->bufferSegmentSize = pSrc->bufferSegmentSize;
    }
  }

  /* Statistics live only in the old row; mirror them into the new one. */
  pNew->numOfTables = pOld->numOfTables;
  pNew->numOfTimeSeries = pOld->numOfTimeSeries;
  pNew->totalStorage = pOld->totalStorage;
  pNew->compStorage = pOld->compStorage;
  pNew->pointsWritten = pOld->pointsWritten;
  pNew->compact = pOld->compact;

  memcpy(pOld->vnodeGid, pNew->vnodeGid, (TSDB_MAX_REPLICA + TSDB_MAX_LEARNER_REPLICA) * sizeof(SVnodeGid));
  pOld->syncConfChangeVer = pNew->syncConfChangeVer;
  return 0;
}
264

265
/**
 * Acquire a vgroup object from the sdb by id.
 *
 * A generic "object not there" sdb error is translated into
 * TSDB_CODE_MND_VGROUP_NOT_EXIST.
 *
 * @return the vgroup, or NULL with terrno set.
 */
SVgObj *mndAcquireVgroup(SMnode *pMnode, int32_t vgId) {
  SVgObj *pFound = sdbAcquire(pMnode->pSdb, SDB_VGROUP, &vgId);
  if (pFound != NULL) {
    return pFound;
  }

  if (terrno == TSDB_CODE_SDB_OBJ_NOT_THERE) {
    terrno = TSDB_CODE_MND_VGROUP_NOT_EXIST;
  }
  return NULL;
}
273

274
/** Hand a vgroup obtained from the sdb back to the mnode's sdb via sdbRelease(). */
void mndReleaseVgroup(SMnode *pMnode, SVgObj *pVgroup) {
  sdbRelease(pMnode->pSdb, pVgroup);
}
723,633✔
278

279
/**
 * Build the serialized "create vnode" request sent to one dnode of a vgroup.
 *
 * The request carries the database configuration, the vgroup identity/hash
 * range and the endpoints of every member, split into voters (replicas[]) and
 * learners (learnerReplicas[]). selfIndex / learnerSelfIndex is the position
 * of pDnode inside the corresponding array, or -1 if it is not there.
 *
 * Side effect: pVgroup->syncConfChangeVer is incremented on every call, even
 * if the function later fails.
 *
 * @param pMnode   mnode used to look up member dnodes.
 * @param pDnode   target dnode of the request.
 * @param pDb      database the vgroup belongs to.
 * @param pVgroup  vgroup being created.
 * @param pContLen out: length of the returned buffer.
 * @return buffer allocated with taosMemoryMalloc() (caller frees), or NULL on
 *         failure (a member dnode cannot be acquired, pDnode is not a member,
 *         or sizing/allocation/serialization fails).
 */
void *mndBuildCreateVnodeReq(SMnode *pMnode, SDnodeObj *pDnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen) {
  SCreateVnodeReq createReq = {0};
  createReq.vgId = pVgroup->vgId;
  memcpy(createReq.db, pDb->name, TSDB_DB_FNAME_LEN);
  createReq.dbUid = pDb->uid;
  createReq.vgVersion = pVgroup->version;
  createReq.numOfStables = pDb->cfg.numOfStables;
  createReq.buffer = pDb->cfg.buffer;
  createReq.pageSize = pDb->cfg.pageSize;
  createReq.pages = pDb->cfg.pages;
  createReq.cacheLastSize = pDb->cfg.cacheLastSize;
  createReq.daysPerFile = pDb->cfg.daysPerFile;
  createReq.daysToKeep0 = pDb->cfg.daysToKeep0;
  createReq.daysToKeep1 = pDb->cfg.daysToKeep1;
  createReq.daysToKeep2 = pDb->cfg.daysToKeep2;
  createReq.keepTimeOffset = pDb->cfg.keepTimeOffset;
  createReq.s3ChunkSize = pDb->cfg.s3ChunkSize;
  createReq.s3KeepLocal = pDb->cfg.s3KeepLocal;
  createReq.s3Compact = pDb->cfg.s3Compact;
  createReq.minRows = pDb->cfg.minRows;
  createReq.maxRows = pDb->cfg.maxRows;
  createReq.walFsyncPeriod = pDb->cfg.walFsyncPeriod;
  createReq.walLevel = pDb->cfg.walLevel;
  createReq.precision = pDb->cfg.precision;
  createReq.compression = pDb->cfg.compression;
  createReq.strict = pDb->cfg.strict;
  createReq.cacheLast = pDb->cfg.cacheLast;
  createReq.replica = 0;
  createReq.learnerReplica = 0;
  createReq.selfIndex = -1;
  createReq.learnerSelfIndex = -1;
  createReq.hashBegin = pVgroup->hashBegin;
  createReq.hashEnd = pVgroup->hashEnd;
  createReq.hashMethod = pDb->cfg.hashMethod;
  createReq.numOfRetensions = pDb->cfg.numOfRetensions;
  createReq.pRetensions = pDb->cfg.pRetensions;
  createReq.isTsma = pVgroup->isTsma;
  createReq.pTsma = pVgroup->pTsma;
  createReq.walRetentionPeriod = pDb->cfg.walRetentionPeriod;
  createReq.walRetentionSize = pDb->cfg.walRetentionSize;
  createReq.walRollPeriod = pDb->cfg.walRollPeriod;
  createReq.walSegmentSize = pDb->cfg.walSegmentSize;
  createReq.sstTrigger = pDb->cfg.sstTrigger;
  createReq.hashPrefix = pDb->cfg.hashPrefix;
  createReq.hashSuffix = pDb->cfg.hashSuffix;
  createReq.tsdbPageSize = pDb->cfg.tsdbPageSize;
  /* Bump the vgroup's config-change version and ship the new value. */
  createReq.changeVersion = ++(pVgroup->syncConfChangeVer);
  createReq.encryptAlgorithm = pDb->cfg.encryptAlgorithm;
  int32_t code = 0;

  for (int32_t v = 0; v < pVgroup->replica; ++v) {
    SVnodeGid *pVgid = &pVgroup->vnodeGid[v];
    bool       isVoter = (pVgid->nodeRole == TAOS_SYNC_ROLE_VOTER);

    /* Next free slot of the array matching this member's role. */
    SReplica *pReplica =
        isVoter ? &createReq.replicas[createReq.replica] : &createReq.learnerReplicas[createReq.learnerReplica];

    SDnodeObj *pVgidDnode = mndAcquireDnode(pMnode, pVgid->dnodeId);
    if (pVgidDnode == NULL) {
      return NULL;
    }

    pReplica->id = pVgidDnode->id;
    pReplica->port = pVgidDnode->port;
    memcpy(pReplica->fqdn, pVgidDnode->fqdn, TSDB_FQDN_LEN);
    mndReleaseDnode(pMnode, pVgidDnode);

    /* Record the target dnode's position before the slot counter advances. */
    if (pDnode->id == pVgid->dnodeId) {
      if (isVoter) {
        createReq.selfIndex = createReq.replica;
      } else {
        createReq.learnerSelfIndex = createReq.learnerReplica;
      }
    }

    if (isVoter) {
      createReq.replica++;
    } else {
      createReq.learnerReplica++;
    }
  }

  /* The target dnode must be a member in one of the two roles. */
  if (createReq.selfIndex == -1 && createReq.learnerSelfIndex == -1) {
    terrno = TSDB_CODE_APP_ERROR;
    return NULL;
  }

  mInfo(
      "vgId:%d, build create vnode req, replica:%d selfIndex:%d learnerReplica:%d learnerSelfIndex:%d strict:%d "
      "changeVersion:%d",
      createReq.vgId, createReq.replica, createReq.selfIndex, createReq.learnerReplica, createReq.learnerSelfIndex,
      createReq.strict, createReq.changeVersion);
  for (int32_t i = 0; i < createReq.replica; ++i) {
    mInfo("vgId:%d, replica:%d ep:%s:%u", createReq.vgId, i, createReq.replicas[i].fqdn, createReq.replicas[i].port);
  }
  for (int32_t i = 0; i < createReq.learnerReplica; ++i) {
    /* Label learners as such, matching the alter/check-catchup request logs. */
    mInfo("vgId:%d, learnerReplica:%d ep:%s:%u", createReq.vgId, i, createReq.learnerReplicas[i].fqdn,
          createReq.learnerReplicas[i].port);
  }

  /* First pass with a NULL buffer only computes the encoded size. */
  int32_t contLen = tSerializeSCreateVnodeReq(NULL, 0, &createReq);
  if (contLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  code = tSerializeSCreateVnodeReq(pReq, contLen, &createReq);
  if (code < 0) {
    terrno = TSDB_CODE_APP_ERROR;
    taosMemoryFree(pReq);
    mError("vgId:%d, failed to serialize create vnode req,since %s", createReq.vgId, terrstr());
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
408

409
/**
 * Build an "alter vnode config" message: an SMsgHead followed by the
 * serialized SAlterVnodeConfigReq filled from the database configuration.
 *
 * The header's contLen and vgId are stored in network byte order.
 *
 * @param pMnode   unused here.
 * @param pDb      database whose configuration is sent.
 * @param pVgroup  target vgroup (supplies vgId and version).
 * @param pContLen out: total message length including the header.
 * @return buffer allocated with taosMemoryMalloc() (caller frees), or NULL
 *         with terrno set to TSDB_CODE_OUT_OF_MEMORY on failure.
 */
static void *mndBuildAlterVnodeConfigReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen) {
  SAlterVnodeConfigReq alterReq = {0};
  alterReq.vgVersion = pVgroup->version;
  alterReq.buffer = pDb->cfg.buffer;
  alterReq.pageSize = pDb->cfg.pageSize;
  alterReq.pages = pDb->cfg.pages;
  alterReq.cacheLastSize = pDb->cfg.cacheLastSize;
  alterReq.daysPerFile = pDb->cfg.daysPerFile;
  alterReq.daysToKeep0 = pDb->cfg.daysToKeep0;
  alterReq.daysToKeep1 = pDb->cfg.daysToKeep1;
  alterReq.daysToKeep2 = pDb->cfg.daysToKeep2;
  alterReq.keepTimeOffset = pDb->cfg.keepTimeOffset;
  alterReq.walFsyncPeriod = pDb->cfg.walFsyncPeriod;
  alterReq.walLevel = pDb->cfg.walLevel;
  alterReq.strict = pDb->cfg.strict;
  alterReq.cacheLast = pDb->cfg.cacheLast;
  alterReq.sttTrigger = pDb->cfg.sstTrigger;
  alterReq.minRows = pDb->cfg.minRows;
  alterReq.walRetentionPeriod = pDb->cfg.walRetentionPeriod;
  alterReq.walRetentionSize = pDb->cfg.walRetentionSize;
  alterReq.s3KeepLocal = pDb->cfg.s3KeepLocal;
  alterReq.s3Compact = pDb->cfg.s3Compact;

  mInfo("vgId:%d, build alter vnode config req", pVgroup->vgId);

  /* Size of the serialized payload alone (NULL buffer = size query). */
  int32_t bodyLen = tSerializeSAlterVnodeConfigReq(NULL, 0, &alterReq);
  if (bodyLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  int32_t contLen = bodyLen + (int32_t)sizeof(SMsgHead);

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  SMsgHead *pHead = pReq;
  pHead->contLen = htonl(contLen);
  pHead->vgId = htonl(pVgroup->vgId);

  /* The payload starts after the header, so only bodyLen bytes are available
   * there; passing the full contLen would overstate the buffer size. */
  if (tSerializeSAlterVnodeConfigReq((char *)pReq + sizeof(SMsgHead), bodyLen, &alterReq) < 0) {
    taosMemoryFree(pReq);
    mError("vgId:%d, failed to serialize alter vnode config req,since %s", pVgroup->vgId, terrstr());
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
459

460
/**
 * Build the serialized "alter vnode replica" request for one dnode.
 *
 * Members of the vgroup are split into voters (replicas[]) and learners
 * (learnerReplicas[]). The self index fields are set to the member's position
 * in pVgroup->vnodeGid[] when its dnode id equals dnodeId.
 * NOTE(review): mndBuildCreateVnodeReq() stores the position inside the
 * replicas/learnerReplicas array instead; confirm which one the receiver
 * expects when voters and learners are mixed.
 *
 * Side effect: pVgroup->syncConfChangeVer is incremented on every call.
 *
 * @param pContLen out: length of the returned buffer.
 * @return buffer allocated with taosMemoryMalloc() (caller frees), or NULL on
 *         failure.
 */
static void *mndBuildAlterVnodeReplicaReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId,
                                          int32_t *pContLen) {
  SAlterVnodeReplicaReq alterReq = {
      .vgId = pVgroup->vgId,
      .strict = pDb->cfg.strict,
      .replica = 0,
      .learnerReplica = 0,
      .selfIndex = -1,
      .learnerSelfIndex = -1,
      .changeVersion = ++(pVgroup->syncConfChangeVer),
  };

  for (int32_t v = 0; v < pVgroup->replica; ++v) {
    SVnodeGid *pMember = &pVgroup->vnodeGid[v];
    bool       isVoter = (pMember->nodeRole == TAOS_SYNC_ROLE_VOTER);
    SReplica  *pSlot = NULL;

    /* Claim the next slot of the array that matches the member's role. */
    if (isVoter) {
      pSlot = &alterReq.replicas[alterReq.replica];
      alterReq.replica++;
    } else {
      pSlot = &alterReq.learnerReplicas[alterReq.learnerReplica];
      alterReq.learnerReplica++;
    }

    SDnodeObj *pMemberDnode = mndAcquireDnode(pMnode, pMember->dnodeId);
    if (pMemberDnode == NULL) return NULL;

    pSlot->id = pMemberDnode->id;
    pSlot->port = pMemberDnode->port;
    memcpy(pSlot->fqdn, pMemberDnode->fqdn, TSDB_FQDN_LEN);
    mndReleaseDnode(pMnode, pMemberDnode);

    if (dnodeId == pMember->dnodeId) {
      if (isVoter) {
        alterReq.selfIndex = v;
      } else {
        alterReq.learnerSelfIndex = v;
      }
    }
  }

  mInfo(
      "vgId:%d, build alter vnode req, replica:%d selfIndex:%d learnerReplica:%d learnerSelfIndex:%d strict:%d "
      "changeVersion:%d",
      alterReq.vgId, alterReq.replica, alterReq.selfIndex, alterReq.learnerReplica, alterReq.learnerSelfIndex,
      alterReq.strict, alterReq.changeVersion);
  for (int32_t i = 0; i < alterReq.replica; ++i) {
    mInfo("vgId:%d, replica:%d ep:%s:%u", alterReq.vgId, i, alterReq.replicas[i].fqdn, alterReq.replicas[i].port);
  }
  for (int32_t i = 0; i < alterReq.learnerReplica; ++i) {
    mInfo("vgId:%d, learnerReplica:%d ep:%s:%u", alterReq.vgId, i, alterReq.learnerReplicas[i].fqdn,
          alterReq.learnerReplicas[i].port);
  }

  /* The addressed dnode has to be a member of the group. */
  if (alterReq.selfIndex == -1 && alterReq.learnerSelfIndex == -1) {
    terrno = TSDB_CODE_APP_ERROR;
    return NULL;
  }

  /* Size query first, then the real encode into an exactly sized buffer. */
  int32_t reqLen = tSerializeSAlterVnodeReplicaReq(NULL, 0, &alterReq);
  if (reqLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  void *pBuf = taosMemoryMalloc(reqLen);
  if (pBuf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSAlterVnodeReplicaReq(pBuf, reqLen, &alterReq) < 0) {
    mError("vgId:%d, failed to serialize alter vnode req,since %s", alterReq.vgId, terrstr());
    taosMemoryFree(pBuf);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  *pContLen = reqLen;
  return pBuf;
}
542

543
/**
 * Build the serialized "check learner catch-up" request for one dnode.
 *
 * The request lists the vgroup members split into voters and learners and is
 * encoded with tSerializeSAlterVnodeReplicaReq(). The self index fields hold
 * the member's position in pVgroup->vnodeGid[] when its dnode id equals
 * dnodeId.
 * NOTE(review): same index convention as mndBuildAlterVnodeReplicaReq();
 * confirm against the receiver.
 *
 * @param pContLen out: length of the returned buffer.
 * @return buffer allocated with taosMemoryMalloc() (caller frees), or NULL on
 *         failure.
 */
static void *mndBuildCheckLearnCatchupReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId,
                                          int32_t *pContLen) {
  SCheckLearnCatchupReq req = {
      .vgId = pVgroup->vgId,
      .strict = pDb->cfg.strict,
      .replica = 0,
      .learnerReplica = 0,
      .selfIndex = -1,
      .learnerSelfIndex = -1,
  };

  for (int32_t v = 0; v < pVgroup->replica; ++v) {
    SVnodeGid *pMember = &pVgroup->vnodeGid[v];
    bool       isVoter = (pMember->nodeRole == TAOS_SYNC_ROLE_VOTER);
    SReplica  *pSlot = NULL;

    /* Claim the next slot of the array that matches the member's role. */
    if (isVoter) {
      pSlot = &req.replicas[req.replica];
      req.replica++;
    } else {
      pSlot = &req.learnerReplicas[req.learnerReplica];
      req.learnerReplica++;
    }

    SDnodeObj *pMemberDnode = mndAcquireDnode(pMnode, pMember->dnodeId);
    if (pMemberDnode == NULL) return NULL;

    pSlot->id = pMemberDnode->id;
    pSlot->port = pMemberDnode->port;
    memcpy(pSlot->fqdn, pMemberDnode->fqdn, TSDB_FQDN_LEN);
    mndReleaseDnode(pMnode, pMemberDnode);

    if (dnodeId == pMember->dnodeId) {
      if (isVoter) {
        req.selfIndex = v;
      } else {
        req.learnerSelfIndex = v;
      }
    }
  }

  mInfo("vgId:%d, build alter vnode req, replica:%d selfIndex:%d learnerReplica:%d learnerSelfIndex:%d strict:%d",
        req.vgId, req.replica, req.selfIndex, req.learnerReplica, req.learnerSelfIndex, req.strict);
  for (int32_t i = 0; i < req.replica; ++i) {
    mInfo("vgId:%d, replica:%d ep:%s:%u", req.vgId, i, req.replicas[i].fqdn, req.replicas[i].port);
  }
  for (int32_t i = 0; i < req.learnerReplica; ++i) {
    mInfo("vgId:%d, learnerReplica:%d ep:%s:%u", req.vgId, i, req.learnerReplicas[i].fqdn, req.learnerReplicas[i].port);
  }

  /* The addressed dnode has to be a member of the group. */
  if (req.selfIndex == -1 && req.learnerSelfIndex == -1) {
    terrno = TSDB_CODE_APP_ERROR;
    return NULL;
  }

  /* Size query first, then the real encode into an exactly sized buffer. */
  int32_t reqLen = tSerializeSAlterVnodeReplicaReq(NULL, 0, &req);
  if (reqLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  void *pBuf = taosMemoryMalloc(reqLen);
  if (pBuf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSAlterVnodeReplicaReq(pBuf, reqLen, &req) < 0) {
    mError("vgId:%d, failed to serialize alter vnode req,since %s", req.vgId, terrstr());
    taosMemoryFree(pBuf);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  *pContLen = reqLen;
  return pBuf;
}
620

621
/**
 * Build the serialized request that sets the `disable` flag of a vnode to 1.
 *
 * @param pMnode   unused here.
 * @param pDb      unused here.
 * @param vgId     vgroup the request is addressed to.
 * @param pContLen out: length of the returned buffer.
 * @return buffer allocated with taosMemoryMalloc() (caller frees), or NULL
 *         with terrno set to TSDB_CODE_OUT_OF_MEMORY on failure.
 */
static void *mndBuildDisableVnodeWriteReq(SMnode *pMnode, SDbObj *pDb, int32_t vgId, int32_t *pContLen) {
  SDisableVnodeWriteReq disableReq = {
      .vgId = vgId,
      .disable = 1,
  };

  mInfo("vgId:%d, build disable vnode write req", vgId);

  /* Size query first, then the real encode into an exactly sized buffer. */
  int32_t reqLen = tSerializeSDisableVnodeWriteReq(NULL, 0, &disableReq);
  if (reqLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  void *pBuf = taosMemoryMalloc(reqLen);
  if (pBuf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSDisableVnodeWriteReq(pBuf, reqLen, &disableReq) < 0) {
    mError("vgId:%d, failed to serialize disable vnode write req,since %s", vgId, terrstr());
    taosMemoryFree(pBuf);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  *pContLen = reqLen;
  return pBuf;
}
649

650
/**
 * Build the serialized "alter vnode hash range" request.
 *
 * The request names the source vgroup id and takes destination id and hash
 * range from pVgroup.
 *
 * Side effect: pVgroup->syncConfChangeVer is incremented on every call.
 *
 * @param pMnode   unused here.
 * @param srcVgId  source vgroup id.
 * @param pVgroup  destination vgroup.
 * @param pContLen out: length of the returned buffer.
 * @return buffer allocated with taosMemoryMalloc() (caller frees), or NULL
 *         with terrno set to TSDB_CODE_OUT_OF_MEMORY on failure.
 */
static void *mndBuildAlterVnodeHashRangeReq(SMnode *pMnode, int32_t srcVgId, SVgObj *pVgroup, int32_t *pContLen) {
  SAlterVnodeHashRangeReq alterReq = {
      .srcVgId = srcVgId,
      .dstVgId = pVgroup->vgId,
      .hashBegin = pVgroup->hashBegin,
      .hashEnd = pVgroup->hashEnd,
      .changeVersion = ++(pVgroup->syncConfChangeVer),
  };

  mInfo("vgId:%d, build alter vnode hashrange req, dstVgId:%d, hashrange:[%u, %u]", srcVgId, pVgroup->vgId,
        pVgroup->hashBegin, pVgroup->hashEnd);

  /* Size query first, then the real encode into an exactly sized buffer. */
  int32_t reqLen = tSerializeSAlterVnodeHashRangeReq(NULL, 0, &alterReq);
  if (reqLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  void *pBuf = taosMemoryMalloc(reqLen);
  if (pBuf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSAlterVnodeHashRangeReq(pBuf, reqLen, &alterReq) < 0) {
    mError("vgId:%d, failed to serialize alter vnode hashrange req,since %s", srcVgId, terrstr());
    taosMemoryFree(pBuf);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  *pContLen = reqLen;
  return pBuf;
}
682

683
/**
 * Build the serialized "drop vnode" request for one dnode of a vgroup.
 *
 * @param pMnode   unused here.
 * @param pDnode   dnode hosting the vnode to drop.
 * @param pDb      database the vgroup belongs to (name and uid are sent).
 * @param pVgroup  vgroup whose vnode is dropped.
 * @param pContLen out: length of the returned buffer.
 * @return buffer allocated with taosMemoryMalloc() (caller frees), or NULL
 *         with terrno set to TSDB_CODE_OUT_OF_MEMORY on failure.
 */
void *mndBuildDropVnodeReq(SMnode *pMnode, SDnodeObj *pDnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen) {
  SDropVnodeReq dropReq = {0};
  dropReq.vgId = pVgroup->vgId;
  dropReq.dnodeId = pDnode->id;
  dropReq.dbUid = pDb->uid;
  memcpy(dropReq.db, pDb->name, TSDB_DB_FNAME_LEN);

  mInfo("vgId:%d, build drop vnode req", dropReq.vgId);

  /* Size query first, then the real encode into an exactly sized buffer. */
  int32_t reqLen = tSerializeSDropVnodeReq(NULL, 0, &dropReq);
  if (reqLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  void *pBuf = taosMemoryMalloc(reqLen);
  if (pBuf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSDropVnodeReq(pBuf, reqLen, &dropReq) < 0) {
    mError("vgId:%d, failed to serialize drop vnode req,since %s", dropReq.vgId, terrstr());
    taosMemoryFree(pBuf);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  *pContLen = reqLen;
  return pBuf;
}
712

713
/**
 * Per-dnode callback that clears the vnode and other-node counters of a dnode.
 *
 * @param pObj the SDnodeObj being visited; p1..p3 are unused.
 * @return always true.
 */
static bool mndResetDnodesArrayFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SDnodeObj *pVisited = (SDnodeObj *)pObj;

  pVisited->numOfOtherNodes = 0;
  pVisited->numOfVnodes = 0;
  return true;
}
719

720
// sdbTraverse callback that collects candidate dnodes.
//   p1: SArray of SDnodeObj that receives a copy of each accepted dnode
//   p2: pointer to the int32_t id of a dnode that must be skipped
//   p3: optional SArray of int32_t dnode ids; when non-NULL only listed dnodes are considered
// Refreshes numOfVnodes/memUsed on the dnode and bumps numOfOtherNodes when it hosts an mnode.
// Returns false only when pushing into p1 fails.
static bool mndBuildDnodesArrayFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SDnodeObj *pDnode = pObj;
  SArray    *pCandidates = p1;
  int32_t    skipId = *(int32_t *)p2;
  SArray    *pAllowed = p3;

  if (pDnode->id == skipId) {
    return true;
  }

  if (pAllowed != NULL) {
    int32_t nAllowed = taosArrayGetSize(pAllowed);
    if (nAllowed <= 0) {
      return true;  // TS-6191
    }

    bool listed = false;
    for (int32_t k = 0; k < nAllowed && !listed; ++k) {
      listed = (*(int32_t *)taosArrayGet(pAllowed, k) == pDnode->id);
    }
    if (!listed) {
      return true;
    }
  }

  int64_t nowMs = taosGetTimestampMs();
  bool    online = mndIsDnodeOnline(pDnode, nowMs);
  bool    isMnode = mndIsMnode(pMnode, pDnode->id);
  pDnode->numOfVnodes = mndGetVnodesNum(pMnode, pDnode->id);
  pDnode->memUsed = mndGetVnodesMemory(pMnode, pDnode->id);

  mInfo("dnode:%d, vnodes:%d supportVnodes:%d isMnode:%d online:%d memory avail:%" PRId64 " used:%" PRId64, pDnode->id,
        pDnode->numOfVnodes, pDnode->numOfSupportVnodes, isMnode, online, pDnode->memAvail, pDnode->memUsed);

  if (isMnode) {
    pDnode->numOfOtherNodes++;
  }

  // Only online dnodes that can host vnodes become candidates.
  if (!online || pDnode->numOfSupportVnodes <= 0) {
    return true;
  }
  return taosArrayPush(pCandidates, pDnode) != NULL;
}
766

767
// Return true when dnodeId appears in dnodeList (an SArray of int32_t ids).
static bool isDnodeInList(SArray *dnodeList, int32_t dnodeId) {
  int32_t count = taosArrayGetSize(dnodeList);
  int32_t pos = 0;
  while (pos < count) {
    if (*(int32_t *)TARRAY_GET_ELEM(dnodeList, pos) == dnodeId) {
      return true;
    }
    ++pos;
  }
  return false;
}
777

778
#ifdef TD_ENTERPRISE
779
// Load score of a dnode: (vnodes + otherNodes * ratio + additionDnodes) / supportVnodes.
// The score is negated for dnodes that already hold at least one vnode.
static float mndGetDnodeScore1(SDnodeObj *pDnode, int32_t additionDnodes, float ratio) {
  float load = pDnode->numOfVnodes + (float)pDnode->numOfOtherNodes * ratio + additionDnodes;
  float score = load / pDnode->numOfSupportVnodes;
  if (pDnode->numOfVnodes > 0) {
    return -score;
  }
  return score;
}
784

785
// Comparator on mndGetDnodeScore1 (ratio 0.9); ties are broken by ascending dnode id.
static int32_t mndCompareDnodeVnodes1(SDnodeObj *pDnode1, SDnodeObj *pDnode2) {
  float lhs = mndGetDnodeScore1(pDnode1, 0, 0.9);
  float rhs = mndGetDnodeScore1(pDnode2, 0, 0.9);

  if (lhs != rhs) {
    return lhs > rhs ? 1 : -1;
  }
  if (pDnode1->id == pDnode2->id) {
    return 0;
  }
  return pDnode1->id > pDnode2->id ? 1 : -1;
}
796

797
// sdbTraverse callback: refresh the dnode's vnode count, count an mnode on it as an
// "other node", and append a copy of the dnode to p1 when it supports vnodes.
// Returns false only when the push into p1 fails.
static bool mndBuildDnodesListFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SDnodeObj *pDnode = pObj;
  SArray    *pOut = p1;

  bool hostsMnode = mndIsMnode(pMnode, pDnode->id);
  pDnode->numOfVnodes = mndGetVnodesNum(pMnode, pDnode->id);
  if (hostsMnode) {
    pDnode->numOfOtherNodes++;
  }

  if (pDnode->numOfSupportVnodes <= 0) {
    return true;
  }
  return taosArrayPush(pOut, pDnode) != NULL;
}
813

814
// TS-6191
815
// When grantCheckDualReplicaDnodes() holds, build in *ppDnodeList the list of dnodes
// (SDnodeObj copies) that vnode allocation is restricted to; otherwise leave *ppDnodeList
// untouched and return 0. dnodeList is the optional caller-supplied list of dnode ids.
// Returns 0 on success or terrno when the array cannot be created.
static int32_t mndBuildNodesCheckDualReplica(SMnode *pMnode, int32_t nDnodes, SArray *dnodeList, SArray **ppDnodeList) {
  int32_t code = 0;
  if (!grantCheckDualReplicaDnodes(pMnode)) {
    TAOS_RETURN(code);
  }

  SSdb   *pSdb = pMnode->pSdb;
  SArray *pNodes = taosArrayInit(nDnodes, sizeof(SDnodeObj));
  if (pNodes == NULL) {
    TAOS_RETURN(code = terrno);
  }
  *ppDnodeList = pNodes;

  sdbTraverse(pSdb, SDB_DNODE, mndResetDnodesArrayFp, NULL, NULL, NULL);
  sdbTraverse(pSdb, SDB_DNODE, mndBuildDnodesListFp, pNodes, NULL, NULL);

  int32_t total = taosArrayGetSize(pNodes);
  if (total <= 0) {
    TAOS_RETURN(code);
  }
  if (total > 1) {
    taosArraySort(pNodes, (__compar_fn_t)mndCompareDnodeVnodes1);
  }

  int32_t nRequested = taosArrayGetSize(dnodeList);
  if (nRequested <= 0) {
    // No explicit dnode list: keep only the first two dnodes of the sorted array.
    if (total > 2) {
      taosArrayRemoveBatch(pNodes, 2, total - 2, NULL);
    }
    TAOS_RETURN(code);
  }

  // Count the leading run of dnodes that already hold vnodes.
  int32_t nBusy = 0;
  while (nBusy < total && ((SDnodeObj *)TARRAY_GET_ELEM(pNodes, nBusy))->numOfVnodes > 0) {
    ++nBusy;
  }

  int32_t firstId = -1;
  if (nBusy == 1) {
    firstId = ((SDnodeObj *)TARRAY_GET_ELEM(pNodes, 0))->id;
  } else if (nBusy >= 2) {
    // must select the dnodes from the 1st 2 dnodes
    taosArrayRemoveBatch(pNodes, 2, total - 2, NULL);
  }

  // Drop every dnode the caller did not list.
  int32_t idx = 0;
  while (idx < TARRAY_SIZE(pNodes)) {
    SDnodeObj *pCur = taosArrayGet(pNodes, idx);
    if (isDnodeInList(dnodeList, pCur->id)) {
      ++idx;
    } else {
      taosArrayRemove(pNodes, idx);
    }
  }

  if (nBusy == 1) {
    SDnodeObj *pHead = taosArrayGet(pNodes, 0);
    if (pHead && (pHead->id != firstId)) {  // the first dnode is not in dnodeList, remove the last element
      taosArrayRemove(pNodes, taosArrayGetSize(pNodes) - 1);
    }
  }

  TAOS_RETURN(code);
}
873
#endif
874

875
// Build an array of SDnodeObj copies that are candidates for hosting vnodes.
//   exceptDnodeId: dnode id that is never included
//   dnodeList:     optional list of allowed dnode ids; ignored when empty
// Returns the array (the caller destroys it) or NULL on failure.
SArray *mndBuildDnodesArray(SMnode *pMnode, int32_t exceptDnodeId, SArray *dnodeList) {
  SSdb   *pSdb = pMnode->pSdb;
  int32_t dnodeCount = mndGetDnodeSize(pMnode);

  SArray *pResult = taosArrayInit(dnodeCount, sizeof(SDnodeObj));
  if (pResult == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // An empty caller list is treated the same as no list at all.
  SArray *pUserList = (taosArrayGetSize(dnodeList) > 0) ? dnodeList : NULL;
  SArray *pDualList = NULL;
#ifdef TD_ENTERPRISE
  if (mndBuildNodesCheckDualReplica(pMnode, dnodeCount, pUserList, &pDualList) != 0) {
    taosArrayDestroy(pResult);
    return NULL;
  }
#endif

  // The dual-replica list, when produced, takes precedence over the caller's list.
  SArray *pFilter = (pDualList != NULL) ? pDualList : pUserList;
  sdbTraverse(pSdb, SDB_DNODE, mndResetDnodesArrayFp, NULL, NULL, NULL);
  sdbTraverse(pSdb, SDB_DNODE, mndBuildDnodesArrayFp, pResult, &exceptDnodeId, pFilter);

  int32_t built = (int32_t)taosArrayGetSize(pResult);
  mDebug("build %d dnodes array", built);
  for (int32_t k = 0; k < built; ++k) {
    SDnodeObj *pEntry = taosArrayGet(pResult, k);
    mDebug("dnode:%d, vnodes:%d others:%d", pEntry->id, pEntry->numOfVnodes, pEntry->numOfOtherNodes);
  }

  taosArrayDestroy(pDualList);
  return pResult;
}
906

907
// Three-way comparison of two dnode ids: returns -1, 0 or 1.
static int32_t mndCompareDnodeId(int32_t *dnode1Id, int32_t *dnode2Id) {
  int32_t lhs = *dnode1Id;
  int32_t rhs = *dnode2Id;
  return (lhs > rhs) - (lhs < rhs);
}
913

914
// Load score of a dnode: (vnodes + otherNodes * ratio + additionDnodes) / supportVnodes.
static float mndGetDnodeScore(SDnodeObj *pDnode, int32_t additionDnodes, float ratio) {
  float load = pDnode->numOfVnodes + (float)pDnode->numOfOtherNodes * ratio + additionDnodes;
  float score = load / pDnode->numOfSupportVnodes;
  return score;
}
918

919
// Comparator ordering dnodes by ascending mndGetDnodeScore (ratio 0.9).
static int32_t mndCompareDnodeVnodes(SDnodeObj *pDnode1, SDnodeObj *pDnode2) {
  float lhs = mndGetDnodeScore(pDnode1, 0, 0.9);
  float rhs = mndGetDnodeScore(pDnode2, 0, 0.9);
  if (lhs > rhs) {
    return 1;
  }
  if (lhs == rhs) {
    return 0;
  }
  return -1;
}
927

928
// Sort pVgroup->vnodeGid[0..replica) in place by ascending dnodeId (bubble sort).
void mndSortVnodeGid(SVgObj *pVgroup) {
  for (int32_t pass = 0; pass < pVgroup->replica; ++pass) {
    // After each pass the largest remaining dnodeId has settled at the tail.
    int32_t unsortedEnd = pVgroup->replica - 1 - pass;
    for (int32_t k = 0; k < unsortedEnd; ++k) {
      if (pVgroup->vnodeGid[k + 1].dnodeId < pVgroup->vnodeGid[k].dnodeId) {
        TSWAP(pVgroup->vnodeGid[k], pVgroup->vnodeGid[k + 1]);
      }
    }
  }
}
10,887✔
937

938
// Assign the replicas of pVgroup to the lowest-scored dnodes in pArray.
// pArray is sorted in place; the chosen dnodes' memUsed and numOfVnodes are updated.
// Returns 0 on success, or TSDB_CODE_MND_NO_ENOUGH_DNODES / _VNODES / _MEM_IN_DNODE.
static int32_t mndGetAvailableDnode(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, SArray *pArray) {
  mDebug("start to sort %d dnodes", (int32_t)taosArrayGetSize(pArray));
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);

  int32_t size = taosArrayGetSize(pArray);
  for (int32_t k = 0; k < size; ++k) {
    SDnodeObj *pCand = taosArrayGet(pArray, k);
    mDebug("dnode:%d, score:%f", pCand->id, mndGetDnodeScore(pCand, 0, 0.9));
  }

  if (size < pVgroup->replica) {
    mError("db:%s, vgId:%d, no enough online dnodes:%d to alloc %d replica", pVgroup->dbName, pVgroup->vgId, size,
           pVgroup->replica);
    TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_DNODES);
  }

  // Replica v goes to the v-th dnode of the sorted array.
  for (int32_t v = 0; v < pVgroup->replica; ++v) {
    SDnodeObj *pDnode = taosArrayGet(pArray, v);
    if (pDnode == NULL) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_DNODES);
    }
    if (pDnode->numOfVnodes >= pDnode->numOfSupportVnodes) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_VNODES);
    }

    int64_t vgMem = mndGetVgroupMemory(pMnode, pDb, pVgroup);
    if (pDnode->memAvail - vgMem - pDnode->memUsed <= 0) {
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d, avail:%" PRId64 " used:%" PRId64,
             pVgroup->dbName, pVgroup->vgId, vgMem, pDnode->id, pDnode->memAvail, pDnode->memUsed);
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE);
    }
    pDnode->memUsed += vgMem;

    SVnodeGid *pVgid = &pVgroup->vnodeGid[v];
    pVgid->dnodeId = pDnode->id;
    // A single replica starts as leader; members of a multi-replica group start as followers.
    pVgid->syncState = (pVgroup->replica == 1) ? TAOS_SYNC_STATE_LEADER : TAOS_SYNC_STATE_FOLLOWER;

    mInfo("db:%s, vgId:%d, vn:%d is alloced, memory:%" PRId64 ", dnode:%d avail:%" PRId64 " used:%" PRId64,
          pVgroup->dbName, pVgroup->vgId, v, vgMem, pVgid->dnodeId, pDnode->memAvail, pDnode->memUsed);
    pDnode->numOfVnodes++;
  }

  mndSortVnodeGid(pVgroup);
  return 0;
}
987

988
// Initialise pVgroup as a single-replica TSMA vgroup of pDb and pick a dnode for it.
// Returns 0 on success. On failure returns the error code, which TAOS_RETURN also
// records; the temporary dnode array is released on every path.
int32_t mndAllocSmaVgroup(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup) {
  int32_t code = 0;
  SArray *pArray = mndBuildDnodesArray(pMnode, 0, NULL);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  pVgroup->vgId = sdbGetMaxId(pMnode->pSdb, SDB_VGROUP);
  pVgroup->isTsma = 1;
  pVgroup->createdTime = taosGetTimestampMs();
  pVgroup->updateTime = pVgroup->createdTime;
  pVgroup->version = 1;
  memcpy(pVgroup->dbName, pDb->name, TSDB_DB_FNAME_LEN);
  pVgroup->dbUid = pDb->uid;
  pVgroup->replica = 1;

  // Destroy the array before checking the result so the failure path no longer leaks it.
  code = mndGetAvailableDnode(pMnode, pDb, pVgroup, pArray);
  taosArrayDestroy(pArray);
  if (code != 0) {
    TAOS_RETURN(code);
  }

  mInfo("db:%s, sma vgId:%d is alloced", pDb->name, pVgroup->vgId);
  return 0;
}
1012

1013
// Allocate and initialise pDb->cfg.numOfVgroups vgroups for pDb, splitting the uint32 hash
// space evenly between them and assigning each replica to a dnode.
//   dnodeList: optional list of dnode ids the vgroups may be placed on
// On success stores the calloc'ed array in *ppVgroups (owned by the caller) and returns 0;
// on failure frees the array and returns the error code.
int32_t mndAllocVgroup(SMnode *pMnode, SDbObj *pDb, SVgObj **ppVgroups, SArray *dnodeList) {
  int32_t code = -1;
  SArray *pArray = NULL;
  SVgObj *pVgroups = NULL;

  pVgroups = taosMemoryCalloc(pDb->cfg.numOfVgroups, sizeof(SVgObj));
  if (pVgroups == NULL) {
    code = terrno;
    goto _OVER;
  }

  pArray = mndBuildDnodesArray(pMnode, 0, dnodeList);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  mInfo("db:%s, total %d dnodes used to create %d vgroups (%d vnodes)", pDb->name, (int32_t)taosArrayGetSize(pArray),
        pDb->cfg.numOfVgroups, pDb->cfg.numOfVgroups * pDb->cfg.replications);

  int32_t  maxVgId = sdbGetMaxId(pMnode->pSdb, SDB_VGROUP);
  uint32_t hashMin = 0;
  uint32_t hashMax = UINT32_MAX;
  uint32_t hashInterval = (hashMax - hashMin) / pDb->cfg.numOfVgroups;

  if (maxVgId < 2) maxVgId = 2;

  for (uint32_t v = 0; v < pDb->cfg.numOfVgroups; v++) {
    SVgObj *pVgroup = &pVgroups[v];
    pVgroup->vgId = maxVgId++;
    pVgroup->createdTime = taosGetTimestampMs();
    // Use this vgroup's own creation time, not that of the first array element.
    pVgroup->updateTime = pVgroup->createdTime;
    pVgroup->version = 1;
    pVgroup->hashBegin = hashMin + hashInterval * v;
    if (v == pDb->cfg.numOfVgroups - 1) {
      // The last vgroup absorbs the remainder of the integer division.
      pVgroup->hashEnd = hashMax;
    } else {
      pVgroup->hashEnd = hashMin + hashInterval * (v + 1) - 1;
    }

    memcpy(pVgroup->dbName, pDb->name, TSDB_DB_FNAME_LEN);
    pVgroup->dbUid = pDb->uid;
    pVgroup->replica = pDb->cfg.replications;

    if ((code = mndGetAvailableDnode(pMnode, pDb, pVgroup, pArray)) != 0) {
      goto _OVER;
    }
  }

  *ppVgroups = pVgroups;
  code = 0;

  mInfo("db:%s, total %d vgroups is alloced, replica:%d", pDb->name, pDb->cfg.numOfVgroups, pDb->cfg.replications);

_OVER:
  if (code != 0) taosMemoryFree(pVgroups);
  taosArrayDestroy(pArray);
  TAOS_RETURN(code);
}
1076

1077
// Build the endpoint set of a vgroup from the fqdn/port of each replica's dnode.
// Replicas whose dnode cannot be acquired are skipped. inUse is pointed at the slot
// about to be filled by a replica in LEADER or ASSIGNED_LEADER state; the set is then
// passed through epsetSort.
SEpSet mndGetVgroupEpset(SMnode *pMnode, const SVgObj *pVgroup) {
  SEpSet result = {0};

  for (int32_t k = 0; k < pVgroup->replica; ++k) {
    const SVnodeGid *pMember = &pVgroup->vnodeGid[k];
    SDnodeObj       *pHost = mndAcquireDnode(pMnode, pMember->dnodeId);
    if (pHost != NULL) {
      bool leads =
          (pMember->syncState == TAOS_SYNC_STATE_LEADER || pMember->syncState == TAOS_SYNC_STATE_ASSIGNED_LEADER);
      if (leads) {
        result.inUse = result.numOfEps;
      }

      if (addEpIntoEpSet(&result, pHost->fqdn, pHost->port) != 0) {
        mWarn("vgId:%d, failed to add ep:%s:%d into epset", pVgroup->vgId, pHost->fqdn, pHost->port);
      }
      mndReleaseDnode(pMnode, pHost);
    }
  }

  epsetSort(&result);
  return result;
}
1098

1099
// Look up the vgroup by id and build its endpoint set from each replica's dnode fqdn/port.
// Returns an all-zero SEpSet when the vgroup cannot be acquired. The result is not
// passed through epsetSort here.
SEpSet mndGetVgroupEpsetById(SMnode *pMnode, int32_t vgId) {
  SEpSet result = {0};

  SVgObj *pVg = mndAcquireVgroup(pMnode, vgId);
  if (pVg == NULL) {
    return result;
  }

  for (int32_t k = 0; k < pVg->replica; ++k) {
    const SVnodeGid *pMember = &pVg->vnodeGid[k];
    SDnodeObj       *pHost = mndAcquireDnode(pMnode, pMember->dnodeId);
    if (pHost != NULL) {
      bool leads =
          (pMember->syncState == TAOS_SYNC_STATE_LEADER || pMember->syncState == TAOS_SYNC_STATE_ASSIGNED_LEADER);
      if (leads) {
        result.inUse = result.numOfEps;
      }

      if (addEpIntoEpSet(&result, pHost->fqdn, pHost->port) != 0) {
        mWarn("vgId:%d, failed to add ep:%s:%d into epset", pVg->vgId, pHost->fqdn, pHost->port);
      }
      mndReleaseDnode(pMnode, pHost);
    }
  }

  mndReleaseVgroup(pMnode, pVg);
  return result;
}
1123

1124
// Show-retrieve callback: fill pBlock with up to `rows` vgroup rows, resuming from pShow->pIter.
// When pShow->db is non-empty only vgroups of that database are emitted.
// Returns the number of rows written, 0 when the database cannot be acquired, or the error
// code of the failing column write. The fetched vgroup and the acquired database are
// released on every exit path, including the error paths.
static int32_t mndRetrieveVgroups(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows) {
  SMnode *pMnode = pReq->info.node;
  SSdb   *pSdb = pMnode->pSdb;
  int32_t numOfRows = 0;
  SVgObj *pVgroup = NULL;
  int32_t cols = 0;
  int64_t curMs = taosGetTimestampMs();
  int32_t code = 0;

  SDbObj *pDb = NULL;
  if (strlen(pShow->db) > 0) {
    pDb = mndAcquireDb(pMnode, pShow->db);
    if (pDb == NULL) {
      return 0;
    }
  }

  while (numOfRows < rows) {
    pShow->pIter = sdbFetch(pSdb, SDB_VGROUP, pShow->pIter, (void **)&pVgroup);
    if (pShow->pIter == NULL) break;

    if (pDb != NULL && pVgroup->dbUid != pDb->uid) {
      sdbRelease(pSdb, pVgroup);
      continue;
    }

    cols = 0;
    SColumnInfoData *pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)&pVgroup->vgId, false);
    if (code != 0) {
      mError("vgId:%d, failed to set vgId, since %s", pVgroup->vgId, tstrerror(code));
      goto _OVER;
    }

    SName name = {0};
    char  db[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
    code = tNameFromString(&name, pVgroup->dbName, T_NAME_ACCT | T_NAME_DB);
    if (code != 0) {
      mError("vgId:%d, failed to set dbName, since %s", pVgroup->vgId, tstrerror(code));
      goto _OVER;
    }
    (void)tNameGetDbName(&name, varDataVal(db));
    varDataSetLen(db, strlen(varDataVal(db)));

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)db, false);
    if (code != 0) {
      mError("vgId:%d, failed to set dbName, since %s", pVgroup->vgId, tstrerror(code));
      goto _OVER;
    }

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)&pVgroup->numOfTables, false);
    if (code != 0) {
      mError("vgId:%d, failed to set numOfTables, since %s", pVgroup->vgId, tstrerror(code));
      goto _OVER;
    }

    // default 3 replica, add 1 replica if move vnode
    // Each replica slot occupies three columns: dnode id, role, applied/committed index.
    for (int32_t i = 0; i < 4; ++i) {
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      if (i < pVgroup->replica) {
        int16_t dnodeId = (int16_t)pVgroup->vnodeGid[i].dnodeId;
        code = colDataSetVal(pColInfo, numOfRows, (const char *)&dnodeId, false);
        if (code != 0) {
          mError("vgId:%d, failed to set dnodeId, since %s", pVgroup->vgId, tstrerror(code));
          goto _OVER;
        }

        bool       exist = false;
        bool       online = false;
        SDnodeObj *pDnode = mndAcquireDnode(pMnode, pVgroup->vnodeGid[i].dnodeId);
        if (pDnode != NULL) {
          exist = true;
          online = mndIsDnodeOnline(pDnode, curMs);
          mndReleaseDnode(pMnode, pDnode);
        }

        // role stays "offline" when the dnode exists but is not online.
        char buf1[20] = {0};
        char role[20] = "offline";
        if (!exist) {
          tstrncpy(role, "dropping", sizeof(role));
        } else if (online) {
          // A leader that has not finished sync restore is marked with "*" or "**".
          char *star = "";
          if (pVgroup->vnodeGid[i].syncState == TAOS_SYNC_STATE_LEADER ||
              pVgroup->vnodeGid[i].syncState == TAOS_SYNC_STATE_ASSIGNED_LEADER) {
            if (!pVgroup->vnodeGid[i].syncRestore && !pVgroup->vnodeGid[i].syncCanRead) {
              star = "**";
            } else if (!pVgroup->vnodeGid[i].syncRestore && pVgroup->vnodeGid[i].syncCanRead) {
              star = "*";
            }
          }
          snprintf(role, sizeof(role), "%s%s", syncStr(pVgroup->vnodeGid[i].syncState), star);
        }
        STR_WITH_MAXSIZE_TO_VARSTR(buf1, role, pShow->pMeta->pSchemas[cols].bytes);

        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        code = colDataSetVal(pColInfo, numOfRows, (const char *)buf1, false);
        if (code != 0) {
          mError("vgId:%d, failed to set role, since %s", pVgroup->vgId, tstrerror(code));
          goto _OVER;
        }

        char applyStr[TSDB_SYNC_APPLY_COMMIT_LEN + 1] = {0};
        char buf[TSDB_SYNC_APPLY_COMMIT_LEN + VARSTR_HEADER_SIZE + 1] = {0};
        snprintf(applyStr, sizeof(applyStr), "%" PRId64 "/%" PRId64, pVgroup->vnodeGid[i].syncAppliedIndex,
                 pVgroup->vnodeGid[i].syncCommitIndex);
        STR_WITH_MAXSIZE_TO_VARSTR(buf, applyStr, pShow->pMeta->pSchemas[cols].bytes);

        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        code = colDataSetVal(pColInfo, numOfRows, (const char *)&buf, false);
        if (code != 0) {
          mError("vgId:%d, failed to set role, since %s", pVgroup->vgId, tstrerror(code));
          goto _OVER;
        }
      } else {
        // Unused replica slot: all three of its columns are NULL.
        colDataSetNULL(pColInfo, numOfRows);
        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        colDataSetNULL(pColInfo, numOfRows);
        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        colDataSetNULL(pColInfo, numOfRows);
      }
    }

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    int32_t cacheUsage = (int32_t)pVgroup->cacheUsage;
    code = colDataSetVal(pColInfo, numOfRows, (const char *)&cacheUsage, false);
    if (code != 0) {
      mError("vgId:%d, failed to set cacheUsage, since %s", pVgroup->vgId, tstrerror(code));
      goto _OVER;
    }

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)&pVgroup->numOfCachedTables, false);
    if (code != 0) {
      mError("vgId:%d, failed to set numOfCachedTables, since %s", pVgroup->vgId, tstrerror(code));
      goto _OVER;
    }

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)&pVgroup->isTsma, false);
    if (code != 0) {
      mError("vgId:%d, failed to set isTsma, since %s", pVgroup->vgId, tstrerror(code));
      goto _OVER;
    }
    numOfRows++;
    sdbRelease(pSdb, pVgroup);
  }

  pShow->numOfRows += numOfRows;

_OVER:
  // code is non-zero only when a row was abandoned mid-way; that row's vgroup is still held.
  if (code != 0) {
    sdbRelease(pSdb, pVgroup);
  }
  if (pDb != NULL) {
    mndReleaseDb(pMnode, pDb);
  }
  return (code != 0) ? code : numOfRows;
}
1304

1305
// Cancel an in-progress SDB_VGROUP fetch identified by pIter.
static void mndCancelGetNextVgroup(SMnode *pMnode, void *pIter) {
  sdbCancelFetchByType(pMnode->pSdb, pIter, SDB_VGROUP);
}
×
1309

1310
// sdbTraverse callback: add to *p2 (int32_t) the number of replicas of this vgroup
// that are placed on the dnode whose id is *p1 (int32_t). Always returns true.
static bool mndGetVnodesNumFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SVgObj  *pVg = pObj;
  int32_t  targetId = *(int32_t *)p1;
  int32_t *pCount = (int32_t *)p2;

  int32_t v = 0;
  while (v < pVg->replica) {
    if (pVg->vnodeGid[v].dnodeId == targetId) {
      *pCount += 1;
    }
    ++v;
  }

  return true;
}
1323

1324
// Count the vnodes placed on dnodeId by traversing every vgroup in the sdb.
int32_t mndGetVnodesNum(SMnode *pMnode, int32_t dnodeId) {
  int32_t total = 0;
  SSdb   *pSdb = pMnode->pSdb;
  sdbTraverse(pSdb, SDB_VGROUP, mndGetVnodesNumFp, &dnodeId, &total, NULL);
  return total;
}
1329

1330
// Compute the memory figure for one vnode of pVgroup from its database config:
// buffer * 1MiB + pages * pageSize * 1KiB, plus cacheLastSize * 1MiB when cacheLast > 0.
// When pDbInput is NULL the database is acquired by pVgroup->dbName and released before
// returning. Returns 0 when no database is available.
int64_t mndGetVgroupMemory(SMnode *pMnode, SDbObj *pDbInput, SVgObj *pVgroup) {
  bool    acquiredHere = (pDbInput == NULL);
  SDbObj *pDb = acquiredHere ? mndAcquireDb(pMnode, pVgroup->dbName) : pDbInput;

  int64_t total = 0;
  if (pDb != NULL) {
    int64_t buffer = (int64_t)pDb->cfg.buffer * 1024 * 1024;
    int64_t cache = (int64_t)pDb->cfg.pages * pDb->cfg.pageSize * 1024;
    int64_t cacheLast = (int64_t)pDb->cfg.cacheLastSize * 1024 * 1024;

    total = buffer + cache;
    if (pDb->cfg.cacheLast > 0) {
      total += cacheLast;
    }
    mDebug("db:%s, vgroup:%d, buffer:%" PRId64 " cache:%" PRId64 " cacheLast:%" PRId64, pDb->name, pVgroup->vgId,
           buffer, cache, cacheLast);
  }

  if (acquiredHere) {
    mndReleaseDb(pMnode, pDb);
  }
  return total;
}
1354

1355
// sdbTraverse callback: for every replica of this vgroup placed on the dnode whose id is
// *p1 (int32_t), add the vgroup's memory figure to *p2 (int64_t). Always returns true.
static bool mndGetVnodeMemroyFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SVgObj  *pVg = pObj;
  int32_t  targetId = *(int32_t *)p1;
  int64_t *pTotal = (int64_t *)p2;

  int32_t v = 0;
  while (v < pVg->replica) {
    if (pVg->vnodeGid[v].dnodeId == targetId) {
      *pTotal += mndGetVgroupMemory(pMnode, NULL, pVg);
    }
    ++v;
  }

  return true;
}
1368

1369
// Sum the memory figures of all vnodes placed on dnodeId by traversing every vgroup.
int64_t mndGetVnodesMemory(SMnode *pMnode, int32_t dnodeId) {
  int64_t total = 0;
  SSdb   *pSdb = pMnode->pSdb;
  sdbTraverse(pSdb, SDB_VGROUP, mndGetVnodeMemroyFp, &dnodeId, &total, NULL);
  return total;
}
1374

1375
// Format the estimated remaining restore time as "hours:minutes:seconds" into restoreStr.
//   rate:           apply rate; applyCount / rate is treated as a duration in milliseconds
//   applyCount:     number of entries still to be applied
//   restoreStr:     output buffer
//   restoreStrSize: size of restoreStr in bytes
// Writes "0:0:0" when rate is zero, negative or NaN. A quotient outside the int64_t range
// is clamped instead of being converted, which would be undefined behaviour.
void calculateRstoreFinishTime(double rate, int64_t applyCount, char *restoreStr, size_t restoreStrSize) {
  // !(rate > 0) is true for zero, negative values and NaN.
  if (!(rate > 0)) {
    snprintf(restoreStr, restoreStrSize, "0:0:0");
    return;
  }

  double  costTimeMs = applyCount / rate;
  int64_t costTime = 0;
  if (costTimeMs >= (double)INT64_MAX) {
    costTime = INT64_MAX;
  } else if (costTimeMs <= (double)INT64_MIN) {
    costTime = INT64_MIN;
  } else {
    costTime = (int64_t)costTimeMs;
  }

  int64_t totalSeconds = costTime / 1000;
  int64_t hours = totalSeconds / 3600;
  totalSeconds %= 3600;
  int64_t minutes = totalSeconds / 60;
  int64_t seconds = totalSeconds % 60;
  snprintf(restoreStr, restoreStrSize, "%" PRId64 ":%" PRId64 ":%" PRId64, hours, minutes, seconds);
}
1389

1390
// Show-retrieve callback: emit one row per vnode (vgroup replica) into pBlock, resuming from
// pShow->pIter. A new vgroup is fetched only while numOfRows < rows - TSDB_MAX_REPLICA.
// Returns the number of rows written, or the error code of the failing column write.
// The dnode and vgroup references held for the current row are released on every exit
// path, including the error paths.
static int32_t mndRetrieveVnodes(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows) {
  SMnode    *pMnode = pReq->info.node;
  SSdb      *pSdb = pMnode->pSdb;
  int32_t    numOfRows = 0;
  SVgObj    *pVgroup = NULL;
  SDnodeObj *pDnode = NULL;
  int32_t    cols = 0;
  int64_t    curMs = taosGetTimestampMs();
  int32_t    code = 0;

  while (numOfRows < rows - TSDB_MAX_REPLICA) {
    pShow->pIter = sdbFetch(pSdb, SDB_VGROUP, pShow->pIter, (void **)&pVgroup);
    if (pShow->pIter == NULL) break;

    for (int32_t i = 0; i < pVgroup->replica && numOfRows < rows; ++i) {
      SVnodeGid       *pGid = &pVgroup->vnodeGid[i];
      SColumnInfoData *pColInfo = NULL;
      cols = 0;
      pDnode = NULL;  // nothing acquired yet for this row

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->dnodeId, false);
      if (code != 0) {
        mError("vgId:%d, failed to set dnodeId, since %s", pVgroup->vgId, tstrerror(code));
        goto _OVER;
      }
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pVgroup->vgId, false);
      if (code != 0) {
        mError("vgId:%d, failed to set vgId, since %s", pVgroup->vgId, tstrerror(code));
        goto _OVER;
      }

      // db_name
      const char *dbname = mndGetDbStr(pVgroup->dbName);
      char        b1[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
      if (dbname != NULL) {
        STR_WITH_MAXSIZE_TO_VARSTR(b1, dbname, TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE);
      } else {
        STR_WITH_MAXSIZE_TO_VARSTR(b1, "NULL", TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE);
      }
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)b1, false);
      if (code != 0) {
        mError("vgId:%d, failed to set dbName, since %s", pVgroup->vgId, tstrerror(code));
        goto _OVER;
      }

      // dnode is online?
      pDnode = mndAcquireDnode(pMnode, pGid->dnodeId);
      if (pDnode == NULL) {
        // Skip the remaining replicas of this vgroup; the partially written row is not counted.
        mError("failed to acquire dnode. dnodeId:%d", pGid->dnodeId);
        break;
      }
      bool isDnodeOnline = mndIsDnodeOnline(pDnode, curMs);

      char       buf[20] = {0};
      ESyncState syncState = (isDnodeOnline) ? pGid->syncState : TAOS_SYNC_STATE_OFFLINE;
      STR_TO_VARSTR(buf, syncStr(syncState));
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)buf, false);
      if (code != 0) {
        mError("vgId:%d, failed to set syncState, since %s", pVgroup->vgId, tstrerror(code));
        goto _OVER;
      }

      int64_t roleTimeMs = (isDnodeOnline) ? pGid->roleTimeMs : 0;
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&roleTimeMs, false);
      if (code != 0) {
        mError("vgId:%d, failed to set roleTimeMs, since %s", pVgroup->vgId, tstrerror(code));
        goto _OVER;
      }

      int64_t startTimeMs = (isDnodeOnline) ? pGid->startTimeMs : 0;
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&startTimeMs, false);
      if (code != 0) {
        mError("vgId:%d, failed to set startTimeMs, since %s", pVgroup->vgId, tstrerror(code));
        goto _OVER;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->syncRestore, false);
      if (code != 0) {
        mError("vgId:%d, failed to set syncRestore, since %s", pVgroup->vgId, tstrerror(code));
        goto _OVER;
      }

      // The restore-time string stays empty unless committed entries are still unapplied.
      int64_t unappliedCount = pGid->syncCommitIndex - pGid->syncAppliedIndex;
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      char restoreStr[20] = {0};
      if (unappliedCount > 0) {
        calculateRstoreFinishTime(pGid->appliedRate, unappliedCount, restoreStr, sizeof(restoreStr));
      }
      STR_TO_VARSTR(buf, restoreStr);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&buf, false);
      if (code != 0) {
        mError("vgId:%d, failed to set syncRestore finish time, since %s", pVgroup->vgId, tstrerror(code));
        goto _OVER;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&unappliedCount, false);
      if (code != 0) {
        mError("vgId:%d, failed to set syncRestore, since %s", pVgroup->vgId, tstrerror(code));
        goto _OVER;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->bufferSegmentUsed, false);
      if (code != 0) {
        mError("vgId:%d, failed to set buffer segment used, since %s", pVgroup->vgId, tstrerror(code));
        goto _OVER;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->bufferSegmentSize, false);
      if (code != 0) {
        mError("vgId:%d, failed to set buffer segment size, since %s", pVgroup->vgId, tstrerror(code));
        goto _OVER;
      }

      numOfRows++;
      sdbRelease(pSdb, pDnode);
      pDnode = NULL;
    }

    sdbRelease(pSdb, pVgroup);
  }

  pShow->numOfRows += numOfRows;

_OVER:
  // code is non-zero only when a row was abandoned mid-way; release what that row still holds.
  if (code != 0) {
    if (pDnode != NULL) {
      sdbRelease(pSdb, pDnode);
    }
    sdbRelease(pSdb, pVgroup);
    return code;
  }
  return numOfRows;
}
1521

1522
// Cancels the SDB_VGROUP fetch identified by pIter on this mnode's sdb.
static void mndCancelGetNextVnode(SMnode *pMnode, void *pIter) {
  sdbCancelFetchByType(pMnode->pSdb, pIter, SDB_VGROUP);
}
×
1526

1527
/*
 * Adds one replica to pVgroup on a dnode taken from pArray and appends the
 * updated vgroup to the transaction via mndTransAppendRedolog.
 *
 * pArray is sorted in place with mndCompareDnodeVnodes and scanned from the
 * front. The first dnode that does not already host a replica of the vgroup is
 * the only candidate: the function returns from inside the loop for it,
 * whether it is accepted or rejected.
 *
 * On acceptance the candidate's memUsed and numOfVnodes and the vgroup's
 * replica count are updated before the vgroup is encoded.
 *
 * Returns 0 on success, otherwise:
 *   TSDB_CODE_MND_NO_ENOUGH_DNODES        no unused dnode (or a NULL entry) in pArray
 *   TSDB_CODE_MND_NO_ENOUGH_VNODES        candidate has no free vnode slot
 *   TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE  candidate has no memory left for the vgroup
 *   or the error from encoding / appending / setting the raw status.
 */
static int32_t mndAddVnodeToVgroup(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, SArray *pArray) {
  int32_t code = 0;
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
  for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
    SDnodeObj *pDnode = taosArrayGet(pArray, i);
    if (pDnode == NULL) continue;  // nothing to log for a missing entry
    mInfo("dnode:%d, equivalent vnodes:%d others:%d", pDnode->id, pDnode->numOfVnodes, pDnode->numOfOtherNodes);
  }

  // The new replica always goes into the first free slot.
  SVnodeGid *pVgid = &pVgroup->vnodeGid[pVgroup->replica];
  for (int32_t d = 0; d < taosArrayGetSize(pArray); ++d) {
    SDnodeObj *pDnode = taosArrayGet(pArray, d);
    // Must be checked before the membership scan below dereferences pDnode.
    if (pDnode == NULL) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_DNODES);
    }

    // Skip dnodes that already host a replica of this vgroup.
    bool used = false;
    for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
      if (pDnode->id == pVgroup->vnodeGid[vn].dnodeId) {
        used = true;
        break;
      }
    }
    if (used) continue;

    if (pDnode->numOfVnodes >= pDnode->numOfSupportVnodes) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_VNODES);
    }

    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
    if (pDnode->memAvail - vgMem - pDnode->memUsed <= 0) {
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
             pVgroup->dbName, pVgroup->vgId, vgMem, pDnode->id, pDnode->memAvail, pDnode->memUsed);
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE);
    } else {
      pDnode->memUsed += vgMem;
    }

    pVgid->dnodeId = pDnode->id;
    pVgid->syncState = TAOS_SYNC_STATE_OFFLINE;
    mInfo("db:%s, vgId:%d, vn:%d is added, memory:%" PRId64 ", dnode:%d avail:%" PRId64 " used:%" PRId64,
          pVgroup->dbName, pVgroup->vgId, pVgroup->replica, vgMem, pVgid->dnodeId, pDnode->memAvail, pDnode->memUsed);

    // The replica count is bumped before encoding so the raw includes the new slot.
    pVgroup->replica++;
    pDnode->numOfVnodes++;

    SSdbRaw *pVgRaw = mndVgroupActionEncode(pVgroup);
    if (pVgRaw == NULL) {
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
      if (terrno != 0) code = terrno;
      TAOS_RETURN(code);
    }
    if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
      sdbFreeRaw(pVgRaw);  // the raw is freed here only when the append failed
      TAOS_RETURN(code);
    }
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
    if (code != 0) {
      mError("vgId:%d, failed to set raw status since %s at line:%d", pVgroup->vgId, tstrerror(code), __LINE__);
    }
    TAOS_RETURN(code);
  }

  // Every dnode in pArray already hosts a replica (or pArray is empty).
  code = TSDB_CODE_MND_NO_ENOUGH_DNODES;
  mError("db:%s, failed to add vnode to vgId:%d since %s", pVgroup->dbName, pVgroup->vgId, tstrerror(code));
  TAOS_RETURN(code);
}
1593

1594
static int32_t mndRemoveVnodeFromVgroup(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, SArray *pArray,
39✔
1595
                                        SVnodeGid *pDelVgid) {
1596
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
39✔
1597
  for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
169✔
1598
    SDnodeObj *pDnode = taosArrayGet(pArray, i);
130✔
1599
    mInfo("dnode:%d, equivalent vnodes:%d others:%d", pDnode->id, pDnode->numOfVnodes, pDnode->numOfOtherNodes);
130!
1600
  }
1601

1602
  int32_t code = -1;
39✔
1603
  for (int32_t d = taosArrayGetSize(pArray) - 1; d >= 0; --d) {
51!
1604
    SDnodeObj *pDnode = taosArrayGet(pArray, d);
51✔
1605

1606
    for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
111✔
1607
      SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
99✔
1608
      if (pVgid->dnodeId == pDnode->id) {
99✔
1609
        int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
39✔
1610
        pDnode->memUsed -= vgMem;
39✔
1611
        mInfo("db:%s, vgId:%d, vn:%d is removed, memory:%" PRId64 ", dnode:%d avail:%" PRId64 " used:%" PRId64,
39!
1612
              pVgroup->dbName, pVgroup->vgId, vn, vgMem, pVgid->dnodeId, pDnode->memAvail, pDnode->memUsed);
1613
        pDnode->numOfVnodes--;
39✔
1614
        pVgroup->replica--;
39✔
1615
        *pDelVgid = *pVgid;
39✔
1616
        *pVgid = pVgroup->vnodeGid[pVgroup->replica];
39✔
1617
        memset(&pVgroup->vnodeGid[pVgroup->replica], 0, sizeof(SVnodeGid));
39✔
1618
        code = 0;
39✔
1619
        goto _OVER;
39✔
1620
      }
1621
    }
1622
  }
1623

1624
_OVER:
×
1625
  if (code != 0) {
39!
1626
    code = TSDB_CODE_APP_ERROR;
×
1627
    mError("db:%s, failed to remove vnode from vgId:%d since %s", pVgroup->dbName, pVgroup->vgId, tstrerror(code));
×
1628
    TAOS_RETURN(code);
×
1629
  }
1630

1631
  for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
113✔
1632
    SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
74✔
1633
    mInfo("db:%s, vgId:%d, vn:%d dnode:%d is reserved", pVgroup->dbName, pVgroup->vgId, vn, pVgid->dnodeId);
74!
1634
  }
1635

1636
  SSdbRaw *pVgRaw = mndVgroupActionEncode(pVgroup);
39✔
1637
  if (pVgRaw == NULL) {
39!
1638
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
1639
    if (terrno != 0) code = terrno;
×
1640
    TAOS_RETURN(code);
×
1641
  }
1642
  if (mndTransAppendRedolog(pTrans, pVgRaw) != 0) {
39!
1643
    sdbFreeRaw(pVgRaw);
×
1644
    TAOS_RETURN(code);
×
1645
  }
1646
  code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
39✔
1647
  if (code != 0) {
39!
1648
    mError("vgId:%d, failed to set raw status since %s at line:%d", pVgroup->vgId, tstrerror(code), __LINE__);
×
1649
  }
1650

1651
  TAOS_RETURN(code);
39✔
1652
}
1653

1654
static int32_t mndRemoveVnodeFromVgroupWithoutSave(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, SArray *pArray,
×
1655
                                                   SVnodeGid *pDelVgid) {
1656
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
×
1657
  for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
×
1658
    SDnodeObj *pDnode = taosArrayGet(pArray, i);
×
1659
    mInfo("dnode:%d, equivalent vnodes:%d others:%d", pDnode->id, pDnode->numOfVnodes, pDnode->numOfOtherNodes);
×
1660
  }
1661

1662
  int32_t code = -1;
×
1663
  for (int32_t d = taosArrayGetSize(pArray) - 1; d >= 0; --d) {
×
1664
    SDnodeObj *pDnode = taosArrayGet(pArray, d);
×
1665

1666
    for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
×
1667
      SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
×
1668
      if (pVgid->dnodeId == pDnode->id) {
×
1669
        int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
×
1670
        pDnode->memUsed -= vgMem;
×
1671
        mInfo("db:%s, vgId:%d, vn:%d is removed, memory:%" PRId64 ", dnode:%d avail:%" PRId64 " used:%" PRId64,
×
1672
              pVgroup->dbName, pVgroup->vgId, vn, vgMem, pVgid->dnodeId, pDnode->memAvail, pDnode->memUsed);
1673
        pDnode->numOfVnodes--;
×
1674
        pVgroup->replica--;
×
1675
        *pDelVgid = *pVgid;
×
1676
        *pVgid = pVgroup->vnodeGid[pVgroup->replica];
×
1677
        memset(&pVgroup->vnodeGid[pVgroup->replica], 0, sizeof(SVnodeGid));
×
1678
        code = 0;
×
1679
        goto _OVER;
×
1680
      }
1681
    }
1682
  }
1683

1684
_OVER:
×
1685
  if (code != 0) {
×
1686
    code = TSDB_CODE_APP_ERROR;
×
1687
    mError("db:%s, failed to remove vnode from vgId:%d since %s", pVgroup->dbName, pVgroup->vgId, tstrerror(code));
×
1688
    TAOS_RETURN(code);
×
1689
  }
1690

1691
  for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
×
1692
    SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
×
1693
    mInfo("db:%s, vgId:%d, vn:%d dnode:%d is reserved", pVgroup->dbName, pVgroup->vgId, vn, pVgid->dnodeId);
×
1694
  }
1695

1696
  TAOS_RETURN(code);
×
1697
}
1698

1699
/*
 * Appends a TDMT_DND_CREATE_VNODE redo action to pTrans, addressed to the
 * dnode named by pVgid->dnodeId. TSDB_CODE_VND_ALREADY_EXIST is registered as
 * the action's acceptable code.
 *
 * Returns 0 on success. When the dnode cannot be acquired or the request
 * cannot be built, returns terrno if it is set, else
 * TSDB_CODE_MND_RETURN_VALUE_NULL. Otherwise returns the error from
 * mndTransAppendRedoAction; the request buffer is freed here in that case.
 */
int32_t mndAddCreateVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, SVnodeGid *pVgid) {
  int32_t      code = 0;
  STransAction action = {0};

  SDnodeObj *pDnode = mndAcquireDnode(pMnode, pVgid->dnodeId);
  if (pDnode == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }
  action.epSet = mndGetDnodeEpset(pDnode);

  int32_t contLen = 0;
  void   *pReq = mndBuildCreateVnodeReq(pMnode, pDnode, pDb, pVgroup, &contLen);
  if (pReq == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    mndReleaseDnode(pMnode, pDnode);
    TAOS_RETURN(code);
  }
  // Released only now: the request builder above still receives pDnode.
  mndReleaseDnode(pMnode, pDnode);

  action.pCont = pReq;
  action.contLen = contLen;
  action.msgType = TDMT_DND_CREATE_VNODE;
  action.acceptableCode = TSDB_CODE_VND_ALREADY_EXIST;

  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
    taosMemoryFree(pReq);
    TAOS_RETURN(code);
  }

  TAOS_RETURN(code);
}
1724

1725
int32_t mndRestoreAddCreateVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
20✔
1726
                                       SDnodeObj *pDnode) {
1727
  int32_t      code = 0;
20✔
1728
  STransAction action = {0};
20✔
1729

1730
  action.epSet = mndGetDnodeEpset(pDnode);
20✔
1731

1732
  int32_t contLen = 0;
20✔
1733
  void   *pReq = mndBuildCreateVnodeReq(pMnode, pDnode, pDb, pVgroup, &contLen);
20✔
1734
  if (pReq == NULL) {
20!
1735
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
1736
    if (terrno != 0) code = terrno;
×
1737
    TAOS_RETURN(code);
×
1738
  }
1739

1740
  action.pCont = pReq;
20✔
1741
  action.contLen = contLen;
20✔
1742
  action.msgType = TDMT_DND_CREATE_VNODE;
20✔
1743
  action.acceptableCode = TSDB_CODE_VND_ALREADY_EXIST;
20✔
1744

1745
  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
20!
1746
    taosMemoryFree(pReq);
×
1747
    TAOS_RETURN(code);
×
1748
  }
1749

1750
  TAOS_RETURN(code);
20✔
1751
}
1752

1753
/*
 * Appends a TDMT_VND_ALTER_CONFIRM redo action to pTrans, addressed to the
 * vgroup's endpoint set. The message consists of a bare SMsgHead.
 * pDb is not used in this function.
 *
 * Returns 0 on success, terrno if the header cannot be allocated, or the
 * error from mndTransAppendRedoAction (the header is freed here in that case).
 */
int32_t mndAddAlterVnodeConfirmAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup) {
  STransAction action = {0};
  action.epSet = mndGetVgroupEpset(pMnode, pVgroup);

  mInfo("vgId:%d, build alter vnode confirm req", pVgroup->vgId);

  int32_t   msgLen = sizeof(SMsgHead);
  SMsgHead *pMsg = taosMemoryMalloc(msgLen);
  if (pMsg == NULL) {
    TAOS_RETURN(terrno);
  }

  // Both header fields are stored through htonl.
  pMsg->vgId = htonl(pVgroup->vgId);
  pMsg->contLen = htonl(msgLen);

  action.msgType = TDMT_VND_ALTER_CONFIRM;
  action.pCont = pMsg;
  action.contLen = msgLen;
  // An incorrect redirect result will cause this error, so it is set as the retry code.
  action.retryCode = TSDB_CODE_VND_INVALID_VGROUP_ID;

  int32_t code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pMsg);
  }
  TAOS_RETURN(code);
}
1781

1782
/*
 * Appends a TDMT_SYNC_CONFIG_CHANGE redo action to pTrans, addressed to the
 * endpoint set of pNewVgroup. The message is a SMsgHead immediately followed
 * by the request produced by mndBuildAlterVnodeReplicaReq.
 * pOldVgroup is not used in this function.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the request cannot be built; terrno if the message cannot be
 * allocated; otherwise the error from mndTransAppendRedoAction, in which case
 * the message is freed here.
 */
int32_t mndAddChangeConfigAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pOldVgroup, SVgObj *pNewVgroup,
                                 int32_t dnodeId) {
  int32_t      code = 0;
  STransAction action = {0};
  action.epSet = mndGetVgroupEpset(pMnode, pNewVgroup);

  int32_t bodyLen = 0;
  void   *pBody = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pNewVgroup, dnodeId, &bodyLen);
  if (pBody == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  int32_t   msgLen = bodyLen + sizeof(SMsgHead);
  SMsgHead *pMsg = taosMemoryMalloc(msgLen);
  if (pMsg == NULL) {
    taosMemoryFree(pBody);
    TAOS_RETURN(terrno);
  }

  pMsg->vgId = htonl(pNewVgroup->vgId);
  pMsg->contLen = htonl(msgLen);

  // Copy the request right behind the header; the temporary body is then dropped.
  memcpy((void *)(pMsg + 1), pBody, bodyLen);
  taosMemoryFree(pBody);

  action.msgType = TDMT_SYNC_CONFIG_CHANGE;
  action.pCont = pMsg;
  action.contLen = msgLen;

  code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pMsg);
  }
  TAOS_RETURN(code);
}
1821

1822
/*
 * Appends a TDMT_VND_ALTER_HASHRANGE redo action to pTrans, addressed to the
 * endpoint set of pVgroup. TSDB_CODE_VND_ALREADY_EXIST is registered as the
 * action's acceptable code.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the request cannot be built; otherwise the error from
 * mndTransAppendRedoAction, in which case the request buffer is freed here.
 */
static int32_t mndAddAlterVnodeHashRangeAction(SMnode *pMnode, STrans *pTrans, int32_t srcVgId, SVgObj *pVgroup) {
  int32_t      code = 0;
  int32_t      reqLen = 0;
  STransAction action = {0};

  action.epSet = mndGetVgroupEpset(pMnode, pVgroup);

  void *pBuf = mndBuildAlterVnodeHashRangeReq(pMnode, srcVgId, pVgroup, &reqLen);
  if (pBuf == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  action.msgType = TDMT_VND_ALTER_HASHRANGE;
  action.acceptableCode = TSDB_CODE_VND_ALREADY_EXIST;
  action.contLen = reqLen;
  action.pCont = pBuf;

  code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pBuf);
  } else {
    // Logged only once the action has been appended.
    mInfo("trans:%d, add alter vnode hash range action for from vgId:%d to vgId:%d", pTrans->id, srcVgId,
          pVgroup->vgId);
  }
  TAOS_RETURN(code);
}
1848

1849
/*
 * Appends a TDMT_VND_ALTER_CONFIG redo action to pTrans, addressed to the
 * endpoint set of pVgroup.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the request cannot be built; otherwise the error from
 * mndTransAppendRedoAction, in which case the request buffer is freed here.
 */
int32_t mndAddAlterVnodeConfigAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup) {
  int32_t      code = 0;
  int32_t      reqLen = 0;
  STransAction action = {0};

  action.epSet = mndGetVgroupEpset(pMnode, pVgroup);

  void *pBuf = mndBuildAlterVnodeConfigReq(pMnode, pDb, pVgroup, &reqLen);
  if (pBuf == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  action.msgType = TDMT_VND_ALTER_CONFIG;
  action.contLen = reqLen;
  action.pCont = pBuf;

  code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pBuf);
  }
  TAOS_RETURN(code);
}
1873

1874
/*
 * Encodes pVg, appends the raw to pTrans via mndTransAppendPrepareLog and
 * marks it SDB_STATUS_CREATING.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if encoding fails; the error from mndTransAppendPrepareLog (the raw is
 * freed here in that case); or the error from sdbSetRawStatus.
 */
int32_t mndAddNewVgPrepareAction(SMnode *pMnode, STrans *pTrans, SVgObj *pVg) {
  int32_t  code = 0;
  SSdbRaw *pRaw = mndVgroupActionEncode(pVg);
  if (pRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _err;
  }

  TAOS_CHECK_GOTO(mndTransAppendPrepareLog(pTrans, pRaw), NULL, _err);

  // The raw has been appended to the transaction at this point, so it is not
  // freed below. The status result is stored in `code` so that a failure is
  // reported to the caller instead of being dropped.
  code = sdbSetRawStatus(pRaw, SDB_STATUS_CREATING);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status since %s at line:%d", pVg->vgId, tstrerror(code), __LINE__);
  }
  TAOS_RETURN(code);

_err:
  sdbFreeRaw(pRaw);
  TAOS_RETURN(code);
}
1898

1899
/*
 * Appends a TDMT_VND_ALTER_REPLICA redo action to pTrans, addressed to the
 * dnode identified by dnodeId.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode cannot be acquired or the request cannot be built;
 * otherwise the error from mndTransAppendRedoAction, in which case the request
 * buffer is freed here.
 */
int32_t mndAddAlterVnodeReplicaAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId) {
  int32_t      code = 0;
  int32_t      reqLen = 0;
  STransAction action = {0};

  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  // Only the endpoint set is needed from the dnode; it is released right after.
  action.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  void *pBuf = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pVgroup, dnodeId, &reqLen);
  if (pBuf == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  action.msgType = TDMT_VND_ALTER_REPLICA;
  action.contLen = reqLen;
  action.pCont = pBuf;

  code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pBuf);
  }
  TAOS_RETURN(code);
}
1931

1932
/*
 * Appends a TDMT_DND_CHECK_VNODE_LEARNER_CATCHUP redo action to pTrans,
 * addressed to the dnode identified by dnodeId.
 * TSDB_CODE_VND_ALREADY_IS_VOTER is registered as the acceptable code and
 * TSDB_CODE_VND_NOT_CATCH_UP as the retry code.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode cannot be acquired or the request cannot be built;
 * otherwise the error from mndTransAppendRedoAction, in which case the request
 * buffer is freed here.
 */
int32_t mndAddCheckLearnerCatchupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId) {
  int32_t      code = 0;
  int32_t      reqLen = 0;
  STransAction action = {0};

  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  // Only the endpoint set is needed from the dnode; it is released right after.
  action.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  void *pBuf = mndBuildCheckLearnCatchupReq(pMnode, pDb, pVgroup, dnodeId, &reqLen);
  if (pBuf == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  action.msgType = TDMT_DND_CHECK_VNODE_LEARNER_CATCHUP;
  action.acceptableCode = TSDB_CODE_VND_ALREADY_IS_VOTER;
  action.retryCode = TSDB_CODE_VND_NOT_CATCH_UP;
  action.contLen = reqLen;
  action.pCont = pBuf;

  code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pBuf);
  }
  TAOS_RETURN(code);
}
1966

1967
/*
 * Appends a TDMT_DND_ALTER_VNODE_TYPE redo action to pTrans, addressed to the
 * dnode identified by dnodeId. The payload comes from
 * mndBuildAlterVnodeReplicaReq. TSDB_CODE_VND_ALREADY_IS_VOTER is registered
 * as the acceptable code and TSDB_CODE_VND_NOT_CATCH_UP as the retry code.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode cannot be acquired or the request cannot be built;
 * otherwise the error from mndTransAppendRedoAction, in which case the request
 * buffer is freed here.
 */
int32_t mndAddAlterVnodeTypeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId) {
  int32_t      code = 0;
  int32_t      reqLen = 0;
  STransAction action = {0};

  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  // Only the endpoint set is needed from the dnode; it is released right after.
  action.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  void *pBuf = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pVgroup, dnodeId, &reqLen);
  if (pBuf == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  action.msgType = TDMT_DND_ALTER_VNODE_TYPE;
  action.acceptableCode = TSDB_CODE_VND_ALREADY_IS_VOTER;
  action.retryCode = TSDB_CODE_VND_NOT_CATCH_UP;
  action.contLen = reqLen;
  action.pCont = pBuf;

  code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pBuf);
  }
  TAOS_RETURN(code);
}
2001

2002
int32_t mndRestoreAddAlterVnodeTypeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
20✔
2003
                                          SDnodeObj *pDnode) {
2004
  int32_t      code = 0;
20✔
2005
  STransAction action = {0};
20✔
2006
  action.epSet = mndGetDnodeEpset(pDnode);
20✔
2007

2008
  int32_t contLen = 0;
20✔
2009
  void   *pReq = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pVgroup, pDnode->id, &contLen);
20✔
2010
  if (pReq == NULL) {
20!
2011
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2012
    if (terrno != 0) code = terrno;
×
2013
    TAOS_RETURN(code);
×
2014
  }
2015

2016
  action.pCont = pReq;
20✔
2017
  action.contLen = contLen;
20✔
2018
  action.msgType = TDMT_DND_ALTER_VNODE_TYPE;
20✔
2019
  action.acceptableCode = TSDB_CODE_VND_ALREADY_IS_VOTER;
20✔
2020
  action.retryCode = TSDB_CODE_VND_NOT_CATCH_UP;
20✔
2021

2022
  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
20!
2023
    taosMemoryFree(pReq);
×
2024
    TAOS_RETURN(code);
×
2025
  }
2026

2027
  TAOS_RETURN(code);
20✔
2028
}
2029

2030
/*
 * Appends a TDMT_VND_DISABLE_WRITE redo action to pTrans, addressed to the
 * dnode identified by dnodeId.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode cannot be acquired or the request cannot be built;
 * otherwise the error from mndTransAppendRedoAction, in which case the request
 * buffer is freed here.
 */
static int32_t mndAddDisableVnodeWriteAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                             int32_t dnodeId) {
  int32_t      code = 0;
  int32_t      reqLen = 0;
  STransAction action = {0};

  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  // Only the endpoint set is needed from the dnode; it is released right after.
  action.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  void *pBuf = mndBuildDisableVnodeWriteReq(pMnode, pDb, pVgroup->vgId, &reqLen);
  if (pBuf == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  action.msgType = TDMT_VND_DISABLE_WRITE;
  action.contLen = reqLen;
  action.pCont = pBuf;

  code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pBuf);
  }
  TAOS_RETURN(code);
}
2063

2064
/*
 * Appends a TDMT_DND_DROP_VNODE action to pTrans, addressed to the dnode named
 * by pVgid->dnodeId. TSDB_CODE_VND_NOT_EXIST is registered as the action's
 * acceptable code.
 *
 * isRedo selects the list: true appends with mndTransAppendRedoAction, false
 * with mndTransAppendUndoAction.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode cannot be acquired or the request cannot be built;
 * otherwise the error from the append call, in which case the request buffer
 * is freed here.
 */
int32_t mndAddDropVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, SVnodeGid *pVgid,
                              bool isRedo) {
  int32_t      code = 0;
  STransAction action = {0};

  SDnodeObj *pDnode = mndAcquireDnode(pMnode, pVgid->dnodeId);
  if (pDnode == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }
  action.epSet = mndGetDnodeEpset(pDnode);

  int32_t contLen = 0;
  void   *pReq = mndBuildDropVnodeReq(pMnode, pDnode, pDb, pVgroup, &contLen);
  if (pReq == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    mndReleaseDnode(pMnode, pDnode);
    TAOS_RETURN(code);
  }
  // Released only now: the request builder above still receives pDnode.
  mndReleaseDnode(pMnode, pDnode);

  action.pCont = pReq;
  action.contLen = contLen;
  action.msgType = TDMT_DND_DROP_VNODE;
  action.acceptableCode = TSDB_CODE_VND_NOT_EXIST;

  if (isRedo) {
    code = mndTransAppendRedoAction(pTrans, &action);
  } else {
    code = mndTransAppendUndoAction(pTrans, &action);
  }
  if (code != 0) {
    taosMemoryFree(pReq);
  }

  TAOS_RETURN(code);
}
2105

2106
int32_t mndSetMoveVgroupInfoToTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t vnIndex,
33✔
2107
                                    SArray *pArray, bool force, bool unsafe) {
2108
  int32_t code = 0;
33✔
2109
  SVgObj  newVg = {0};
33✔
2110
  memcpy(&newVg, pVgroup, sizeof(SVgObj));
33✔
2111

2112
  mInfo("vgId:%d, vgroup info before move, replica:%d", newVg.vgId, newVg.replica);
33!
2113
  for (int32_t i = 0; i < newVg.replica; ++i) {
102✔
2114
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg.vgId, i, newVg.vnodeGid[i].dnodeId);
69!
2115
  }
2116

2117
  if (!force) {
33✔
2118
#if 1
2119
    {
2120
#else
2121
    if (newVg.replica == 1) {
2122
#endif
2123
      mInfo("vgId:%d, will add 1 vnode, replca:%d", pVgroup->vgId, newVg.replica);
29!
2124
      TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVg, pArray));
29✔
2125
      for (int32_t i = 0; i < newVg.replica - 1; ++i) {
88✔
2126
        TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId));
60!
2127
      }
2128
      TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg, &newVg.vnodeGid[newVg.replica - 1]));
28!
2129
      TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg));
28!
2130

2131
      mInfo("vgId:%d, will remove 1 vnode, replca:2", pVgroup->vgId);
28!
2132
      newVg.replica--;
28✔
2133
      SVnodeGid del = newVg.vnodeGid[vnIndex];
28✔
2134
      newVg.vnodeGid[vnIndex] = newVg.vnodeGid[newVg.replica];
28✔
2135
      memset(&newVg.vnodeGid[newVg.replica], 0, sizeof(SVnodeGid));
28✔
2136
      {
2137
        SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
28✔
2138
        if (pRaw == NULL) {
28!
2139
          code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2140
          if (terrno != 0) code = terrno;
×
2141
          TAOS_RETURN(code);
×
2142
        }
2143
        if ((code = mndTransAppendRedolog(pTrans, pRaw)) != 0) {
28!
2144
          sdbFreeRaw(pRaw);
×
2145
          TAOS_RETURN(code);
×
2146
        }
2147
        code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
28✔
2148
        if (code != 0) {
28!
2149
          mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2150
          return code;
×
2151
        }
2152
      }
2153

2154
      TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pDb, &newVg, &del, true));
28!
2155
      for (int32_t i = 0; i < newVg.replica; ++i) {
88✔
2156
        TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId));
60!
2157
      }
2158
      TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg));
28!
2159
#if 1
2160
    }
2161
#else
2162
    } else {  // new replica == 3
2163
      mInfo("vgId:%d, will add 1 vnode, replca:3", pVgroup->vgId);
2164
      if (mndAddVnodeToVgroup(pMnode, pTrans, &newVg, pArray) != 0) return -1;
2165
      mInfo("vgId:%d, will remove 1 vnode, replca:4", pVgroup->vgId);
2166
      newVg.replica--;
2167
      SVnodeGid del = newVg.vnodeGid[vnIndex];
2168
      newVg.vnodeGid[vnIndex] = newVg.vnodeGid[newVg.replica];
2169
      memset(&newVg.vnodeGid[newVg.replica], 0, sizeof(SVnodeGid));
2170
      {
2171
        SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
2172
        if (pRaw == NULL) return -1;
2173
        if (mndTransAppendRedolog(pTrans, pRaw) != 0) {
2174
          sdbFreeRaw(pRaw);
2175
          return -1;
2176
        }
2177
      }
2178

2179
      if (mndAddDropVnodeAction(pMnode, pTrans, pDb, &newVg, &del, true) != 0) return -1;
2180
      for (int32_t i = 0; i < newVg.replica; ++i) {
2181
        if (i == vnIndex) continue;
2182
        if (mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId) != 0) return -1;
2183
      }
2184
      if (mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg, &newVg.vnodeGid[vnIndex]) != 0) return -1;
2185
      if (mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg) != 0) return -1;
2186
    }
2187
#endif
2188
  } else {
2189
    mInfo("vgId:%d, will add 1 vnode and force remove 1 vnode", pVgroup->vgId);
4!
2190
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVg, pArray));
4!
2191
    newVg.replica--;
4✔
2192
    // SVnodeGid del = newVg.vnodeGid[vnIndex];
2193
    newVg.vnodeGid[vnIndex] = newVg.vnodeGid[newVg.replica];
4✔
2194
    memset(&newVg.vnodeGid[newVg.replica], 0, sizeof(SVnodeGid));
4✔
2195
    {
2196
      SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
4✔
2197
      if (pRaw == NULL) {
4!
2198
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2199
        if (terrno != 0) code = terrno;
×
2200
        TAOS_RETURN(code);
×
2201
      }
2202
      if ((code = mndTransAppendRedolog(pTrans, pRaw)) != 0) {
4!
2203
        sdbFreeRaw(pRaw);
×
2204
        TAOS_RETURN(code);
×
2205
      }
2206
      code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
4✔
2207
      if (code != 0) {
4!
2208
        mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2209
        return code;
×
2210
      }
2211
    }
2212

2213
    for (int32_t i = 0; i < newVg.replica; ++i) {
12✔
2214
      if (i != vnIndex) {
8✔
2215
        TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId));
4!
2216
      }
2217
    }
2218
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg, &newVg.vnodeGid[vnIndex]));
4!
2219
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg));
4!
2220

2221
    if (newVg.replica == 1) {
4✔
2222
      if (force && !unsafe) {
2!
2223
        TAOS_RETURN(TSDB_CODE_VND_META_DATA_UNSAFE_DELETE);
1✔
2224
      }
2225

2226
      SSdb *pSdb = pMnode->pSdb;
1✔
2227
      void *pIter = NULL;
1✔
2228

2229
      while (1) {
3✔
2230
        SStbObj *pStb = NULL;
4✔
2231
        pIter = sdbFetch(pSdb, SDB_STB, pIter, (void **)&pStb);
4✔
2232
        if (pIter == NULL) break;
4✔
2233

2234
        if (strcmp(pStb->db, pDb->name) == 0) {
3✔
2235
          if ((code = mndSetForceDropCreateStbRedoActions(pMnode, pTrans, &newVg, pStb)) != 0) {
2!
2236
            sdbCancelFetch(pSdb, pIter);
×
2237
            sdbRelease(pSdb, pStb);
×
2238
            TAOS_RETURN(code);
×
2239
          }
2240
        }
2241

2242
        sdbRelease(pSdb, pStb);
3✔
2243
      }
2244

2245
      mInfo("vgId:%d, all data is dropped since replica=1", pVgroup->vgId);
1!
2246
    }
2247
  }
2248

2249
  {
2250
    SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
31✔
2251
    if (pRaw == NULL) {
31!
2252
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2253
      if (terrno != 0) code = terrno;
×
2254
      TAOS_RETURN(code);
×
2255
    }
2256
    if ((code = mndTransAppendCommitlog(pTrans, pRaw)) != 0) {
31!
2257
      sdbFreeRaw(pRaw);
×
2258
      TAOS_RETURN(code);
×
2259
    }
2260
    code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
31✔
2261
    if (code != 0) {
31!
2262
      mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2263
      return code;
×
2264
    }
2265
  }
2266

2267
  mInfo("vgId:%d, vgroup info after move, replica:%d", newVg.vgId, newVg.replica);
31!
2268
  for (int32_t i = 0; i < newVg.replica; ++i) {
98✔
2269
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg.vgId, i, newVg.vnodeGid[i].dnodeId);
67!
2270
  }
2271
  TAOS_RETURN(code);
31✔
2272
}
2273

2274
/*
 * For every vgroup that has a replica on dnode delDnodeId, adds to pTrans the
 * steps that move that replica elsewhere (see mndSetMoveVgroupInfoToTrans).
 * Candidate dnodes come from mndBuildDnodesArray(pMnode, delDnodeId, NULL).
 *
 * Iteration stops at the first failure. `force` and `unsafe` are passed
 * through unchanged.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode array cannot be built or a vgroup's db cannot be
 * acquired; otherwise the first error from mndSetMoveVgroupInfoToTrans.
 */
int32_t mndSetMoveVgroupsInfoToTrans(SMnode *pMnode, STrans *pTrans, int32_t delDnodeId, bool force, bool unsafe) {
  int32_t code = 0;
  SArray *pArray = mndBuildDnodesArray(pMnode, delDnodeId, NULL);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  void *pIter = NULL;
  while (1) {
    SVgObj *pVgroup = NULL;
    pIter = sdbFetch(pMnode->pSdb, SDB_VGROUP, pIter, (void **)&pVgroup);
    if (pIter == NULL) break;

    // Find the slot of this vgroup that lives on the dnode being vacated, if any.
    int32_t vnIndex = -1;
    for (int32_t i = 0; i < pVgroup->replica; ++i) {
      if (pVgroup->vnodeGid[i].dnodeId == delDnodeId) {
        vnIndex = i;
        break;
      }
    }

    code = 0;
    if (vnIndex != -1) {
      mInfo("vgId:%d, vnode:%d will be removed from dnode:%d, force:%d", pVgroup->vgId, vnIndex, delDnodeId, force);
      SDbObj *pDb = mndAcquireDb(pMnode, pVgroup->dbName);
      if (pDb == NULL) {
        // The move reads fields of the db object, so a missing db is an error.
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
        if (terrno != 0) code = terrno;
        mError("vgId:%d, failed to acquire db:%s since %s", pVgroup->vgId, pVgroup->dbName, tstrerror(code));
      } else {
        code = mndSetMoveVgroupInfoToTrans(pMnode, pTrans, pDb, pVgroup, vnIndex, pArray, force, unsafe);
        mndReleaseDb(pMnode, pDb);
      }
    }

    sdbRelease(pMnode->pSdb, pVgroup);

    if (code != 0) {
      // Leaving the loop early: the in-progress fetch has to be cancelled.
      sdbCancelFetch(pMnode->pSdb, pIter);
      break;
    }
  }

  taosArrayDestroy(pArray);
  TAOS_RETURN(code);
}
2316

2317
/*
 * Add one replica, hosted on `newDnodeId`, to `pVgroup` and append the
 * corresponding steps to `pTrans`.
 *
 * `pVgroup` is modified in place: the slot at index `replica` is filled in as
 * an offline learner and `replica` is incremented. The steps appended are, in
 * order: a redo log of the updated vgroup, alter-replica actions for the
 * existing members, a create-vnode action for the new member, a switch of the
 * new member to voter followed by a second round of alter-replica actions,
 * and a final confirm action.
 *
 * Returns 0 on success or the first non-zero code from any step.
 */
static int32_t mndAddIncVgroupReplicaToTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                             int32_t newDnodeId) {
  int32_t code = 0;
  mInfo("vgId:%d, will add 1 vnode, replica:%d dnode:%d", pVgroup->vgId, pVgroup->replica, newDnodeId);

  // take the first unused slot for the incoming vnode; it starts as an offline learner
  SVnodeGid *pAdded = &pVgroup->vnodeGid[pVgroup->replica];
  pAdded->dnodeId = newDnodeId;
  pAdded->syncState = TAOS_SYNC_STATE_OFFLINE;
  pAdded->nodeRole = TAOS_SYNC_ROLE_LEARNER;
  pVgroup->replica++;

  // redo log carrying the enlarged vgroup
  SSdbRaw *pRedoRaw = mndVgroupActionEncode(pVgroup);
  if (pRedoRaw == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }
  code = mndTransAppendRedolog(pTrans, pRedoRaw);
  if (code != 0) {
    sdbFreeRaw(pRedoRaw);
    TAOS_RETURN(code);
  }
  code = sdbSetRawStatus(pRedoRaw, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status since %s at line:%d", pVgroup->vgId, tstrerror(code), __LINE__);
    TAOS_RETURN(code);
  }

  // phase 1: tell the existing members (every slot but the last), then create the learner
  for (int32_t member = 0; member < pVgroup->replica - 1; ++member) {
    TAOS_CHECK_RETURN(
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, pVgroup, pVgroup->vnodeGid[member].dnodeId));
  }
  TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pDb, pVgroup, pAdded));

  // phase 2: switch the new vnode to voter and tell the existing members again
  pAdded->nodeRole = TAOS_SYNC_ROLE_VOTER;
  TAOS_CHECK_RETURN(mndAddAlterVnodeTypeAction(pMnode, pTrans, pDb, pVgroup, pAdded->dnodeId));
  for (int32_t member = 0; member < pVgroup->replica - 1; ++member) {
    TAOS_CHECK_RETURN(
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, pVgroup, pVgroup->vnodeGid[member].dnodeId));
  }

  // phase 3: confirm
  TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, pVgroup));

  TAOS_RETURN(code);
}
2363

2364
/*
 * Remove the replica hosted on `delDnodeId` from `pVgroup` and append the
 * corresponding steps to `pTrans`.
 *
 * `pVgroup` is modified in place: the removed entry is overwritten by the
 * last entry, the last slot is zeroed and `replica` is decremented. The steps
 * appended are a redo log of the shrunken vgroup, a drop-vnode action for the
 * removed member, alter-replica actions for the remaining members and a
 * confirm action.
 *
 * Returns 0 when `delDnodeId` hosts no replica of this vgroup (nothing is
 * changed), 0 on success, or the first non-zero code from any step.
 */
static int32_t mndAddDecVgroupReplicaFromTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                               int32_t delDnodeId) {
  int32_t code = 0;
  mInfo("vgId:%d, will remove 1 vnode, replica:%d dnode:%d", pVgroup->vgId, pVgroup->replica, delDnodeId);

  SVnodeGid *pGid = NULL;
  SVnodeGid  delGid = {0};
  for (int32_t i = 0; i < pVgroup->replica; ++i) {
    if (pVgroup->vnodeGid[i].dnodeId == delDnodeId) {
      pGid = &pVgroup->vnodeGid[i];
      break;
    }
  }

  if (pGid == NULL) return 0;

  pVgroup->replica--;
  // keep a private copy of the entry being removed; the drop action needs it below
  memcpy(&delGid, pGid, sizeof(SVnodeGid));
  // Fill the hole with the last entry. memmove, not memcpy: when the removed
  // vnode already occupies the last slot, source and destination are the same
  // object, and memcpy is undefined for overlapping regions.
  memmove(pGid, &pVgroup->vnodeGid[pVgroup->replica], sizeof(SVnodeGid));
  memset(&pVgroup->vnodeGid[pVgroup->replica], 0, sizeof(SVnodeGid));

  SSdbRaw *pVgRaw = mndVgroupActionEncode(pVgroup);
  if (pVgRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }
  if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
    sdbFreeRaw(pVgRaw);
    TAOS_RETURN(code);
  }
  code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status since %s at line:%d", pVgroup->vgId, tstrerror(code), __LINE__);
    TAOS_RETURN(code);
  }

  TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pDb, pVgroup, &delGid, true));
  for (int32_t i = 0; i < pVgroup->replica; ++i) {
    TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, pVgroup, pVgroup->vnodeGid[i].dnodeId));
  }
  TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, pVgroup));

  TAOS_RETURN(code);
}
2409

2410
static int32_t mndRedistributeVgroup(SMnode *pMnode, SRpcMsg *pReq, SDbObj *pDb, SVgObj *pVgroup, SDnodeObj *pNew1,
79✔
2411
                                     SDnodeObj *pOld1, SDnodeObj *pNew2, SDnodeObj *pOld2, SDnodeObj *pNew3,
2412
                                     SDnodeObj *pOld3) {
2413
  int32_t code = -1;
79✔
2414
  STrans *pTrans = NULL;
79✔
2415

2416
  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_GLOBAL, pReq, "red-vgroup");
79✔
2417
  if (pTrans == NULL) {
79!
2418
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2419
    if (terrno != 0) code = terrno;
×
2420
    goto _OVER;
×
2421
  }
2422

2423
  mndTransSetDbName(pTrans, pVgroup->dbName, NULL);
79✔
2424
  TAOS_CHECK_GOTO(mndTransCheckConflictWithCompact(pMnode, pTrans), NULL, _OVER);
79✔
2425

2426
  mndTransSetSerial(pTrans);
78✔
2427
  mInfo("trans:%d, used to redistribute vgroup, vgId:%d", pTrans->id, pVgroup->vgId);
78!
2428

2429
  SVgObj newVg = {0};
78✔
2430
  memcpy(&newVg, pVgroup, sizeof(SVgObj));
78✔
2431
  mInfo("vgId:%d, vgroup info before redistribute, replica:%d", newVg.vgId, newVg.replica);
78!
2432
  for (int32_t i = 0; i < newVg.replica; ++i) {
234✔
2433
    mInfo("vgId:%d, vnode:%d dnode:%d role:%s", newVg.vgId, i, newVg.vnodeGid[i].dnodeId,
156!
2434
          syncStr(newVg.vnodeGid[i].syncState));
2435
  }
2436

2437
  if (pNew1 != NULL && pOld1 != NULL) {
78!
2438
    int32_t numOfVnodes = mndGetVnodesNum(pMnode, pNew1->id);
78✔
2439
    if (numOfVnodes >= pNew1->numOfSupportVnodes) {
78✔
2440
      mError("vgId:%d, no enough vnodes in dnode:%d, numOfVnodes:%d support:%d", newVg.vgId, pNew1->id, numOfVnodes,
1!
2441
             pNew1->numOfSupportVnodes);
2442
      code = TSDB_CODE_MND_NO_ENOUGH_VNODES;
1✔
2443
      goto _OVER;
1✔
2444
    }
2445

2446
    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
77✔
2447
    if (pNew1->memAvail - vgMem - pNew1->memUsed <= 0) {
77!
2448
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
×
2449
             pVgroup->dbName, pVgroup->vgId, vgMem, pNew1->id, pNew1->memAvail, pNew1->memUsed);
2450
      code = TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE;
×
2451
      goto _OVER;
×
2452
    } else {
2453
      pNew1->memUsed += vgMem;
77✔
2454
    }
2455

2456
    TAOS_CHECK_GOTO(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &newVg, pNew1->id), NULL, _OVER);
77!
2457
    TAOS_CHECK_GOTO(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &newVg, pOld1->id), NULL, _OVER);
77!
2458
  }
2459

2460
  if (pNew2 != NULL && pOld2 != NULL) {
77!
2461
    int32_t numOfVnodes = mndGetVnodesNum(pMnode, pNew2->id);
16✔
2462
    if (numOfVnodes >= pNew2->numOfSupportVnodes) {
16!
2463
      mError("vgId:%d, no enough vnodes in dnode:%d, numOfVnodes:%d support:%d", newVg.vgId, pNew2->id, numOfVnodes,
×
2464
             pNew2->numOfSupportVnodes);
2465
      code = TSDB_CODE_MND_NO_ENOUGH_VNODES;
×
2466
      goto _OVER;
×
2467
    }
2468
    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
16✔
2469
    if (pNew2->memAvail - vgMem - pNew2->memUsed <= 0) {
16!
2470
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
×
2471
             pVgroup->dbName, pVgroup->vgId, vgMem, pNew2->id, pNew2->memAvail, pNew2->memUsed);
2472
      code = TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE;
×
2473
      goto _OVER;
×
2474
    } else {
2475
      pNew2->memUsed += vgMem;
16✔
2476
    }
2477
    TAOS_CHECK_GOTO(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &newVg, pNew2->id), NULL, _OVER);
16!
2478
    TAOS_CHECK_GOTO(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &newVg, pOld2->id), NULL, _OVER);
16!
2479
  }
2480

2481
  if (pNew3 != NULL && pOld3 != NULL) {
77!
2482
    int32_t numOfVnodes = mndGetVnodesNum(pMnode, pNew3->id);
8✔
2483
    if (numOfVnodes >= pNew3->numOfSupportVnodes) {
8!
2484
      mError("vgId:%d, no enough vnodes in dnode:%d, numOfVnodes:%d support:%d", newVg.vgId, pNew3->id, numOfVnodes,
×
2485
             pNew3->numOfSupportVnodes);
2486
      code = TSDB_CODE_MND_NO_ENOUGH_VNODES;
×
2487
      goto _OVER;
×
2488
    }
2489
    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
8✔
2490
    if (pNew3->memAvail - vgMem - pNew3->memUsed <= 0) {
8!
2491
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
×
2492
             pVgroup->dbName, pVgroup->vgId, vgMem, pNew3->id, pNew3->memAvail, pNew3->memUsed);
2493
      code = TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE;
×
2494
      goto _OVER;
×
2495
    } else {
2496
      pNew3->memUsed += vgMem;
8✔
2497
    }
2498
    TAOS_CHECK_GOTO(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &newVg, pNew3->id), NULL, _OVER);
8!
2499
    TAOS_CHECK_GOTO(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &newVg, pOld3->id), NULL, _OVER);
8!
2500
  }
2501

2502
  {
2503
    SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
77✔
2504
    if (pRaw == NULL) {
77!
2505
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2506
      if (terrno != 0) code = terrno;
×
2507
      goto _OVER;
×
2508
    }
2509
    if ((code = mndTransAppendCommitlog(pTrans, pRaw)) != 0) {
77!
2510
      sdbFreeRaw(pRaw);
×
2511
      goto _OVER;
×
2512
    }
2513
    code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
77✔
2514
    if (code != 0) {
77!
2515
      mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2516
      goto _OVER;
×
2517
    }
2518
  }
2519

2520
  mInfo("vgId:%d, vgroup info after redistribute, replica:%d", newVg.vgId, newVg.replica);
77!
2521
  for (int32_t i = 0; i < newVg.replica; ++i) {
230✔
2522
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg.vgId, i, newVg.vnodeGid[i].dnodeId);
153!
2523
  }
2524

2525
  TAOS_CHECK_GOTO(mndTransPrepare(pMnode, pTrans), NULL, _OVER);
77!
2526
  code = 0;
77✔
2527

2528
_OVER:
79✔
2529
  mndTransDrop(pTrans);
79✔
2530
  mndReleaseDb(pMnode, pDb);
79✔
2531
  TAOS_RETURN(code);
79✔
2532
}
2533

2534
static int32_t mndProcessRedistributeVgroupMsg(SRpcMsg *pReq) {
95✔
2535
  SMnode    *pMnode = pReq->info.node;
95✔
2536
  SDnodeObj *pNew1 = NULL;
95✔
2537
  SDnodeObj *pNew2 = NULL;
95✔
2538
  SDnodeObj *pNew3 = NULL;
95✔
2539
  SDnodeObj *pOld1 = NULL;
95✔
2540
  SDnodeObj *pOld2 = NULL;
95✔
2541
  SDnodeObj *pOld3 = NULL;
95✔
2542
  SVgObj    *pVgroup = NULL;
95✔
2543
  SDbObj    *pDb = NULL;
95✔
2544
  int32_t    code = -1;
95✔
2545
  int64_t    curMs = taosGetTimestampMs();
95✔
2546
  int32_t    newDnodeId[3] = {0};
95✔
2547
  int32_t    oldDnodeId[3] = {0};
95✔
2548
  int32_t    newIndex = -1;
95✔
2549
  int32_t    oldIndex = -1;
95✔
2550

2551
  SRedistributeVgroupReq req = {0};
95✔
2552
  if (tDeserializeSRedistributeVgroupReq(pReq->pCont, pReq->contLen, &req) != 0) {
95!
2553
    code = TSDB_CODE_INVALID_MSG;
×
2554
    goto _OVER;
×
2555
  }
2556

2557
  mInfo("vgId:%d, start to redistribute vgroup to dnode %d:%d:%d", req.vgId, req.dnodeId1, req.dnodeId2, req.dnodeId3);
95!
2558
  if ((code = mndCheckOperPrivilege(pMnode, pReq->info.conn.user, MND_OPER_REDISTRIBUTE_VGROUP)) != 0) {
95✔
2559
    goto _OVER;
1✔
2560
  }
2561

2562
  pVgroup = mndAcquireVgroup(pMnode, req.vgId);
94✔
2563
  if (pVgroup == NULL) {
94✔
2564
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
3✔
2565
    if (terrno != 0) code = terrno;
3!
2566
    goto _OVER;
3✔
2567
  }
2568

2569
  pDb = mndAcquireDb(pMnode, pVgroup->dbName);
91✔
2570
  if (pDb == NULL) {
91!
2571
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2572
    if (terrno != 0) code = terrno;
×
2573
    goto _OVER;
×
2574
  }
2575

2576
  if (pVgroup->replica == 1) {
91✔
2577
    if (req.dnodeId1 <= 0 || req.dnodeId2 > 0 || req.dnodeId3 > 0) {
43!
2578
      code = TSDB_CODE_MND_INVALID_REPLICA;
×
2579
      goto _OVER;
×
2580
    }
2581

2582
    if (req.dnodeId1 == pVgroup->vnodeGid[0].dnodeId) {
43✔
2583
      // terrno = TSDB_CODE_MND_VGROUP_UN_CHANGED;
2584
      code = 0;
1✔
2585
      goto _OVER;
1✔
2586
    }
2587

2588
    pNew1 = mndAcquireDnode(pMnode, req.dnodeId1);
42✔
2589
    if (pNew1 == NULL) {
42!
2590
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2591
      if (terrno != 0) code = terrno;
×
2592
      goto _OVER;
×
2593
    }
2594
    if (!mndIsDnodeOnline(pNew1, curMs)) {
42!
2595
      code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2596
      goto _OVER;
×
2597
    }
2598

2599
    pOld1 = mndAcquireDnode(pMnode, pVgroup->vnodeGid[0].dnodeId);
42✔
2600
    if (pOld1 == NULL) {
42!
2601
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2602
      if (terrno != 0) code = terrno;
×
2603
      goto _OVER;
×
2604
    }
2605
    if (!mndIsDnodeOnline(pOld1, curMs)) {
42✔
2606
      code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
2✔
2607
      goto _OVER;
2✔
2608
    }
2609

2610
    code = mndRedistributeVgroup(pMnode, pReq, pDb, pVgroup, pNew1, pOld1, NULL, NULL, NULL, NULL);
40✔
2611

2612
  } else if (pVgroup->replica == 3) {
48!
2613
    if (req.dnodeId1 <= 0 || req.dnodeId2 <= 0 || req.dnodeId3 <= 0) {
48!
2614
      code = TSDB_CODE_MND_INVALID_REPLICA;
4✔
2615
      goto _OVER;
4✔
2616
    }
2617

2618
    if (req.dnodeId1 == req.dnodeId2 || req.dnodeId1 == req.dnodeId3 || req.dnodeId2 == req.dnodeId3) {
44!
2619
      code = TSDB_CODE_MND_INVALID_REPLICA;
1✔
2620
      goto _OVER;
1✔
2621
    }
2622

2623
    if (req.dnodeId1 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId1 != pVgroup->vnodeGid[1].dnodeId &&
43✔
2624
        req.dnodeId1 != pVgroup->vnodeGid[2].dnodeId) {
22✔
2625
      newDnodeId[++newIndex] = req.dnodeId1;
19✔
2626
      mInfo("vgId:%d, dnode:%d will be added, index:%d", pVgroup->vgId, newDnodeId[newIndex], newIndex);
19!
2627
    }
2628

2629
    if (req.dnodeId2 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[1].dnodeId &&
43✔
2630
        req.dnodeId2 != pVgroup->vnodeGid[2].dnodeId) {
29✔
2631
      newDnodeId[++newIndex] = req.dnodeId2;
22✔
2632
      mInfo("vgId:%d, dnode:%d will be added, index:%d", pVgroup->vgId, newDnodeId[newIndex], newIndex);
22!
2633
    }
2634

2635
    if (req.dnodeId3 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId3 != pVgroup->vnodeGid[1].dnodeId &&
43✔
2636
        req.dnodeId3 != pVgroup->vnodeGid[2].dnodeId) {
35✔
2637
      newDnodeId[++newIndex] = req.dnodeId3;
29✔
2638
      mInfo("vgId:%d, dnode:%d will be added, index:%d", pVgroup->vgId, newDnodeId[newIndex], newIndex);
29!
2639
    }
2640

2641
    if (req.dnodeId1 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[0].dnodeId &&
43✔
2642
        req.dnodeId3 != pVgroup->vnodeGid[0].dnodeId) {
27✔
2643
      oldDnodeId[++oldIndex] = pVgroup->vnodeGid[0].dnodeId;
25✔
2644
      mInfo("vgId:%d, dnode:%d will be removed, index:%d", pVgroup->vgId, oldDnodeId[oldIndex], oldIndex);
25!
2645
    }
2646

2647
    if (req.dnodeId1 != pVgroup->vnodeGid[1].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[1].dnodeId &&
43✔
2648
        req.dnodeId3 != pVgroup->vnodeGid[1].dnodeId) {
24✔
2649
      oldDnodeId[++oldIndex] = pVgroup->vnodeGid[1].dnodeId;
18✔
2650
      mInfo("vgId:%d, dnode:%d will be removed, index:%d", pVgroup->vgId, oldDnodeId[oldIndex], oldIndex);
18!
2651
    }
2652

2653
    if (req.dnodeId1 != pVgroup->vnodeGid[2].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[2].dnodeId &&
43✔
2654
        req.dnodeId3 != pVgroup->vnodeGid[2].dnodeId) {
33✔
2655
      oldDnodeId[++oldIndex] = pVgroup->vnodeGid[2].dnodeId;
27✔
2656
      mInfo("vgId:%d, dnode:%d will be removed, index:%d", pVgroup->vgId, oldDnodeId[oldIndex], oldIndex);
27!
2657
    }
2658

2659
    if (newDnodeId[0] != 0) {
43✔
2660
      pNew1 = mndAcquireDnode(pMnode, newDnodeId[0]);
42✔
2661
      if (pNew1 == NULL) {
42!
2662
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2663
        if (terrno != 0) code = terrno;
×
2664
        goto _OVER;
×
2665
      }
2666
      if (!mndIsDnodeOnline(pNew1, curMs)) {
42✔
2667
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
1✔
2668
        goto _OVER;
1✔
2669
      }
2670
    }
2671

2672
    if (newDnodeId[1] != 0) {
42✔
2673
      pNew2 = mndAcquireDnode(pMnode, newDnodeId[1]);
18✔
2674
      if (pNew2 == NULL) {
18!
2675
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2676
        if (terrno != 0) code = terrno;
×
2677
        goto _OVER;
×
2678
      }
2679
      if (!mndIsDnodeOnline(pNew2, curMs)) {
18!
2680
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2681
        goto _OVER;
×
2682
      }
2683
    }
2684

2685
    if (newDnodeId[2] != 0) {
42✔
2686
      pNew3 = mndAcquireDnode(pMnode, newDnodeId[2]);
10✔
2687
      if (pNew3 == NULL) {
10!
2688
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2689
        if (terrno != 0) code = terrno;
×
2690
        goto _OVER;
×
2691
      }
2692
      if (!mndIsDnodeOnline(pNew3, curMs)) {
10!
2693
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2694
        goto _OVER;
×
2695
      }
2696
    }
2697

2698
    if (oldDnodeId[0] != 0) {
42✔
2699
      pOld1 = mndAcquireDnode(pMnode, oldDnodeId[0]);
41✔
2700
      if (pOld1 == NULL) {
41!
2701
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2702
        if (terrno != 0) code = terrno;
×
2703
        goto _OVER;
×
2704
      }
2705
      if (!mndIsDnodeOnline(pOld1, curMs)) {
41✔
2706
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
2✔
2707
        goto _OVER;
2✔
2708
      }
2709
    }
2710

2711
    if (oldDnodeId[1] != 0) {
40✔
2712
      pOld2 = mndAcquireDnode(pMnode, oldDnodeId[1]);
16✔
2713
      if (pOld2 == NULL) {
16!
2714
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2715
        if (terrno != 0) code = terrno;
×
2716
        goto _OVER;
×
2717
      }
2718
      if (!mndIsDnodeOnline(pOld2, curMs)) {
16!
2719
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2720
        goto _OVER;
×
2721
      }
2722
    }
2723

2724
    if (oldDnodeId[2] != 0) {
40✔
2725
      pOld3 = mndAcquireDnode(pMnode, oldDnodeId[2]);
8✔
2726
      if (pOld3 == NULL) {
8!
2727
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2728
        if (terrno != 0) code = terrno;
×
2729
        goto _OVER;
×
2730
      }
2731
      if (!mndIsDnodeOnline(pOld3, curMs)) {
8!
2732
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2733
        goto _OVER;
×
2734
      }
2735
    }
2736

2737
    if (pNew1 == NULL && pOld1 == NULL && pNew2 == NULL && pOld2 == NULL && pNew3 == NULL && pOld3 == NULL) {
40!
2738
      // terrno = TSDB_CODE_MND_VGROUP_UN_CHANGED;
2739
      code = 0;
1✔
2740
      goto _OVER;
1✔
2741
    }
2742

2743
    code = mndRedistributeVgroup(pMnode, pReq, pDb, pVgroup, pNew1, pOld1, pNew2, pOld2, pNew3, pOld3);
39✔
2744

2745
  } else {
2746
    code = TSDB_CODE_MND_REQ_REJECTED;
×
2747
    goto _OVER;
×
2748
  }
2749

2750
  if (code == 0) code = TSDB_CODE_ACTION_IN_PROGRESS;
79✔
2751

2752
  char obj[33] = {0};
79✔
2753
  (void)tsnprintf(obj, sizeof(obj), "%d", req.vgId);
79✔
2754

2755
  auditRecord(pReq, pMnode->clusterId, "RedistributeVgroup", "", obj, req.sql, req.sqlLen);
79✔
2756

2757
_OVER:
95✔
2758
  if (code != 0 && code != TSDB_CODE_ACTION_IN_PROGRESS) {
95✔
2759
    mError("vgId:%d, failed to redistribute to dnode %d:%d:%d since %s", req.vgId, req.dnodeId1, req.dnodeId2,
16!
2760
           req.dnodeId3, tstrerror(code));
2761
  }
2762

2763
  mndReleaseDnode(pMnode, pNew1);
95✔
2764
  mndReleaseDnode(pMnode, pNew2);
95✔
2765
  mndReleaseDnode(pMnode, pNew3);
95✔
2766
  mndReleaseDnode(pMnode, pOld1);
95✔
2767
  mndReleaseDnode(pMnode, pOld2);
95✔
2768
  mndReleaseDnode(pMnode, pOld3);
95✔
2769
  mndReleaseVgroup(pMnode, pVgroup);
95✔
2770
  mndReleaseDb(pMnode, pDb);
95✔
2771
  tFreeSRedistributeVgroupReq(&req);
95✔
2772

2773
  TAOS_RETURN(code);
95✔
2774
}
2775

2776
/*
 * Allocate and fill a force-become-follower request for `pVgroup`.
 *
 * The returned buffer is an SMsgHead (contLen and vgId stored via htonl)
 * followed by the serialized SForceBecomeFollowerReq. `*pContLen` receives
 * the total buffer size and is written only on success. `pMnode` and
 * `dnodeId` are not used by this function.
 *
 * Returns the buffer (allocated with taosMemoryMalloc; the caller owns it),
 * or NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY on failure.
 */
static void *mndBuildSForceBecomeFollowerReq(SMnode *pMnode, SVgObj *pVgroup, int32_t dnodeId, int32_t *pContLen) {
  SForceBecomeFollowerReq balanceReq = {
      .vgId = pVgroup->vgId,
  };

  // first pass with a NULL buffer only measures the serialized body
  int32_t bodyLen = tSerializeSForceBecomeFollowerReq(NULL, 0, &balanceReq);
  if (bodyLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  int32_t contLen = bodyLen + (int32_t)sizeof(SMsgHead);

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  SMsgHead *pHead = pReq;
  pHead->contLen = htonl(contLen);
  pHead->vgId = htonl(pVgroup->vgId);

  // The body starts after the header, so only bodyLen bytes remain in the
  // allocation; passing contLen here would overstate the space available.
  if (tSerializeSForceBecomeFollowerReq((char *)pReq + sizeof(SMsgHead), bodyLen, &balanceReq) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    taosMemoryFree(pReq);
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
2806

2807
/*
 * Append to `pTrans` a redo action of type TDMT_SYNC_FORCE_FOLLOWER for
 * `pVgroup`, addressed to dnode `dnodeId`.
 *
 * The dnode is held only long enough to copy its endpoint set. On success the
 * request buffer stays attached to the appended action; if appending fails it
 * is freed here.
 *
 * Returns 0 on success, otherwise an error code.
 */
int32_t mndAddBalanceVgroupLeaderAction(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, int32_t dnodeId) {
  int32_t code = 0;

  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  // copy the endpoint set, then let go of the dnode straight away
  STransAction action = {0};
  action.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t msgLen = 0;
  void   *pMsg = mndBuildSForceBecomeFollowerReq(pMnode, pVgroup, dnodeId, &msgLen);
  if (pMsg == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  action.msgType = TDMT_SYNC_FORCE_FOLLOWER;
  action.contLen = msgLen;
  action.pCont = pMsg;

  code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    // the action was not appended, so the buffer is still ours to free
    taosMemoryFree(pMsg);
  }

  TAOS_RETURN(code);
}
2839

2840
/*
 * Append a leader-balance action for `pVgroup` to `pTrans`.
 *
 * The target is the dnode of the first replica whose syncState is
 * TAOS_SYNC_STATE_LEADER (dnode id 0 is used when no replica is leader). The
 * action is appended only when that dnode can be acquired and is online;
 * otherwise the situation is logged and 0 is returned.
 *
 * Returns -1 when the vgroup has at most one replica, 0 when the action was
 * added or skipped, otherwise an error code. A missing database is reported
 * as an error even though the action has already been appended by then.
 */
int32_t mndAddVgroupBalanceToTrans(SMnode *pMnode, SVgObj *pVgroup, STrans *pTrans) {
  int32_t code = 0;
  SSdb   *pSdb = pMnode->pSdb;  // not used below

  int32_t vgid = pVgroup->vgId;
  int8_t  replica = pVgroup->replica;

  if (pVgroup->replica <= 1) {
    mInfo("trans:%d, vgid:%d no need to balance, replica:%d", pTrans->id, vgid, replica);
    return -1;
  }

  // pick the dnode of the first replica currently reported as leader
  int32_t dnodeId = 0;
  for (int idx = 0; idx < replica; idx++) {
    SVnodeGid *pMember = &pVgroup->vnodeGid[idx];
    if (pMember->syncState == TAOS_SYNC_STATE_LEADER) {
      dnodeId = pMember->dnodeId;
      break;
    }
  }

  int64_t    curMs = taosGetTimestampMs();
  SDnodeObj *pDnode = mndAcquireDnode(pMnode, dnodeId);
  bool       exist = (pDnode != NULL);
  bool       online = false;
  if (exist) {
    online = mndIsDnodeOnline(pDnode, curMs);
    mndReleaseDnode(pMnode, pDnode);
  }

  if (!exist || !online) {
    mInfo("trans:%d, vgid:%d cant be balanced to dnode:%d, exist:%d, online:%d", pTrans->id, vgid, dnodeId, exist,
          online);
    TAOS_RETURN(code);
  }

  mInfo("trans:%d, vgid:%d leader to dnode:%d", pTrans->id, vgid, dnodeId);

  code = mndAddBalanceVgroupLeaderAction(pMnode, pTrans, pVgroup, dnodeId);
  if (code != 0) {
    mError("trans:%d, vgid:%d failed to be balanced to dnode:%d", pTrans->id, vgid, dnodeId);
    TAOS_RETURN(code);
  }

  // the db is acquired only to verify that it exists; it is released right away
  SDbObj *pDb = mndAcquireDb(pMnode, pVgroup->dbName);
  if (pDb == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    mError("trans:%d, vgid:%d failed to be balanced to dnode:%d, because db not exist", pTrans->id, vgid, dnodeId);
    TAOS_RETURN(code);
  }
  mndReleaseDb(pMnode, pDb);

  TAOS_RETURN(code);
}
2895

2896
// Implementation hook for the balance-vgroup-leader message. When
// TD_ENTERPRISE is not defined, the stub further down supplies it; otherwise
// the definition is expected to come from elsewhere in the build.
extern int32_t mndProcessVgroupBalanceLeaderMsgImp(SRpcMsg *pReq);

// Public entry point: forwards the request to the implementation hook and
// returns its result unchanged.
int32_t mndProcessVgroupBalanceLeaderMsg(SRpcMsg *pReq) {
  return mndProcessVgroupBalanceLeaderMsgImp(pReq);
}

#ifndef TD_ENTERPRISE
// Stub used when TD_ENTERPRISE is not defined: ignores the request and returns 0.
int32_t mndProcessVgroupBalanceLeaderMsgImp(SRpcMsg *pReq) {
  return 0;
}
#endif
2903

2904
/*
 * Re-account the memory usage of every dnode in pArray for a vgroup that changes
 * from (pOldDb, pOldVgroup) to (pNewDb, pNewVgroup).
 *
 * For each dnode the memory of the old vgroup layout is subtracted and the memory
 * of the new layout is added whenever the dnode hosts one of the vgroup's vnodes.
 * NOTE: pDnode->memUsed of the array entries is updated in place, also for dnodes
 * visited before a failure is detected.
 *
 * Returns 0 on success, or TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE as soon as one
 * dnode has no available memory left after the adjustment.
 */
static int32_t mndCheckDnodeMemory(SMnode *pMnode, SDbObj *pOldDb, SDbObj *pNewDb, SVgObj *pOldVgroup,
                                   SVgObj *pNewVgroup, SArray *pArray) {
  for (int32_t idx = 0; idx < (int32_t)taosArrayGetSize(pArray); ++idx) {
    SDnodeObj *pDnode = taosArrayGet(pArray, idx);
    int64_t    memBefore = 0;
    int64_t    memAfter = 0;
    bool       hostsVnode = false;

    mDebug("db:%s, vgId:%d, check dnode:%d, avail:%" PRId64 " used:%" PRId64, pNewVgroup->dbName, pNewVgroup->vgId,
           pDnode->id, pDnode->memAvail, pDnode->memUsed);

    // memory taken by the vgroup on this dnode under the old configuration
    for (int32_t k = 0; k < pOldVgroup->replica; ++k) {
      if (pOldVgroup->vnodeGid[k].dnodeId != pDnode->id) continue;
      memBefore = mndGetVgroupMemory(pMnode, pOldDb, pOldVgroup);
      hostsVnode = true;
    }

    // memory the vgroup will take on this dnode under the new configuration
    for (int32_t k = 0; k < pNewVgroup->replica; ++k) {
      if (pNewVgroup->vnodeGid[k].dnodeId != pDnode->id) continue;
      memAfter = mndGetVgroupMemory(pMnode, pNewDb, pNewVgroup);
      hostsVnode = true;
    }

    mDebug("db:%s, vgId:%d, memory in dnode:%d, oldUsed:%" PRId64 ", newUsed:%" PRId64, pNewVgroup->dbName,
           pNewVgroup->vgId, pDnode->id, memBefore, memAfter);

    pDnode->memUsed = pDnode->memUsed - memBefore + memAfter;

    if (pDnode->memAvail - pDnode->memUsed <= 0) {
      mError("db:%s, vgId:%d, no enough memory in dnode:%d, avail:%" PRId64 " used:%" PRId64, pNewVgroup->dbName,
             pNewVgroup->vgId, pDnode->id, pDnode->memAvail, pDnode->memUsed);
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE);
    }

    // only dnodes that actually host the vgroup are worth an info-level line
    if (hostsVnode) {
      mInfo("db:%s, vgId:%d, memory in dnode:%d, avail:%" PRId64 " used:%" PRId64, pNewVgroup->dbName, pNewVgroup->vgId,
            pDnode->id, pDnode->memAvail, pDnode->memUsed);
    }
  }

  return 0;
}
2944

2945
int32_t mndBuildAlterVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pOldDb, SDbObj *pNewDb, SVgObj *pVgroup,
733✔
2946
                                  SArray *pArray, SVgObj *pNewVgroup) {
2947
  int32_t code = 0;
733✔
2948
  memcpy(pNewVgroup, pVgroup, sizeof(SVgObj));
733✔
2949

2950
  if (pVgroup->replica <= 0 || pVgroup->replica == pNewDb->cfg.replications) {
733!
2951
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfigAction(pMnode, pTrans, pNewDb, pVgroup));
646!
2952
    TAOS_CHECK_RETURN(mndCheckDnodeMemory(pMnode, pOldDb, pNewDb, pNewVgroup, pVgroup, pArray));
646!
2953
    return 0;
646✔
2954
  }
2955

2956
  mndTransSetSerial(pTrans);
87✔
2957

2958
  if (pNewDb->cfg.replications == 3) {
87✔
2959
    mInfo("db:%s, vgId:%d, will add 2 vnodes, vn:0 dnode:%d", pVgroup->dbName, pVgroup->vgId,
83!
2960
          pVgroup->vnodeGid[0].dnodeId);
2961

2962
    // add second
2963
    if (pNewVgroup->replica == 1) {
83!
2964
      TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, pNewVgroup, pArray));
83!
2965
    }
2966

2967
    // learner stage
2968
    pNewVgroup->vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
83✔
2969
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
83✔
2970
    TAOS_CHECK_RETURN(
83!
2971
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
2972

2973
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &pNewVgroup->vnodeGid[1]));
83!
2974

2975
    // follower stage
2976
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
83✔
2977
    TAOS_CHECK_RETURN(mndAddAlterVnodeTypeAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
83!
2978
    TAOS_CHECK_RETURN(
83!
2979
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
2980

2981
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
83!
2982

2983
    // add third
2984
    if (pNewVgroup->replica == 2) {
83!
2985
      TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, pNewVgroup, pArray));
83✔
2986
    }
2987

2988
    pNewVgroup->vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
72✔
2989
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
72✔
2990
    pNewVgroup->vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_VOTER;
72✔
2991
    TAOS_CHECK_RETURN(
72!
2992
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
2993
    TAOS_CHECK_RETURN(
72!
2994
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
2995
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &pNewVgroup->vnodeGid[2]));
72!
2996

2997
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
72!
2998
  } else if (pNewDb->cfg.replications == 1) {
4!
2999
    mInfo("db:%s, vgId:%d, will remove 2 vnodes, vn:0 dnode:%d vn:1 dnode:%d vn:2 dnode:%d", pVgroup->dbName,
4!
3000
          pVgroup->vgId, pVgroup->vnodeGid[0].dnodeId, pVgroup->vnodeGid[1].dnodeId, pVgroup->vnodeGid[2].dnodeId);
3001

3002
    SVnodeGid del1 = {0};
4✔
3003
    SVnodeGid del2 = {0};
4✔
3004
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroup(pMnode, pTrans, pNewVgroup, pArray, &del1));
4!
3005
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &del1, true));
4!
3006
    TAOS_CHECK_RETURN(
4!
3007
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3008
    TAOS_CHECK_RETURN(
4!
3009
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
3010
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
4!
3011

3012
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroup(pMnode, pTrans, pNewVgroup, pArray, &del2));
4!
3013
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &del2, true));
4!
3014
    TAOS_CHECK_RETURN(
4!
3015
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3016
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
4!
3017
  } else if (pNewDb->cfg.replications == 2) {
×
3018
    mInfo("db:%s, vgId:%d, will add 1 vnode, vn:0 dnode:%d", pVgroup->dbName, pVgroup->vgId,
×
3019
          pVgroup->vnodeGid[0].dnodeId);
3020

3021
    // add second
3022
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, pNewVgroup, pArray));
×
3023

3024
    // learner stage
3025
    pNewVgroup->vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3026
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
×
3027
    TAOS_CHECK_RETURN(
×
3028
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3029

3030
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &pNewVgroup->vnodeGid[1]));
×
3031

3032
    // follower stage
3033
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3034
    TAOS_CHECK_RETURN(mndAddAlterVnodeTypeAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
×
3035
    TAOS_CHECK_RETURN(
×
3036
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3037

3038
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
×
3039
  } else {
3040
    return -1;
×
3041
  }
3042

3043
  mndSortVnodeGid(pNewVgroup);
76✔
3044

3045
  {
3046
    SSdbRaw *pVgRaw = mndVgroupActionEncode(pNewVgroup);
76✔
3047
    if (pVgRaw == NULL) {
76!
3048
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3049
      if (terrno != 0) code = terrno;
×
3050
      TAOS_RETURN(code);
×
3051
    }
3052
    if ((code = mndTransAppendCommitlog(pTrans, pVgRaw)) != 0) {
76!
3053
      sdbFreeRaw(pVgRaw);
×
3054
      TAOS_RETURN(code);
×
3055
    }
3056
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
76✔
3057
    if (code != 0) {
76!
3058
      mError("vgId:%d, failed to set raw status since %s at line:%d", pNewVgroup->vgId, tstrerror(code), __LINE__);
×
3059
      TAOS_RETURN(code);
×
3060
    }
3061
  }
3062

3063
  TAOS_RETURN(code);
76✔
3064
}
3065

3066
int32_t mndBuildRaftAlterVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pOldDb, SDbObj *pNewDb, SVgObj *pVgroup,
×
3067
                                      SArray *pArray) {
3068
  int32_t code = 0;
×
3069
  SVgObj  newVgroup = {0};
×
3070
  memcpy(&newVgroup, pVgroup, sizeof(SVgObj));
×
3071

3072
  if (pVgroup->replica <= 0 || pVgroup->replica == pNewDb->cfg.replications) {
×
3073
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfigAction(pMnode, pTrans, pNewDb, pVgroup));
×
3074
    TAOS_CHECK_RETURN(mndCheckDnodeMemory(pMnode, pOldDb, pNewDb, &newVgroup, pVgroup, pArray));
×
3075
    return 0;
×
3076
  }
3077

3078
  mndTransSetSerial(pTrans);
×
3079

3080
  mInfo("trans:%d, vgId:%d, alter vgroup, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id, pVgroup->vgId,
×
3081
        pVgroup->syncConfChangeVer, pVgroup->version, pVgroup->replica);
3082

3083
  if (newVgroup.replica == 1 && pNewDb->cfg.replications == 3) {
×
3084
    mInfo("db:%s, vgId:%d, will add 2 vnodes, vn:0 dnode:%d", pVgroup->dbName, pVgroup->vgId,
×
3085
          pVgroup->vnodeGid[0].dnodeId);
3086

3087
    // add second
3088
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVgroup, pArray));
×
3089
    // add third
3090
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVgroup, pArray));
×
3091

3092
    // add learner stage
3093
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3094
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
×
3095
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_LEARNER;
×
3096
    TAOS_CHECK_RETURN(
×
3097
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3098
    mInfo("trans:%d, vgId:%d, add change config, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id,
×
3099
          pVgroup->vgId, newVgroup.syncConfChangeVer, pVgroup->version, pVgroup->replica);
3100
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &newVgroup.vnodeGid[1]));
×
3101
    mInfo("trans:%d, vgId:%d, create vnode, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id, pVgroup->vgId,
×
3102
          newVgroup.syncConfChangeVer, pVgroup->version, pVgroup->replica);
3103
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &newVgroup.vnodeGid[2]));
×
3104
    mInfo("trans:%d, vgId:%d, create vnode, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id, pVgroup->vgId,
×
3105
          newVgroup.syncConfChangeVer, pVgroup->version, pVgroup->replica);
3106

3107
    // check learner
3108
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3109
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3110
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3111
    TAOS_CHECK_RETURN(
×
3112
        mndAddCheckLearnerCatchupAction(pMnode, pTrans, pNewDb, &newVgroup, newVgroup.vnodeGid[1].dnodeId));
3113
    TAOS_CHECK_RETURN(
×
3114
        mndAddCheckLearnerCatchupAction(pMnode, pTrans, pNewDb, &newVgroup, newVgroup.vnodeGid[2].dnodeId));
3115

3116
    // change raft type
3117
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3118
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3119
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_LEARNER;
×
3120
    TAOS_CHECK_RETURN(
×
3121
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3122

3123
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3124

3125
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3126
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3127
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3128
    TAOS_CHECK_RETURN(
×
3129
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3130

3131
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3132

3133
    SSdbRaw *pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3134
    if (pVgRaw == NULL) {
×
3135
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3136
      if (terrno != 0) code = terrno;
×
3137
      TAOS_RETURN(code);
×
3138
    }
3139
    if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
×
3140
      sdbFreeRaw(pVgRaw);
×
3141
      TAOS_RETURN(code);
×
3142
    }
3143
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3144
    if (code != 0) {
×
3145
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3146
             __LINE__);
3147
      TAOS_RETURN(code);
×
3148
    }
3149
  } else if (newVgroup.replica == 3 && pNewDb->cfg.replications == 1) {
×
3150
    mInfo("db:%s, vgId:%d, will remove 2 vnodes, vn:0 dnode:%d vn:1 dnode:%d vn:2 dnode:%d", pVgroup->dbName,
×
3151
          pVgroup->vgId, pVgroup->vnodeGid[0].dnodeId, pVgroup->vnodeGid[1].dnodeId, pVgroup->vnodeGid[2].dnodeId);
3152

3153
    SVnodeGid del1 = {0};
×
3154
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroupWithoutSave(pMnode, pTrans, &newVgroup, pArray, &del1));
×
3155

3156
    TAOS_CHECK_RETURN(
×
3157
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3158

3159
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3160

3161
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &del1, true));
×
3162

3163
    SSdbRaw *pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3164
    if (pVgRaw == NULL) {
×
3165
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3166
      if (terrno != 0) code = terrno;
×
3167
      TAOS_RETURN(code);
×
3168
    }
3169
    if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
×
3170
      sdbFreeRaw(pVgRaw);
×
3171
      TAOS_RETURN(code);
×
3172
    }
3173
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3174
    if (code != 0) {
×
3175
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3176
             __LINE__);
3177
      TAOS_RETURN(code);
×
3178
    }
3179

3180
    SVnodeGid del2 = {0};
×
3181
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroupWithoutSave(pMnode, pTrans, &newVgroup, pArray, &del2));
×
3182

3183
    TAOS_CHECK_RETURN(
×
3184
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3185

3186
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3187

3188
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &del2, true));
×
3189

3190
    pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3191
    if (pVgRaw == NULL) {
×
3192
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3193
      if (terrno != 0) code = terrno;
×
3194
      TAOS_RETURN(code);
×
3195
    }
3196
    if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
×
3197
      sdbFreeRaw(pVgRaw);
×
3198
      TAOS_RETURN(code);
×
3199
    }
3200
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3201
    if (code != 0) {
×
3202
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3203
             __LINE__);
3204
      TAOS_RETURN(code);
×
3205
    }
3206
  } else {
3207
    return -1;
×
3208
  }
3209

3210
  mndSortVnodeGid(&newVgroup);
×
3211

3212
  {
3213
    SSdbRaw *pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3214
    if (pVgRaw == NULL) {
×
3215
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3216
      if (terrno != 0) code = terrno;
×
3217
      TAOS_RETURN(code);
×
3218
    }
3219
    if ((code = mndTransAppendCommitlog(pTrans, pVgRaw)) != 0) {
×
3220
      sdbFreeRaw(pVgRaw);
×
3221
      TAOS_RETURN(code);
×
3222
    }
3223
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3224
    if (code != 0) {
×
3225
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3226
             __LINE__);
3227
      TAOS_RETURN(code);
×
3228
    }
3229
  }
3230

3231
  TAOS_RETURN(code);
×
3232
}
3233

3234
/*
 * Append to pTrans the actions that restore the vnode of pVgroup living on pDnode.
 *
 * A local copy of pVgroup is used so node roles can be adjusted between steps:
 *   - replica 1: every slot is a voter; the vnode on pDnode (slot 0 if none
 *     matches) is created again.
 *   - replica 2: the vnode on pDnode is marked learner, pAnotherDnode is altered,
 *     the vnode is re-created on pDnode, then both dnodes are altered with all
 *     slots set to voter.
 *   - replica 3: the vnode on pDnode is re-created as learner, then altered with
 *     all slots set to voter.
 * Other replica values add no restore action. In every case the copy is finally
 * appended to the commit log with status SDB_STATUS_READY.
 *
 * Returns 0 on success, otherwise the error code of the first failing step.
 */
int32_t mndBuildRestoreAlterVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *db, SVgObj *pVgroup, SDnodeObj *pDnode,
                                         SDnodeObj *pAnotherDnode) {
  int32_t code = 0;
  SVgObj  restored = {0};
  memcpy(&restored, pVgroup, sizeof(SVgObj));

  mInfo("db:%s, vgId:%d, restore vnodes, vn:0 dnode:%d", pVgroup->dbName, pVgroup->vgId, pVgroup->vnodeGid[0].dnodeId);

  switch (restored.replica) {
    case 1: {
      int target = 0;
      for (int n = 0; n < restored.replica; n++) {
        restored.vnodeGid[n].nodeRole = TAOS_SYNC_ROLE_VOTER;
        if (restored.vnodeGid[n].dnodeId == pDnode->id) target = n;
      }
      TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, db, &restored, &restored.vnodeGid[target]));
      break;
    }

    case 2: {
      // the vnode being restored is a learner, the surviving one a voter
      for (int n = 0; n < restored.replica; n++) {
        restored.vnodeGid[n].nodeRole =
            (restored.vnodeGid[n].dnodeId == pDnode->id) ? TAOS_SYNC_ROLE_LEARNER : TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &restored, pAnotherDnode));

      // same role layout is applied again before re-creating the vnode
      for (int n = 0; n < restored.replica; n++) {
        restored.vnodeGid[n].nodeRole =
            (restored.vnodeGid[n].dnodeId == pDnode->id) ? TAOS_SYNC_ROLE_LEARNER : TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddCreateVnodeAction(pMnode, pTrans, db, &restored, pDnode));

      // finally every slot becomes a voter
      for (int n = 0; n < restored.replica; n++) {
        restored.vnodeGid[n].nodeRole = TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &restored, pDnode));
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &restored, pAnotherDnode));
      break;
    }

    case 3: {
      for (int n = 0; n < restored.replica; n++) {
        restored.vnodeGid[n].nodeRole =
            (restored.vnodeGid[n].dnodeId == pDnode->id) ? TAOS_SYNC_ROLE_LEARNER : TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddCreateVnodeAction(pMnode, pTrans, db, &restored, pDnode));

      for (int n = 0; n < restored.replica; n++) {
        restored.vnodeGid[n].nodeRole = TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &restored, pDnode));
      break;
    }

    default:
      break;
  }

  SSdbRaw *pCommitRaw = mndVgroupActionEncode(&restored);
  if (pCommitRaw == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  code = mndTransAppendCommitlog(pTrans, pCommitRaw);
  if (code != 0) {
    sdbFreeRaw(pCommitRaw);
    TAOS_RETURN(code);
  }

  code = sdbSetRawStatus(pCommitRaw, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", restored.vgId, tstrerror(code), __LINE__);
  }

  TAOS_RETURN(code);
}
3312

3313
// Placeholder: currently adds no action to the transaction and always reports success.
static int32_t mndAddAdjustVnodeHashRangeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup) {
  (void)pMnode;
  (void)pTrans;
  (void)pDb;
  (void)pVgroup;
  return 0;
}
3316

3317
// Function-pointer type for appending an encoded raw record to a transaction; it lets
// callers choose between mndTransAppendCommitlog and mndTransAppendRedolog at run time.
typedef int32_t (*FpTransActionCb)(STrans *pTrans, SSdbRaw *pRaw);
3318

3319
/*
 * Encode pVg and append it to pTrans with the given sdb status.
 *
 * stage selects the log: TRN_STAGE_COMMIT_ACTION appends to the commit log, any
 * other value appends to the redo log.
 *
 * Ownership: the encoded raw is freed here only while it has not been appended.
 * Once the append succeeds the raw is treated as belonging to pTrans (the success
 * path never frees it, and the other builders in this file follow the same rule),
 * so it must NOT be freed if sdbSetRawStatus fails afterwards; freeing it there
 * would leave a dangling pointer inside the transaction.
 *
 * Returns 0 on success, otherwise the error code of the failing step.
 */
static int32_t mndAddVgStatusAction(STrans *pTrans, SVgObj *pVg, ESdbStatus vgStatus, ETrnStage stage) {
  int32_t         code = 0;
  FpTransActionCb appendActionCb = (stage == TRN_STAGE_COMMIT_ACTION) ? mndTransAppendCommitlog : mndTransAppendRedolog;
  SSdbRaw        *pRaw = mndVgroupActionEncode(pVg);
  if (pRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  if ((code = appendActionCb(pTrans, pRaw)) != 0) {
    // not appended: the raw is still ours to release
    sdbFreeRaw(pRaw);
    TAOS_RETURN(code);
  }

  // from here on the raw is referenced by pTrans; report failures without freeing it
  code = sdbSetRawStatus(pRaw, vgStatus);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", pVg->vgId, tstrerror(code), __LINE__);
  }
  TAOS_RETURN(code);
}
3340

3341
/*
 * Encode pDb and append it to pTrans with the given sdb status.
 *
 * stage selects the log: TRN_STAGE_COMMIT_ACTION appends to the commit log, any
 * other value appends to the redo log.
 *
 * Ownership: the encoded raw is freed here only while it has not been appended.
 * Once the append succeeds the raw is treated as belonging to pTrans (the success
 * path never frees it), so it must NOT be freed if sdbSetRawStatus fails
 * afterwards; freeing it there would leave a dangling pointer inside the
 * transaction.
 *
 * Returns 0 on success, otherwise the error code of the failing step.
 */
static int32_t mndAddDbStatusAction(STrans *pTrans, SDbObj *pDb, ESdbStatus dbStatus, ETrnStage stage) {
  int32_t         code = 0;
  FpTransActionCb appendActionCb = (stage == TRN_STAGE_COMMIT_ACTION) ? mndTransAppendCommitlog : mndTransAppendRedolog;
  SSdbRaw        *pRaw = mndDbActionEncode(pDb);
  if (pRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  if ((code = appendActionCb(pTrans, pRaw)) != 0) {
    // not appended: the raw is still ours to release
    sdbFreeRaw(pRaw);
    TAOS_RETURN(code);
  }

  // from here on the raw is referenced by pTrans; report failures without freeing it
  code = sdbSetRawStatus(pRaw, dbStatus);
  if (code != 0) {
    mError("db:%s, failed to set raw status to ready, error:%s, line:%d", pDb->name, tstrerror(code), __LINE__);
  }
  TAOS_RETURN(code);
}
3362

3363
/*
 * Build and prepare the "split-vgroup" transaction that splits pVgroup of pDb into
 * two new vgroups, each covering half of the original hash range.
 *
 * Outline:
 *   1. Refuse when the db still has streams, when S3 is enabled (USE_S3 builds) or
 *      when the db uses an arbitrator.
 *   2. Bring the source vgroup to exactly two vnodes (add one for replica 1, drop
 *      one for replica 3) and disable writes on them. Any other replica count is
 *      rejected with TSDB_CODE_OPS_NOT_SUPPORT.
 *   3. Derive two single-replica vgroups from the two vnodes, give them new vgIds
 *      and the lower/upper half of the hash range.
 *   4. Record the new vgroups, the dropped source vgroup and the updated db in the
 *      redo log, adjust each new vgroup to the db's replication factor, then record
 *      the final state in the commit log.
 *
 * The dnode array, the transaction object and the duplicated retention array are
 * released on every exit path.
 *
 * Returns 0 when the transaction was prepared, otherwise an error code.
 */
int32_t mndSplitVgroup(SMnode *pMnode, SRpcMsg *pReq, SDbObj *pDb, SVgObj *pVgroup) {
  int32_t code = -1;
  STrans *pTrans = NULL;
  SDbObj  dbObj = {0};
  SArray *pArray = mndBuildDnodesArray(pMnode, 0, NULL);

  int32_t numOfStreams = 0;

  // NOTE(review): assumes mndBuildDnodesArray returns NULL only on failure and sets terrno - confirm
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  if ((code = mndGetNumOfStreams(pMnode, pDb->name, &numOfStreams)) != 0) {
    goto _OVER;
  }
  if (numOfStreams > 0) {
    code = TSDB_CODE_MND_STREAM_MUST_BE_DELETED;
    goto _OVER;
  }

#if defined(USE_S3)
  extern int8_t tsS3Enabled;
  if (tsS3Enabled) {
    code = TSDB_CODE_OPS_NOT_SUPPORT;
    mError("vgId:%d, db:%s, s3 exists, split vgroup not allowed", pVgroup->vgId, pVgroup->dbName);
    goto _OVER;
  }
#endif

  if (pDb->cfg.withArbitrator) {
    code = TSDB_CODE_OPS_NOT_SUPPORT;
    mError("vgId:%d, db:%s, with arbitrator, split vgroup not allowed", pVgroup->vgId, pVgroup->dbName);
    goto _OVER;
  }

  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_DB, pReq, "split-vgroup");
  if (pTrans == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }
  mndTransSetSerial(pTrans);
  mInfo("trans:%d, used to split vgroup, vgId:%d", pTrans->id, pVgroup->vgId);

  mndTransSetDbName(pTrans, pDb->name, NULL);
  TAOS_CHECK_GOTO(mndTransCheckConflictWithCompact(pMnode, pTrans), NULL, _OVER);

  SVgObj newVg1 = {0};
  memcpy(&newVg1, pVgroup, sizeof(SVgObj));
  mInfo("vgId:%d, vgroup info before split, replica:%d hashBegin:%u hashEnd:%u", newVg1.vgId, newVg1.replica,
        newVg1.hashBegin, newVg1.hashEnd);
  for (int32_t i = 0; i < newVg1.replica; ++i) {
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg1.vgId, i, newVg1.vnodeGid[i].dnodeId);
  }

  // step 2: end up with exactly two vnodes in newVg1
  if (newVg1.replica == 1) {
    TAOS_CHECK_GOTO(mndAddVnodeToVgroup(pMnode, pTrans, &newVg1, pArray), NULL, _OVER);

    newVg1.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[0].dnodeId), NULL,
                    _OVER);
    TAOS_CHECK_GOTO(mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg1, &newVg1.vnodeGid[1]), NULL, _OVER);

    newVg1.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
    TAOS_CHECK_GOTO(mndAddAlterVnodeTypeAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[1].dnodeId), NULL, _OVER);
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[0].dnodeId), NULL,
                    _OVER);

    TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg1), NULL, _OVER);
  } else if (newVg1.replica == 3) {
    SVnodeGid del1 = {0};
    TAOS_CHECK_GOTO(mndRemoveVnodeFromVgroup(pMnode, pTrans, &newVg1, pArray, &del1), NULL, _OVER);
    TAOS_CHECK_GOTO(mndAddDropVnodeAction(pMnode, pTrans, pDb, &newVg1, &del1, true), NULL, _OVER);
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[0].dnodeId), NULL,
                    _OVER);
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[1].dnodeId), NULL,
                    _OVER);
  } else {
    // code is 0 here (last successful check); set an explicit error so the caller
    // is not told the split succeeded when no transaction was prepared
    code = TSDB_CODE_OPS_NOT_SUPPORT;
    mError("vgId:%d, db:%s, replica:%d not supported, split vgroup not allowed", pVgroup->vgId, pVgroup->dbName,
           newVg1.replica);
    goto _OVER;
  }

  for (int32_t i = 0; i < newVg1.replica; ++i) {
    TAOS_CHECK_GOTO(mndAddDisableVnodeWriteAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[i].dnodeId), NULL,
                    _OVER);
  }
  TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg1), NULL, _OVER);

  // step 3: newVg1 keeps vnode 0 and the lower half, newVg2 takes vnode 1 and the upper half
  SVgObj newVg2 = {0};
  memcpy(&newVg2, &newVg1, sizeof(SVgObj));
  newVg1.replica = 1;
  newVg1.hashEnd = newVg1.hashBegin / 2 + newVg1.hashEnd / 2;
  memset(&newVg1.vnodeGid[1], 0, sizeof(SVnodeGid));

  newVg2.replica = 1;
  newVg2.hashBegin = newVg1.hashEnd + 1;
  memcpy(&newVg2.vnodeGid[0], &newVg2.vnodeGid[1], sizeof(SVnodeGid));
  memset(&newVg2.vnodeGid[1], 0, sizeof(SVnodeGid));

  mInfo("vgId:%d, vgroup info after split, replica:%d hashrange:[%u, %u] vnode:0 dnode:%d", newVg1.vgId, newVg1.replica,
        newVg1.hashBegin, newVg1.hashEnd, newVg1.vnodeGid[0].dnodeId);
  for (int32_t i = 0; i < newVg1.replica; ++i) {
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg1.vgId, i, newVg1.vnodeGid[i].dnodeId);
  }
  mInfo("vgId:%d, vgroup info after split, replica:%d hashrange:[%u, %u] vnode:0 dnode:%d", newVg2.vgId, newVg2.replica,
        newVg2.hashBegin, newVg2.hashEnd, newVg2.vnodeGid[0].dnodeId);
  for (int32_t i = 0; i < newVg2.replica; ++i) {
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg2.vgId, i, newVg2.vnodeGid[i].dnodeId);
  }

  // alter vgId and hash range
  int32_t maxVgId = sdbGetMaxId(pMnode->pSdb, SDB_VGROUP);
  int32_t srcVgId = newVg1.vgId;
  newVg1.vgId = maxVgId;
  TAOS_CHECK_GOTO(mndAddNewVgPrepareAction(pMnode, pTrans, &newVg1), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddAlterVnodeHashRangeAction(pMnode, pTrans, srcVgId, &newVg1), NULL, _OVER);

  maxVgId++;
  srcVgId = newVg2.vgId;
  newVg2.vgId = maxVgId;
  TAOS_CHECK_GOTO(mndAddNewVgPrepareAction(pMnode, pTrans, &newVg2), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddAlterVnodeHashRangeAction(pMnode, pTrans, srcVgId, &newVg2), NULL, _OVER);

  TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg1), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg2), NULL, _OVER);

  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg1, SDB_STATUS_READY, TRN_STAGE_REDO_ACTION), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg2, SDB_STATUS_READY, TRN_STAGE_REDO_ACTION), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, pVgroup, SDB_STATUS_DROPPED, TRN_STAGE_REDO_ACTION), NULL, _OVER);

  // update db status
  memcpy(&dbObj, pDb, sizeof(SDbObj));
  if (dbObj.cfg.pRetensions != NULL) {
    // the byte copy shares pDb's array; duplicate it so the cleanup below only frees our own copy
    dbObj.cfg.pRetensions = taosArrayDup(pDb->cfg.pRetensions, NULL);
    if (dbObj.cfg.pRetensions == NULL) {
      code = terrno;
      goto _OVER;
    }
  }
  dbObj.vgVersion++;
  dbObj.updateTime = taosGetTimestampMs();
  dbObj.cfg.numOfVgroups++;
  TAOS_CHECK_GOTO(mndAddDbStatusAction(pTrans, &dbObj, SDB_STATUS_READY, TRN_STAGE_REDO_ACTION), NULL, _OVER);

  // adjust vgroup replica
  if (pDb->cfg.replications != newVg1.replica) {
    SVgObj tmpGroup = {0};
    TAOS_CHECK_GOTO(mndBuildAlterVgroupAction(pMnode, pTrans, pDb, pDb, &newVg1, pArray, &tmpGroup), NULL, _OVER);
  } else {
    TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg1, SDB_STATUS_READY, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);
  }

  if (pDb->cfg.replications != newVg2.replica) {
    SVgObj tmpGroup = {0};
    TAOS_CHECK_GOTO(mndBuildAlterVgroupAction(pMnode, pTrans, pDb, pDb, &newVg2, pArray, &tmpGroup), NULL, _OVER);
  } else {
    TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg2, SDB_STATUS_READY, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);
  }

  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, pVgroup, SDB_STATUS_DROPPED, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);

  // commit db status
  dbObj.vgVersion++;
  dbObj.updateTime = taosGetTimestampMs();
  TAOS_CHECK_GOTO(mndAddDbStatusAction(pTrans, &dbObj, SDB_STATUS_READY, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);

  TAOS_CHECK_GOTO(mndTransPrepare(pMnode, pTrans), NULL, _OVER);
  code = 0;

_OVER:
  taosArrayDestroy(pArray);
  mndTransDrop(pTrans);
  taosArrayDestroy(dbObj.cfg.pRetensions);
  TAOS_RETURN(code);
}
3532

3533
// Declared here, defined either by the fallback below or (presumably) by another
// translation unit when TD_ENTERPRISE is defined.
extern int32_t mndProcessSplitVgroupMsgImp(SRpcMsg *pReq);

// Handler for the split-vgroup request; forwards the request to the Imp function unchanged.
static int32_t mndProcessSplitVgroupMsg(SRpcMsg *pReq) {
  int32_t code = mndProcessSplitVgroupMsgImp(pReq);
  return code;
}

#ifndef TD_ENTERPRISE
// Fallback used when TD_ENTERPRISE is not defined: ignores the request and reports success.
int32_t mndProcessSplitVgroupMsgImp(SRpcMsg *pReq) {
  (void)pReq;
  return 0;
}
#endif
3540

3541
// Append to pTrans the actions that move one replica of pVgroup from dnode pSrc to dnode pDst.
//
// Works on a local copy of *pVgroup: a replica is first added on pDst->id, then removed from
// pSrc->id, and finally the resulting vgroup object is encoded and appended to the trans as a
// commit log with status SDB_STATUS_READY. The replica layout is logged before and after.
//
// Returns 0 on success, otherwise the error code of the step that failed.
static int32_t mndSetBalanceVgroupInfoToTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                              SDnodeObj *pSrc, SDnodeObj *pDst) {
  int32_t code = 0;
  SVgObj  newVg = {0};
  memcpy(&newVg, pVgroup, sizeof(newVg));

  mInfo("vgId:%d, vgroup info before balance, replica:%d", newVg.vgId, newVg.replica);
  for (int32_t idx = 0; idx < newVg.replica; ++idx) {
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg.vgId, idx, newVg.vnodeGid[idx].dnodeId);
  }

  // grow onto the destination first, then shrink away from the source
  TAOS_CHECK_RETURN(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &newVg, pDst->id));
  TAOS_CHECK_RETURN(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &newVg, pSrc->id));

  SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
  if (pRaw == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  code = mndTransAppendCommitlog(pTrans, pRaw);
  if (code != 0) {
    // the raw object is only freed here when the append itself failed
    sdbFreeRaw(pRaw);
    TAOS_RETURN(code);
  }

  // NOTE(review): pRaw is not freed past this point, presumably because the trans owns it
  // after a successful append - confirm against mndTransAppendCommitlog.
  code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVg.vgId, tstrerror(code), __LINE__);
    TAOS_RETURN(code);
  }

  mInfo("vgId:%d, vgroup info after balance, replica:%d", newVg.vgId, newVg.replica);
  for (int32_t idx = 0; idx < newVg.replica; ++idx) {
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg.vgId, idx, newVg.vnodeGid[idx].dnodeId);
  }
  TAOS_RETURN(code);
}
3578

3579
static int32_t mndBalanceVgroupBetweenDnode(SMnode *pMnode, STrans *pTrans, SDnodeObj *pSrc, SDnodeObj *pDst,
24✔
3580
                                            SHashObj *pBalancedVgroups) {
3581
  void   *pIter = NULL;
24✔
3582
  int32_t code = -1;
24✔
3583
  SSdb   *pSdb = pMnode->pSdb;
24✔
3584

3585
  while (1) {
16✔
3586
    SVgObj *pVgroup = NULL;
40✔
3587
    pIter = sdbFetch(pSdb, SDB_VGROUP, pIter, (void **)&pVgroup);
40✔
3588
    if (pIter == NULL) break;
40!
3589
    if (taosHashGet(pBalancedVgroups, &pVgroup->vgId, sizeof(int32_t)) != NULL) {
40✔
3590
      sdbRelease(pSdb, pVgroup);
15✔
3591
      continue;
16✔
3592
    }
3593

3594
    bool existInSrc = false;
25✔
3595
    bool existInDst = false;
25✔
3596
    for (int32_t i = 0; i < pVgroup->replica; ++i) {
70✔
3597
      SVnodeGid *pGid = &pVgroup->vnodeGid[i];
45✔
3598
      if (pGid->dnodeId == pSrc->id) existInSrc = true;
45✔
3599
      if (pGid->dnodeId == pDst->id) existInDst = true;
45!
3600
    }
3601

3602
    if (!existInSrc || existInDst) {
25!
3603
      sdbRelease(pSdb, pVgroup);
1✔
3604
      continue;
1✔
3605
    }
3606

3607
    SDbObj *pDb = mndAcquireDb(pMnode, pVgroup->dbName);
24✔
3608
    if (pDb == NULL) {
24!
3609
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3610
      if (terrno != 0) code = terrno;
×
3611
      mError("vgId:%d, balance vgroup can't find db obj dbName:%s", pVgroup->vgId, pVgroup->dbName);
×
3612
      goto _OUT;
×
3613
    }
3614

3615
    if (pDb->cfg.withArbitrator) {
24!
3616
      mInfo("vgId:%d, db:%s, with arbitrator, balance vgroup not allowed", pVgroup->vgId, pVgroup->dbName);
×
3617
      goto _OUT;
×
3618
    }
3619

3620
    code = mndSetBalanceVgroupInfoToTrans(pMnode, pTrans, pDb, pVgroup, pSrc, pDst);
24✔
3621
    if (code == 0) {
24!
3622
      code = taosHashPut(pBalancedVgroups, &pVgroup->vgId, sizeof(int32_t), &pVgroup->vgId, sizeof(int32_t));
24✔
3623
    }
3624

3625
  _OUT:
×
3626
    mndReleaseDb(pMnode, pDb);
24✔
3627
    sdbRelease(pSdb, pVgroup);
24✔
3628
    sdbCancelFetch(pSdb, pIter);
24✔
3629
    break;
24✔
3630
  }
3631

3632
  return code;
24✔
3633
}
3634

3635
// Build and prepare one "balance-vgroup" transaction over the dnodes in pArray.
//
// Each round sorts pArray with mndCompareDnodeVnodes, takes the last entry as the source
// dnode and the first entry as the destination, and compares the scores the two would have
// after moving one vnode. While the source score stays above the destination score (minus a
// small epsilon) one vgroup is moved via mndBalanceVgroupBetweenDnode and the in-memory vnode
// counters of both dnodes are adjusted. The loop ends when the scores no longer justify a move
// or when no movable vgroup is found.
//
// pArray is expected to hold at least two dnodes (the first and last elements are used).
//
// Returns 0 when nothing had to be moved, TSDB_CODE_ACTION_IN_PROGRESS when the transaction
// was prepared, or an error code.
static int32_t mndBalanceVgroup(SMnode *pMnode, SRpcMsg *pReq, SArray *pArray) {
  int32_t   code = -1;
  int32_t   numOfVgroups = 0;
  STrans   *pTrans = NULL;
  SHashObj *pBalancedVgroups = NULL;

  pBalancedVgroups = taosHashInit(16, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT), false, HASH_NO_LOCK);
  if (pBalancedVgroups == NULL) {
    // report a real error code rather than the -1 placeholder
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_GLOBAL, pReq, "balance-vgroup");
  if (pTrans == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }
  mndTransSetSerial(pTrans);
  mInfo("trans:%d, used to balance vgroup", pTrans->id);
  TAOS_CHECK_GOTO(mndTransCheckConflict(pMnode, pTrans), NULL, _OVER);
  TAOS_CHECK_GOTO(mndTransCheckConflictWithCompact(pMnode, pTrans), NULL, _OVER);

  while (1) {
    taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
    for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
      SDnodeObj *pDnode = taosArrayGet(pArray, i);
      // arguments follow the label order of the format string: vnodes, others, support
      mInfo("dnode:%d, equivalent vnodes:%d others:%d support:%d, score:%f", pDnode->id, pDnode->numOfVnodes,
            pDnode->numOfOtherNodes, pDnode->numOfSupportVnodes, mndGetDnodeScore(pDnode, 0, 1));
    }

    SDnodeObj *pSrc = taosArrayGet(pArray, taosArrayGetSize(pArray) - 1);
    SDnodeObj *pDst = taosArrayGet(pArray, 0);

    // scores as they would be after moving one vnode from pSrc to pDst
    float srcScore = mndGetDnodeScore(pSrc, -1, 1);
    float dstScore = mndGetDnodeScore(pDst, 1, 1);
    mInfo("trans:%d, after balance, src dnode:%d score:%f, dst dnode:%d score:%f", pTrans->id, pSrc->id, srcScore,
          pDst->id, dstScore);

    if (srcScore > dstScore - 0.000001) {
      code = mndBalanceVgroupBetweenDnode(pMnode, pTrans, pSrc, pDst, pBalancedVgroups);
      if (code == 0) {
        pSrc->numOfVnodes--;
        pDst->numOfVnodes++;
        numOfVgroups++;
        continue;
      } else {
        mInfo("trans:%d, no vgroup need to balance from dnode:%d to dnode:%d", pTrans->id, pSrc->id, pDst->id);
        break;
      }
    } else {
      mInfo("trans:%d, no vgroup need to balance any more", pTrans->id);
      break;
    }
  }

  if (numOfVgroups <= 0) {
    mInfo("no need to balance vgroup");
    code = 0;
  } else {
    mInfo("start to balance vgroup, numOfVgroups:%d", numOfVgroups);
    // keep the prepare result: otherwise a failure here could leave code == 0 from the last
    // successful move and be reported to the caller as success
    code = mndTransPrepare(pMnode, pTrans);
    if (code != 0) goto _OVER;
    code = TSDB_CODE_ACTION_IN_PROGRESS;
  }

_OVER:
  taosHashCleanup(pBalancedVgroups);
  mndTransDrop(pTrans);
  TAOS_RETURN(code);
}
3702

3703
// Handle a balance-vgroup request.
//
// Steps: deserialize the request, check the MND_OPER_BALANCE_VGROUP privilege for the calling
// user, refuse to run while any dnode is offline, build the dnode array and, when it holds at
// least two dnodes, run mndBalanceVgroup on it. An audit record is written once the dnode
// array has been built.
//
// Returns 0 when there was nothing to do, TSDB_CODE_ACTION_IN_PROGRESS when a balance
// transaction was started, or an error code (TSDB_CODE_INVALID_MSG,
// TSDB_CODE_MND_HAS_OFFLINE_DNODE, a privilege error, ...).
static int32_t mndProcessBalanceVgroupMsg(SRpcMsg *pReq) {
  SMnode *pMnode = pReq->info.node;
  int32_t code = -1;
  SArray *pArray = NULL;
  void   *pIter = NULL;
  int64_t curMs = taosGetTimestampMs();

  SBalanceVgroupReq req = {0};
  if (tDeserializeSBalanceVgroupReq(pReq->pCont, pReq->contLen, &req) != 0) {
    code = TSDB_CODE_INVALID_MSG;
    goto _OVER;
  }

  mInfo("start to balance vgroup");
  if ((code = mndCheckOperPrivilege(pMnode, pReq->info.conn.user, MND_OPER_BALANCE_VGROUP)) != 0) {
    goto _OVER;
  }

  // every dnode must be online before vnodes are moved around
  while (1) {
    SDnodeObj *pDnode = NULL;
    pIter = sdbFetch(pMnode->pSdb, SDB_DNODE, pIter, (void **)&pDnode);
    if (pIter == NULL) break;
    if (!mndIsDnodeOnline(pDnode, curMs)) {
      sdbCancelFetch(pMnode->pSdb, pIter);
      code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
      // only the local code is set on this path, so format it directly instead of terrno
      mError("failed to balance vgroup since %s, dnode:%d", tstrerror(code), pDnode->id);
      sdbRelease(pMnode->pSdb, pDnode);
      goto _OVER;
    }

    sdbRelease(pMnode->pSdb, pDnode);
  }

  pArray = mndBuildDnodesArray(pMnode, 0, NULL);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  if (taosArrayGetSize(pArray) < 2) {
    mInfo("no need to balance vgroup since dnode num less than 2");
    code = 0;
  } else {
    code = mndBalanceVgroup(pMnode, pReq, pArray);
  }

  auditRecord(pReq, pMnode->clusterId, "balanceVgroup", "", "", req.sql, req.sqlLen);

_OVER:
  if (code != 0 && code != TSDB_CODE_ACTION_IN_PROGRESS) {
    mError("failed to balance vgroup since %s", tstrerror(code));
  }

  taosArrayDestroy(pArray);
  tFreeSBalanceVgroupReq(&req);
  TAOS_RETURN(code);
}
3761

3762
// True when pVgroup is not flagged isTsma and its dbUid equals dbUid.
bool mndVgroupInDb(SVgObj *pVgroup, int64_t dbUid) {
  if (pVgroup->isTsma) {
    return false;
  }
  return pVgroup->dbUid == dbUid;
}
3763

3764
// True when one of the first pVgroup->replica entries of vnodeGid is placed on dnodeId.
bool mndVgroupInDnode(SVgObj *pVgroup, int32_t dnodeId) {
  bool found = false;
  for (int idx = 0; !found && idx < pVgroup->replica; idx++) {
    found = (pVgroup->vnodeGid[idx].dnodeId == dnodeId);
  }
  return found;
}
3770

3771
static void *mndBuildCompactVnodeReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen, int64_t compactTs,
51✔
3772
                                     STimeWindow tw, bool metaOnly) {
3773
  SCompactVnodeReq compactReq = {0};
51✔
3774
  compactReq.dbUid = pDb->uid;
51✔
3775
  compactReq.compactStartTime = compactTs;
51✔
3776
  compactReq.tw = tw;
51✔
3777
  compactReq.metaOnly = metaOnly;
51✔
3778
  tstrncpy(compactReq.db, pDb->name, TSDB_DB_FNAME_LEN);
51✔
3779

3780
  mInfo("vgId:%d, build compact vnode config req", pVgroup->vgId);
51!
3781
  int32_t contLen = tSerializeSCompactVnodeReq(NULL, 0, &compactReq);
51✔
3782
  if (contLen < 0) {
51!
3783
    terrno = TSDB_CODE_OUT_OF_MEMORY;
×
3784
    return NULL;
×
3785
  }
3786
  contLen += sizeof(SMsgHead);
51✔
3787

3788
  void *pReq = taosMemoryMalloc(contLen);
51!
3789
  if (pReq == NULL) {
51!
3790
    terrno = TSDB_CODE_OUT_OF_MEMORY;
×
3791
    return NULL;
×
3792
  }
3793

3794
  SMsgHead *pHead = pReq;
51✔
3795
  pHead->contLen = htonl(contLen);
51✔
3796
  pHead->vgId = htonl(pVgroup->vgId);
51✔
3797

3798
  if (tSerializeSCompactVnodeReq((char *)pReq + sizeof(SMsgHead), contLen, &compactReq) < 0) {
51!
3799
    taosMemoryFree(pReq);
×
3800
    terrno = TSDB_CODE_OUT_OF_MEMORY;
×
3801
    return NULL;
×
3802
  }
3803
  *pContLen = contLen;
51✔
3804
  return pReq;
51✔
3805
}
3806

3807
static int32_t mndAddCompactVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int64_t compactTs,
51✔
3808
                                        STimeWindow tw, bool metaOnly) {
3809
  int32_t      code = 0;
51✔
3810
  STransAction action = {0};
51✔
3811
  action.epSet = mndGetVgroupEpset(pMnode, pVgroup);
51✔
3812

3813
  int32_t contLen = 0;
51✔
3814
  void   *pReq = mndBuildCompactVnodeReq(pMnode, pDb, pVgroup, &contLen, compactTs, tw, metaOnly);
51✔
3815
  if (pReq == NULL) {
51!
3816
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3817
    if (terrno != 0) code = terrno;
×
3818
    TAOS_RETURN(code);
×
3819
  }
3820

3821
  action.pCont = pReq;
51✔
3822
  action.contLen = contLen;
51✔
3823
  action.msgType = TDMT_VND_COMPACT;
51✔
3824

3825
  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
51!
3826
    taosMemoryFree(pReq);
×
3827
    TAOS_RETURN(code);
×
3828
  }
3829

3830
  TAOS_RETURN(code);
51✔
3831
}
3832

3833
int32_t mndBuildCompactVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int64_t compactTs,
51✔
3834
                                    STimeWindow tw, bool metaOnly) {
3835
  TAOS_CHECK_RETURN(mndAddCompactVnodeAction(pMnode, pTrans, pDb, pVgroup, compactTs, tw, metaOnly));
51!
3836
  return 0;
51✔
3837
}
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc