• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #4687

25 Aug 2025 07:22AM UTC coverage: 57.894% (-2.2%) from 60.092%
#4687

push

travis-ci

web-flow
fix: add taosBenchmark windows support params (#32708)

132643 of 292257 branches covered (45.39%)

Branch coverage included in aggregate %.

201266 of 284501 relevant lines covered (70.74%)

4743408.21 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

55.04
/source/dnode/mnode/impl/src/mndVgroup.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15

16
#define _DEFAULT_SOURCE
17
#include "audit.h"
18
#include "mndArbGroup.h"
19
#include "mndDb.h"
20
#include "mndDnode.h"
21
#include "mndMnode.h"
22
#include "mndPrivilege.h"
23
#include "mndShow.h"
24
#include "mndStb.h"
25
#include "mndStream.h"
26
#include "mndTopic.h"
27
#include "mndTrans.h"
28
#include "mndUser.h"
29
#include "mndVgroup.h"
30
#include "tmisce.h"
31

32
#define VGROUP_VER_NUMBER   1
33
#define VGROUP_RESERVE_SIZE 60
34

35
static int32_t mndVgroupActionInsert(SSdb *pSdb, SVgObj *pVgroup);
36
static int32_t mndVgroupActionDelete(SSdb *pSdb, SVgObj *pVgroup);
37
static int32_t mndVgroupActionUpdate(SSdb *pSdb, SVgObj *pOld, SVgObj *pNew);
38
static int32_t mndNewVgActionValidate(SMnode *pMnode, STrans *pTrans, SSdbRaw *pRaw);
39

40
static int32_t mndRetrieveVgroups(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows);
41
static void    mndCancelGetNextVgroup(SMnode *pMnode, void *pIter);
42
static int32_t mndRetrieveVnodes(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows);
43
static void    mndCancelGetNextVnode(SMnode *pMnode, void *pIter);
44

45
static int32_t mndProcessRedistributeVgroupMsg(SRpcMsg *pReq);
46
static int32_t mndProcessSplitVgroupMsg(SRpcMsg *pReq);
47
static int32_t mndProcessBalanceVgroupMsg(SRpcMsg *pReq);
48
static int32_t mndProcessVgroupBalanceLeaderMsg(SRpcMsg *pReq);
49
int32_t mndTransProcessSsMigrateVgroupRsp(SRpcMsg *pRsp);
50

51
/**
 * Wires the vgroup module into the mnode: message handlers, "show" handlers,
 * and the SDB_VGROUP table description.
 *
 * @param pMnode mnode instance the handlers and table are attached to.
 * @return the result of sdbSetTable() for the vgroup table.
 */
int32_t mndInitVgroup(SMnode *pMnode) {
  // Responses routed to the generic transaction response handler, except the
  // ss-migrate response which has its own handler.
  mndSetMsgHandle(pMnode, TDMT_DND_CREATE_VNODE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_ALTER_REPLICA_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_ALTER_CONFIG_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_ALTER_CONFIRM_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_ALTER_HASHRANGE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_DND_DROP_VNODE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_COMPACT_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_SSMIGRATE_RSP, mndTransProcessSsMigrateVgroupRsp);
  mndSetMsgHandle(pMnode, TDMT_VND_DISABLE_WRITE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_SYNC_FORCE_FOLLOWER_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_DND_ALTER_VNODE_TYPE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_DND_CHECK_VNODE_LEARNER_CATCHUP_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_SYNC_CONFIG_CHANGE_RSP, mndTransProcessRsp);

  // Vgroup management requests handled by this file.
  mndSetMsgHandle(pMnode, TDMT_MND_REDISTRIBUTE_VGROUP, mndProcessRedistributeVgroupMsg);
  mndSetMsgHandle(pMnode, TDMT_MND_SPLIT_VGROUP, mndProcessSplitVgroupMsg);
  mndSetMsgHandle(pMnode, TDMT_MND_BALANCE_VGROUP, mndProcessBalanceVgroupMsg);
  mndSetMsgHandle(pMnode, TDMT_MND_BALANCE_VGROUP_LEADER, mndProcessVgroupBalanceLeaderMsg);

  // "show vgroups" / "show vnodes" retrieval and iterator cleanup.
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_VGROUP, mndRetrieveVgroups);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_VGROUP, mndCancelGetNextVgroup);
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_VNODES, mndRetrieveVnodes);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_VNODES, mndCancelGetNextVnode);

  // Describe the SDB_VGROUP table; members not assigned below stay zero.
  SSdbTable vgroupTable = {0};
  vgroupTable.sdbType = SDB_VGROUP;
  vgroupTable.keyType = SDB_KEY_INT32;
  vgroupTable.encodeFp = (SdbEncodeFp)mndVgroupActionEncode;
  vgroupTable.decodeFp = (SdbDecodeFp)mndVgroupActionDecode;
  vgroupTable.insertFp = (SdbInsertFp)mndVgroupActionInsert;
  vgroupTable.updateFp = (SdbUpdateFp)mndVgroupActionUpdate;
  vgroupTable.deleteFp = (SdbDeleteFp)mndVgroupActionDelete;
  vgroupTable.validateFp = (SdbValidateFp)mndNewVgActionValidate;

  return sdbSetTable(pMnode->pSdb, vgroupTable);
}
90

91
// Counterpart of mndInitVgroup(); intentionally does nothing.
void mndCleanupVgroup(SMnode *pMnode) {
  (void)pMnode;
}
1,923✔
92

93
/**
 * Serializes a vgroup object into a newly allocated SDB raw record.
 *
 * Field order: vgId, createdTime, updateTime, version, hashBegin, hashEnd,
 * dbName, dbUid, isTsma, replica, one dnodeId per replica, syncConfChangeVer,
 * mountVgId, then VGROUP_RESERVE_SIZE reserved bytes.
 *
 * @param pVgroup vgroup to encode.
 * @return the raw record, or NULL on failure (terrno is left non-zero and the
 *         partially built record is freed).
 */
SSdbRaw *mndVgroupActionEncode(SVgObj *pVgroup) {
  // Not referenced directly below. NOTE(review): presumably consumed by the
  // SDB_SET_* macros; confirm before removing.
  int32_t code = 0;
  int32_t lino = 0;
  int32_t dataPos = 0;

  // Pessimistic default: any jump to _OVER before the final reset is a failure.
  terrno = TSDB_CODE_OUT_OF_MEMORY;

  SSdbRaw *pRaw = sdbAllocRaw(SDB_VGROUP, VGROUP_VER_NUMBER, sizeof(SVgObj) + VGROUP_RESERVE_SIZE);
  if (pRaw == NULL) goto _OVER;

  SDB_SET_INT32(pRaw, dataPos, pVgroup->vgId, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pVgroup->createdTime, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pVgroup->updateTime, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pVgroup->version, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pVgroup->hashBegin, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pVgroup->hashEnd, _OVER)
  SDB_SET_BINARY(pRaw, dataPos, pVgroup->dbName, TSDB_DB_FNAME_LEN, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pVgroup->dbUid, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pVgroup->isTsma, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pVgroup->replica, _OVER)
  // Only the dnode id of each replica is persisted.
  for (int8_t idx = 0; idx < pVgroup->replica; ++idx) {
    SDB_SET_INT32(pRaw, dataPos, pVgroup->vnodeGid[idx].dnodeId, _OVER)
  }
  SDB_SET_INT32(pRaw, dataPos, pVgroup->syncConfChangeVer, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pVgroup->mountVgId, _OVER)
  SDB_SET_RESERVE(pRaw, dataPos, VGROUP_RESERVE_SIZE, _OVER)
  SDB_SET_DATALEN(pRaw, dataPos, _OVER)

  terrno = 0;

_OVER:
  if (terrno == 0) {
    mTrace("vgId:%d, encode to raw:%p, row:%p", pVgroup->vgId, pRaw, pVgroup);
    return pRaw;
  }

  mError("vgId:%d, failed to encode to raw:%p since %s", pVgroup->vgId, pRaw, terrstr());
  sdbFreeRaw(pRaw);
  return NULL;
}
133

134
/**
 * Rebuilds a vgroup row from an SDB raw record written by
 * mndVgroupActionEncode().
 *
 * @param pRaw raw record to decode.
 * @return a newly allocated row wrapping an SVgObj, or NULL on failure
 *         (terrno is left non-zero and the row is freed).
 */
SSdbRow *mndVgroupActionDecode(SSdbRaw *pRaw) {
  // Not referenced directly below. NOTE(review): presumably consumed by the
  // SDB_GET_* macros; confirm before removing.
  int32_t code = 0;
  int32_t lino = 0;
  int32_t dataPos = 0;

  SSdbRow *pRow = NULL;
  SVgObj  *pVgroup = NULL;
  int8_t   sver = 0;

  // Pessimistic default: any jump to _OVER before the final reset is a failure.
  terrno = TSDB_CODE_OUT_OF_MEMORY;

  if (sdbGetRawSoftVer(pRaw, &sver) != 0) goto _OVER;

  // Accept only versions in [1, VGROUP_VER_NUMBER].
  if (sver < 1 || sver > VGROUP_VER_NUMBER) {
    terrno = TSDB_CODE_SDB_INVALID_DATA_VER;
    goto _OVER;
  }

  pRow = sdbAllocRow(sizeof(SVgObj));
  if (pRow == NULL) goto _OVER;

  pVgroup = sdbGetRowObj(pRow);
  if (pVgroup == NULL) goto _OVER;

  SDB_GET_INT32(pRaw, dataPos, &pVgroup->vgId, _OVER)
  SDB_GET_INT64(pRaw, dataPos, &pVgroup->createdTime, _OVER)
  SDB_GET_INT64(pRaw, dataPos, &pVgroup->updateTime, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->version, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->hashBegin, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->hashEnd, _OVER)
  SDB_GET_BINARY(pRaw, dataPos, pVgroup->dbName, TSDB_DB_FNAME_LEN, _OVER)
  SDB_GET_INT64(pRaw, dataPos, &pVgroup->dbUid, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &pVgroup->isTsma, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &pVgroup->replica, _OVER)
  for (int8_t idx = 0; idx < pVgroup->replica; ++idx) {
    SVnodeGid *pGid = &pVgroup->vnodeGid[idx];
    SDB_GET_INT32(pRaw, dataPos, &pGid->dnodeId, _OVER)
    // A single-replica vgroup has its only member marked as leader on load.
    if (pVgroup->replica == 1) {
      pGid->syncState = TAOS_SYNC_STATE_LEADER;
    }
  }

  // syncConfChangeVer is read only when the record is long enough to hold both
  // trailing int32 fields plus the reserved area.
  // NOTE(review): mountVgId below is read unconditionally; for a record written
  // without mountVgId this looks like it would consume the syncConfChangeVer
  // slot instead - confirm against records produced by older versions.
  if (dataPos + 2 * sizeof(int32_t) + VGROUP_RESERVE_SIZE <= pRaw->dataLen) {
    SDB_GET_INT32(pRaw, dataPos, &pVgroup->syncConfChangeVer, _OVER)
  }
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->mountVgId, _OVER)
  SDB_GET_RESERVE(pRaw, dataPos, VGROUP_RESERVE_SIZE, _OVER)

  terrno = 0;

_OVER:
  if (terrno == 0) {
    mTrace("vgId:%d, decode from raw:%p, row:%p", pVgroup->vgId, pRaw, pVgroup);
    return pRow;
  }

  mError("vgId:%d, failed to decode from raw:%p since %s", pVgroup == NULL ? 0 : pVgroup->vgId, pRaw, terrstr());
  taosMemoryFreeClear(pRow);
  return NULL;
}
191

192
/**
 * Validation callback for a new vgroup record carried by a transaction.
 *
 * Decodes the raw record and rejects it when the value returned by
 * sdbGetMaxId() for SDB_VGROUP is greater than the record's vgId.
 *
 * @param pMnode mnode instance (provides the SDB).
 * @param pTrans transaction the record belongs to (used for logging only).
 * @param pRaw   encoded vgroup record.
 * @return 0 when accepted; -1 when the id is rejected; terrno (or
 *         TSDB_CODE_MND_RETURN_VALUE_NULL if terrno is 0) when decoding fails.
 */
static int32_t mndNewVgActionValidate(SMnode *pMnode, STrans *pTrans, SSdbRaw *pRaw) {
  SSdb   *pSdb = pMnode->pSdb;
  SVgObj *pVgroup = NULL;
  int     code = -1;

  SSdbRow *pRow = mndVgroupActionDecode(pRaw);
  if (pRow != NULL) {
    pVgroup = sdbGetRowObj(pRow);
  }
  if (pVgroup == NULL) {
    // Either the decode or the row-object lookup failed.
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    goto _OVER;
  }

  const int32_t maxVgId = sdbGetMaxId(pMnode->pSdb, SDB_VGROUP);
  if (maxVgId <= pVgroup->vgId) {
    code = 0;
  } else {
    // code stays -1
    mError("trans:%d, vgroup id %d already in use. maxVgId:%d", pTrans->id, pVgroup->vgId, maxVgId);
  }

_OVER:
  // The decoded row is temporary: run the delete action on it, then free it.
  if (pVgroup != NULL) mndVgroupActionDelete(pSdb, pVgroup);
  taosMemoryFreeClear(pRow);
  TAOS_RETURN(code);
}
223

224
// SDB insert callback for vgroup rows: only traces the event and reports success.
static int32_t mndVgroupActionInsert(SSdb *pSdb, SVgObj *pVgroup) {
  (void)pSdb;
  mTrace("vgId:%d, perform insert action, row:%p", pVgroup->vgId, pVgroup);
  return 0;
}
228

229
// SDB delete callback for vgroup rows: only traces the event and reports success.
static int32_t mndVgroupActionDelete(SSdb *pSdb, SVgObj *pVgroup) {
  (void)pSdb;
  mTrace("vgId:%d, perform delete action, row:%p", pVgroup->vgId, pVgroup);
  return 0;
}
233

234
static int32_t mndVgroupActionUpdate(SSdb *pSdb, SVgObj *pOld, SVgObj *pNew) {
9,861✔
235
  mTrace("vgId:%d, perform update action, old row:%p new row:%p", pOld->vgId, pOld, pNew);
9,861✔
236
  pOld->updateTime = pNew->updateTime;
9,861✔
237
  pOld->version = pNew->version;
9,861✔
238
  pOld->hashBegin = pNew->hashBegin;
9,861✔
239
  pOld->hashEnd = pNew->hashEnd;
9,861✔
240
  pOld->replica = pNew->replica;
9,861✔
241
  pOld->isTsma = pNew->isTsma;
9,861✔
242
  for (int32_t i = 0; i < pNew->replica; ++i) {
22,444✔
243
    SVnodeGid *pNewGid = &pNew->vnodeGid[i];
12,583✔
244
    for (int32_t j = 0; j < pOld->replica; ++j) {
33,328✔
245
      SVnodeGid *pOldGid = &pOld->vnodeGid[j];
20,745✔
246
      if (pNewGid->dnodeId == pOldGid->dnodeId) {
20,745✔
247
        pNewGid->syncState = pOldGid->syncState;
12,160✔
248
        pNewGid->syncRestore = pOldGid->syncRestore;
12,160✔
249
        pNewGid->syncCanRead = pOldGid->syncCanRead;
12,160✔
250
        pNewGid->syncAppliedIndex = pOldGid->syncAppliedIndex;
12,160✔
251
        pNewGid->syncCommitIndex = pOldGid->syncCommitIndex;
12,160✔
252
        pNewGid->bufferSegmentUsed = pOldGid->bufferSegmentUsed;
12,160✔
253
        pNewGid->bufferSegmentSize = pOldGid->bufferSegmentSize;
12,160✔
254
      }
255
    }
256
  }
257
  pNew->numOfTables = pOld->numOfTables;
9,861✔
258
  pNew->numOfTimeSeries = pOld->numOfTimeSeries;
9,861✔
259
  pNew->totalStorage = pOld->totalStorage;
9,861✔
260
  pNew->compStorage = pOld->compStorage;
9,861✔
261
  pNew->pointsWritten = pOld->pointsWritten;
9,861✔
262
  pNew->compact = pOld->compact;
9,861✔
263
  memcpy(pOld->vnodeGid, pNew->vnodeGid, (TSDB_MAX_REPLICA + TSDB_MAX_LEARNER_REPLICA) * sizeof(SVnodeGid));
9,861✔
264
  pOld->syncConfChangeVer = pNew->syncConfChangeVer;
9,861✔
265
  return 0;
9,861✔
266
}
267

268
/**
 * Looks up a vgroup by id through sdbAcquire().
 *
 * @return the vgroup, or NULL. When the SDB reports
 *         TSDB_CODE_SDB_OBJ_NOT_THERE, terrno is rewritten to
 *         TSDB_CODE_MND_VGROUP_NOT_EXIST; other terrno values are left as is.
 */
SVgObj *mndAcquireVgroup(SMnode *pMnode, int32_t vgId) {
  SVgObj *pFound = sdbAcquire(pMnode->pSdb, SDB_VGROUP, &vgId);
  if (pFound != NULL) {
    return pFound;
  }

  if (terrno == TSDB_CODE_SDB_OBJ_NOT_THERE) {
    terrno = TSDB_CODE_MND_VGROUP_NOT_EXIST;
  }
  return NULL;
}
276

277
// Hands a vgroup obtained from mndAcquireVgroup() back to the SDB via sdbRelease().
void mndReleaseVgroup(SMnode *pMnode, SVgObj *pVgroup) {
  sdbRelease(pMnode->pSdb, pVgroup);
}
249,758✔
281

282
/**
 * Builds the serialized "create vnode" request sent to one dnode of a vgroup.
 *
 * Database settings come from pDb->cfg, identity and hash range from pVgroup.
 * Replica entries are split into replicas[] (voters) and learnerReplicas[];
 * selfIndex / learnerSelfIndex is the position of pDnode inside its own array.
 *
 * Side effect: pVgroup->syncConfChangeVer is incremented, including on the
 * failure paths that follow the increment.
 *
 * @param pContLen receives the payload length on success; untouched on failure.
 * @return heap buffer holding the request, or NULL on failure.
 */
void *mndBuildCreateVnodeReq(SMnode *pMnode, SDnodeObj *pDnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen) {
  SCreateVnodeReq createReq = {0};

  // Identity of the vnode.
  createReq.vgId = pVgroup->vgId;
  memcpy(createReq.db, pDb->name, TSDB_DB_FNAME_LEN);
  createReq.dbUid = pDb->uid;
  createReq.vgVersion = pVgroup->version;

  // Settings copied from the database configuration.
  createReq.numOfStables = pDb->cfg.numOfStables;
  createReq.buffer = pDb->cfg.buffer;
  createReq.pageSize = pDb->cfg.pageSize;
  createReq.pages = pDb->cfg.pages;
  createReq.cacheLastSize = pDb->cfg.cacheLastSize;
  createReq.daysPerFile = pDb->cfg.daysPerFile;
  createReq.daysToKeep0 = pDb->cfg.daysToKeep0;
  createReq.daysToKeep1 = pDb->cfg.daysToKeep1;
  createReq.daysToKeep2 = pDb->cfg.daysToKeep2;
  createReq.keepTimeOffset = pDb->cfg.keepTimeOffset;
  createReq.ssChunkSize = pDb->cfg.ssChunkSize;
  createReq.ssKeepLocal = pDb->cfg.ssKeepLocal;
  createReq.ssCompact = pDb->cfg.ssCompact;
  createReq.minRows = pDb->cfg.minRows;
  createReq.maxRows = pDb->cfg.maxRows;
  createReq.walFsyncPeriod = pDb->cfg.walFsyncPeriod;
  createReq.walLevel = pDb->cfg.walLevel;
  createReq.precision = pDb->cfg.precision;
  createReq.compression = pDb->cfg.compression;
  createReq.strict = pDb->cfg.strict;
  createReq.cacheLast = pDb->cfg.cacheLast;

  // Replica bookkeeping starts empty; -1 means "this dnode not found yet".
  createReq.replica = 0;
  createReq.learnerReplica = 0;
  createReq.selfIndex = -1;
  createReq.learnerSelfIndex = -1;

  createReq.hashBegin = pVgroup->hashBegin;
  createReq.hashEnd = pVgroup->hashEnd;
  createReq.hashMethod = pDb->cfg.hashMethod;
  createReq.numOfRetensions = pDb->cfg.numOfRetensions;
  createReq.pRetensions = pDb->cfg.pRetensions;
  createReq.isTsma = pVgroup->isTsma;
  createReq.pTsma = pVgroup->pTsma;
  createReq.walRetentionPeriod = pDb->cfg.walRetentionPeriod;
  createReq.walRetentionSize = pDb->cfg.walRetentionSize;
  createReq.walRollPeriod = pDb->cfg.walRollPeriod;
  createReq.walSegmentSize = pDb->cfg.walSegmentSize;
  createReq.sstTrigger = pDb->cfg.sstTrigger;
  createReq.hashPrefix = pDb->cfg.hashPrefix;
  createReq.hashSuffix = pDb->cfg.hashSuffix;
  createReq.tsdbPageSize = pDb->cfg.tsdbPageSize;
  createReq.changeVersion = ++(pVgroup->syncConfChangeVer);
  createReq.encryptAlgorithm = pDb->cfg.encryptAlgorithm;

  int32_t code = 0;

  for (int32_t v = 0; v < pVgroup->replica; ++v) {
    SVnodeGid *pVgid = &pVgroup->vnodeGid[v];
    const bool isVoter = (pVgid->nodeRole == TAOS_SYNC_ROLE_VOTER);
    const bool isSelf = (pDnode->id == pVgid->dnodeId);

    // Next free slot in the array matching this member's role.
    SReplica *pSlot = isVoter ? &createReq.replicas[createReq.replica]
                              : &createReq.learnerReplicas[createReq.learnerReplica];

    SDnodeObj *pMember = mndAcquireDnode(pMnode, pVgid->dnodeId);
    if (pMember == NULL) {
      return NULL;
    }
    pSlot->id = pMember->id;
    pSlot->port = pMember->port;
    memcpy(pSlot->fqdn, pMember->fqdn, TSDB_FQDN_LEN);
    mndReleaseDnode(pMnode, pMember);

    if (isVoter) {
      if (isSelf) createReq.selfIndex = createReq.replica;
      createReq.replica++;
    } else {
      if (isSelf) createReq.learnerSelfIndex = createReq.learnerReplica;
      createReq.learnerReplica++;
    }
  }

  // The target dnode must be a member of the vgroup in one role or the other.
  if (createReq.selfIndex == -1 && createReq.learnerSelfIndex == -1) {
    terrno = TSDB_CODE_APP_ERROR;
    return NULL;
  }

  // Second assignment of the value already stored above.
  // NOTE(review): looks redundant - confirm before dropping it.
  createReq.changeVersion = pVgroup->syncConfChangeVer;

  mInfo(
      "vgId:%d, build create vnode req, replica:%d selfIndex:%d learnerReplica:%d learnerSelfIndex:%d strict:%d "
      "changeVersion:%d",
      createReq.vgId, createReq.replica, createReq.selfIndex, createReq.learnerReplica, createReq.learnerSelfIndex,
      createReq.strict, createReq.changeVersion);
  for (int32_t r = 0; r < createReq.replica; ++r) {
    mInfo("vgId:%d, replica:%d ep:%s:%u", createReq.vgId, r, createReq.replicas[r].fqdn, createReq.replicas[r].port);
  }
  for (int32_t r = 0; r < createReq.learnerReplica; ++r) {
    mInfo("vgId:%d, replica:%d ep:%s:%u", createReq.vgId, r, createReq.learnerReplicas[r].fqdn,
          createReq.learnerReplicas[r].port);
  }

  // First pass with a NULL buffer yields the encoded size.
  const int32_t contLen = tSerializeSCreateVnodeReq(NULL, 0, &createReq);
  void         *pReq = NULL;
  if (contLen >= 0) {
    pReq = taosMemoryMalloc(contLen);
  }
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  code = tSerializeSCreateVnodeReq(pReq, contLen, &createReq);
  if (code >= 0) {
    *pContLen = contLen;
    return pReq;
  }

  terrno = TSDB_CODE_APP_ERROR;
  taosMemoryFree(pReq);
  mError("vgId:%d, failed to serialize create vnode req,since %s", createReq.vgId, terrstr());
  return NULL;
}
411

412
/**
 * Builds the "alter vnode config" message for a vgroup: an SMsgHead followed by
 * the serialized SAlterVnodeConfigReq filled from pDb->cfg.
 *
 * @param pMnode   unused here.
 * @param pDb      database whose configuration is sent.
 * @param pVgroup  target vgroup (supplies vgId and version).
 * @param pContLen receives the total message length (header + body) on
 *                 success; untouched on failure.
 * @return heap buffer holding the message, or NULL on failure with terrno set
 *         to TSDB_CODE_OUT_OF_MEMORY.
 */
static void *mndBuildAlterVnodeConfigReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen) {
  SAlterVnodeConfigReq alterReq = {0};
  alterReq.vgVersion = pVgroup->version;
  alterReq.buffer = pDb->cfg.buffer;
  alterReq.pageSize = pDb->cfg.pageSize;
  alterReq.pages = pDb->cfg.pages;
  alterReq.cacheLastSize = pDb->cfg.cacheLastSize;
  alterReq.daysPerFile = pDb->cfg.daysPerFile;
  alterReq.daysToKeep0 = pDb->cfg.daysToKeep0;
  alterReq.daysToKeep1 = pDb->cfg.daysToKeep1;
  alterReq.daysToKeep2 = pDb->cfg.daysToKeep2;
  alterReq.keepTimeOffset = pDb->cfg.keepTimeOffset;
  alterReq.walFsyncPeriod = pDb->cfg.walFsyncPeriod;
  alterReq.walLevel = pDb->cfg.walLevel;
  alterReq.strict = pDb->cfg.strict;
  alterReq.cacheLast = pDb->cfg.cacheLast;
  alterReq.sttTrigger = pDb->cfg.sstTrigger;
  alterReq.minRows = pDb->cfg.minRows;
  alterReq.walRetentionPeriod = pDb->cfg.walRetentionPeriod;
  alterReq.walRetentionSize = pDb->cfg.walRetentionSize;
  alterReq.ssKeepLocal = pDb->cfg.ssKeepLocal;
  alterReq.ssCompact = pDb->cfg.ssCompact;

  mInfo("vgId:%d, build alter vnode config req", pVgroup->vgId);

  // First pass with a NULL buffer yields the size of the encoded body only.
  int32_t bodyLen = tSerializeSAlterVnodeConfigReq(NULL, 0, &alterReq);
  if (bodyLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  int32_t contLen = bodyLen + (int32_t)sizeof(SMsgHead);

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // Header fields are stored in network byte order.
  SMsgHead *pHead = pReq;
  pHead->contLen = htonl(contLen);
  pHead->vgId = htonl(pVgroup->vgId);

  // The body starts after the header, so only bodyLen bytes are available to
  // the encoder. Passing contLen here would overstate the buffer by
  // sizeof(SMsgHead).
  if (tSerializeSAlterVnodeConfigReq((char *)pReq + sizeof(SMsgHead), bodyLen, &alterReq) < 0) {
    taosMemoryFree(pReq);
    mError("vgId:%d, failed to serialize alter vnode config req,since %s", pVgroup->vgId, terrstr());
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
462

463
/**
 * Builds the serialized "alter vnode replica" request for the member of
 * pVgroup that lives on dnode `dnodeId`.
 *
 * Members are split by role into replicas[] (voters) and learnerReplicas[].
 * selfIndex / learnerSelfIndex is the position of `dnodeId` inside the array
 * matching its role, the same convention mndBuildCreateVnodeReq() uses. The
 * previous code stored the index into pVgroup->vnodeGid[] instead, which
 * differs from the array position whenever the two roles are mixed (e.g. any
 * learner target that follows at least one voter).
 *
 * Side effect: pVgroup->syncConfChangeVer is incremented, including on the
 * failure paths.
 *
 * @param pContLen receives the payload length on success; untouched on failure.
 * @return heap buffer holding the request, or NULL on failure.
 */
static void *mndBuildAlterVnodeReplicaReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId,
                                          int32_t *pContLen) {
  SAlterVnodeReplicaReq alterReq = {
      .vgId = pVgroup->vgId,
      .strict = pDb->cfg.strict,
      .replica = 0,
      .learnerReplica = 0,
      .selfIndex = -1,         // -1: target dnode not found among voters
      .learnerSelfIndex = -1,  // -1: target dnode not found among learners
      .changeVersion = ++(pVgroup->syncConfChangeVer),
  };

  for (int32_t v = 0; v < pVgroup->replica; ++v) {
    SVnodeGid *pVgid = &pVgroup->vnodeGid[v];
    bool       isVoter = (pVgid->nodeRole == TAOS_SYNC_ROLE_VOTER);

    SDnodeObj *pVgidDnode = mndAcquireDnode(pMnode, pVgid->dnodeId);
    if (pVgidDnode == NULL) return NULL;

    // Claim the next slot of the array matching this member's role.
    int32_t   slot = isVoter ? alterReq.replica++ : alterReq.learnerReplica++;
    SReplica *pReplica = isVoter ? &alterReq.replicas[slot] : &alterReq.learnerReplicas[slot];

    pReplica->id = pVgidDnode->id;
    pReplica->port = pVgidDnode->port;
    memcpy(pReplica->fqdn, pVgidDnode->fqdn, TSDB_FQDN_LEN);
    mndReleaseDnode(pMnode, pVgidDnode);

    if (dnodeId == pVgid->dnodeId) {
      if (isVoter) {
        alterReq.selfIndex = slot;
      } else {
        alterReq.learnerSelfIndex = slot;
      }
    }
  }

  mInfo(
      "vgId:%d, build alter vnode req, replica:%d selfIndex:%d learnerReplica:%d learnerSelfIndex:%d strict:%d "
      "changeVersion:%d",
      alterReq.vgId, alterReq.replica, alterReq.selfIndex, alterReq.learnerReplica, alterReq.learnerSelfIndex,
      alterReq.strict, alterReq.changeVersion);
  for (int32_t i = 0; i < alterReq.replica; ++i) {
    mInfo("vgId:%d, replica:%d ep:%s:%u", alterReq.vgId, i, alterReq.replicas[i].fqdn, alterReq.replicas[i].port);
  }
  for (int32_t i = 0; i < alterReq.learnerReplica; ++i) {
    mInfo("vgId:%d, learnerReplica:%d ep:%s:%u", alterReq.vgId, i, alterReq.learnerReplicas[i].fqdn,
          alterReq.learnerReplicas[i].port);
  }

  // The target dnode must be a member of the vgroup in one role or the other.
  if (alterReq.selfIndex == -1 && alterReq.learnerSelfIndex == -1) {
    terrno = TSDB_CODE_APP_ERROR;
    return NULL;
  }

  // First pass with a NULL buffer yields the encoded size.
  int32_t contLen = tSerializeSAlterVnodeReplicaReq(NULL, 0, &alterReq);
  if (contLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSAlterVnodeReplicaReq(pReq, contLen, &alterReq) < 0) {
    mError("vgId:%d, failed to serialize alter vnode req,since %s", alterReq.vgId, terrstr());
    taosMemoryFree(pReq);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
545

546
/**
 * Builds the serialized "check learner catch-up" request for the member of
 * pVgroup that lives on dnode `dnodeId`.
 *
 * Members are split by role into replicas[] (voters) and learnerReplicas[].
 * selfIndex / learnerSelfIndex is the position of `dnodeId` inside the array
 * matching its role, the same convention mndBuildCreateVnodeReq() uses. The
 * previous code stored the index into pVgroup->vnodeGid[] instead, which
 * differs from the array position whenever the two roles are mixed.
 *
 * The request is encoded with tSerializeSAlterVnodeReplicaReq(), and the log
 * texts still say "alter vnode req"; both are kept as they were.
 *
 * @param pContLen receives the payload length on success; untouched on failure.
 * @return heap buffer holding the request, or NULL on failure.
 */
static void *mndBuildCheckLearnCatchupReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId,
                                          int32_t *pContLen) {
  SCheckLearnCatchupReq req = {
      .vgId = pVgroup->vgId,
      .strict = pDb->cfg.strict,
      .replica = 0,
      .learnerReplica = 0,
      .selfIndex = -1,         // -1: target dnode not found among voters
      .learnerSelfIndex = -1,  // -1: target dnode not found among learners
  };

  for (int32_t v = 0; v < pVgroup->replica; ++v) {
    SVnodeGid *pVgid = &pVgroup->vnodeGid[v];
    bool       isVoter = (pVgid->nodeRole == TAOS_SYNC_ROLE_VOTER);

    SDnodeObj *pVgidDnode = mndAcquireDnode(pMnode, pVgid->dnodeId);
    if (pVgidDnode == NULL) return NULL;

    // Claim the next slot of the array matching this member's role.
    int32_t   slot = isVoter ? req.replica++ : req.learnerReplica++;
    SReplica *pReplica = isVoter ? &req.replicas[slot] : &req.learnerReplicas[slot];

    pReplica->id = pVgidDnode->id;
    pReplica->port = pVgidDnode->port;
    memcpy(pReplica->fqdn, pVgidDnode->fqdn, TSDB_FQDN_LEN);
    mndReleaseDnode(pMnode, pVgidDnode);

    if (dnodeId == pVgid->dnodeId) {
      if (isVoter) {
        req.selfIndex = slot;
      } else {
        req.learnerSelfIndex = slot;
      }
    }
  }

  mInfo("vgId:%d, build alter vnode req, replica:%d selfIndex:%d learnerReplica:%d learnerSelfIndex:%d strict:%d",
        req.vgId, req.replica, req.selfIndex, req.learnerReplica, req.learnerSelfIndex, req.strict);
  for (int32_t i = 0; i < req.replica; ++i) {
    mInfo("vgId:%d, replica:%d ep:%s:%u", req.vgId, i, req.replicas[i].fqdn, req.replicas[i].port);
  }
  for (int32_t i = 0; i < req.learnerReplica; ++i) {
    mInfo("vgId:%d, learnerReplica:%d ep:%s:%u", req.vgId, i, req.learnerReplicas[i].fqdn, req.learnerReplicas[i].port);
  }

  // The target dnode must be a member of the vgroup in one role or the other.
  if (req.selfIndex == -1 && req.learnerSelfIndex == -1) {
    terrno = TSDB_CODE_APP_ERROR;
    return NULL;
  }

  // First pass with a NULL buffer yields the encoded size.
  int32_t contLen = tSerializeSAlterVnodeReplicaReq(NULL, 0, &req);
  if (contLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSAlterVnodeReplicaReq(pReq, contLen, &req) < 0) {
    mError("vgId:%d, failed to serialize alter vnode req,since %s", req.vgId, terrstr());
    taosMemoryFree(pReq);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
623

624
/**
 * Builds the serialized "disable vnode write" request (disable = 1) for vgId.
 *
 * @param pContLen receives the payload length on success; untouched on failure.
 * @return heap buffer holding the request, or NULL on failure with terrno set
 *         to TSDB_CODE_OUT_OF_MEMORY.
 */
static void *mndBuildDisableVnodeWriteReq(SMnode *pMnode, SDbObj *pDb, int32_t vgId, int32_t *pContLen) {
  SDisableVnodeWriteReq disableReq = {0};
  disableReq.vgId = vgId;
  disableReq.disable = 1;

  mInfo("vgId:%d, build disable vnode write req", vgId);

  // First pass with a NULL buffer yields the encoded size.
  const int32_t contLen = tSerializeSDisableVnodeWriteReq(NULL, 0, &disableReq);
  void         *pReq = NULL;
  if (contLen >= 0) {
    pReq = taosMemoryMalloc(contLen);
  }
  if (pReq == NULL) {
    // Either the size query or the allocation failed.
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSDisableVnodeWriteReq(pReq, contLen, &disableReq) >= 0) {
    *pContLen = contLen;
    return pReq;
  }

  mError("vgId:%d, failed to serialize disable vnode write req,since %s", vgId, terrstr());
  taosMemoryFree(pReq);
  terrno = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}
652

653
/**
 * Builds the serialized "alter vnode hash range" request: source vgId plus the
 * id and hash range of pVgroup as destination.
 *
 * Side effect: pVgroup->syncConfChangeVer is incremented, including on the
 * failure paths.
 *
 * @param pContLen receives the payload length on success; untouched on failure.
 * @return heap buffer holding the request, or NULL on failure with terrno set
 *         to TSDB_CODE_OUT_OF_MEMORY.
 */
static void *mndBuildAlterVnodeHashRangeReq(SMnode *pMnode, int32_t srcVgId, SVgObj *pVgroup, int32_t *pContLen) {
  SAlterVnodeHashRangeReq alterReq = {0};
  alterReq.srcVgId = srcVgId;
  alterReq.dstVgId = pVgroup->vgId;
  alterReq.hashBegin = pVgroup->hashBegin;
  alterReq.hashEnd = pVgroup->hashEnd;
  alterReq.changeVersion = ++(pVgroup->syncConfChangeVer);

  mInfo("vgId:%d, build alter vnode hashrange req, dstVgId:%d, hashrange:[%u, %u]", srcVgId, pVgroup->vgId,
        pVgroup->hashBegin, pVgroup->hashEnd);

  // First pass with a NULL buffer yields the encoded size.
  const int32_t contLen = tSerializeSAlterVnodeHashRangeReq(NULL, 0, &alterReq);
  void         *pReq = NULL;
  if (contLen >= 0) {
    pReq = taosMemoryMalloc(contLen);
  }
  if (pReq == NULL) {
    // Either the size query or the allocation failed.
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSAlterVnodeHashRangeReq(pReq, contLen, &alterReq) >= 0) {
    *pContLen = contLen;
    return pReq;
  }

  mError("vgId:%d, failed to serialize alter vnode hashrange req,since %s", srcVgId, terrstr());
  taosMemoryFree(pReq);
  terrno = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}
685

686
/**
 * Builds the serialized "drop vnode" request for the vnode of pVgroup hosted
 * on pDnode.
 *
 * @param pContLen receives the payload length on success; untouched on failure.
 * @return heap buffer holding the request, or NULL on failure with terrno set
 *         to TSDB_CODE_OUT_OF_MEMORY.
 */
void *mndBuildDropVnodeReq(SMnode *pMnode, SDnodeObj *pDnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen) {
  SDropVnodeReq dropReq = {0};
  dropReq.dnodeId = pDnode->id;
  dropReq.vgId = pVgroup->vgId;
  memcpy(dropReq.db, pDb->name, TSDB_DB_FNAME_LEN);
  dropReq.dbUid = pDb->uid;

  mInfo("vgId:%d, build drop vnode req", dropReq.vgId);

  // First pass with a NULL buffer yields the encoded size.
  const int32_t contLen = tSerializeSDropVnodeReq(NULL, 0, &dropReq);
  void         *pReq = NULL;
  if (contLen >= 0) {
    pReq = taosMemoryMalloc(contLen);
  }
  if (pReq == NULL) {
    // Either the size query or the allocation failed.
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSDropVnodeReq(pReq, contLen, &dropReq) >= 0) {
    *pContLen = contLen;
    return pReq;
  }

  mError("vgId:%d, failed to serialize drop vnode req,since %s", dropReq.vgId, terrstr());
  taosMemoryFree(pReq);
  terrno = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}
715

716
// Per-dnode callback: zeroes numOfVnodes and numOfOtherNodes of the dnode
// passed as pObj and always returns true. p1..p3 are unused.
static bool mndResetDnodesArrayFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SDnodeObj *pTarget = pObj;

  pTarget->numOfVnodes = 0;
  pTarget->numOfOtherNodes = 0;

  return true;
}
722

723
// sdbTraverse callback: refresh the counters of the visited dnode and push it into the
// candidate array when it qualifies.
//   p1: SArray that receives the dnode
//   p2: pointer to an int32_t dnode id that must be skipped
//   p3: optional SArray of int32_t dnode ids; when non-NULL only listed dnodes are considered
// Returns false only when taosArrayPush fails; true in every other case.
static bool mndBuildDnodesArrayFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SDnodeObj *pDnode = pObj;
  SArray    *pOut = p1;
  int32_t    skipId = *(int32_t *)p2;
  SArray    *pAllowed = p3;

  if (pDnode->id == skipId) return true;

  if (pAllowed != NULL) {
    int32_t nAllowed = taosArrayGetSize(pAllowed);
    bool    listed = false;
    for (int32_t k = 0; k < nAllowed; ++k) {
      if (*(int32_t *)taosArrayGet(pAllowed, k) == pDnode->id) listed = true;
    }
    // An empty (but non-NULL) list leaves `listed` false, so the dnode is skipped too (TS-6191).
    if (!listed) return true;
  }

  int64_t curMs = taosGetTimestampMs();
  bool    online = mndIsDnodeOnline(pDnode, curMs);
  bool    isMnode = mndIsMnode(pMnode, pDnode->id);
  pDnode->numOfVnodes = mndGetVnodesNum(pMnode, pDnode->id);
  pDnode->memUsed = mndGetVnodesMemory(pMnode, pDnode->id);

  mInfo("dnode:%d, vnodes:%d supportVnodes:%d isMnode:%d online:%d memory avail:%" PRId64 " used:%" PRId64, pDnode->id,
        pDnode->numOfVnodes, pDnode->numOfSupportVnodes, isMnode, online, pDnode->memAvail, pDnode->memUsed);

  if (isMnode) pDnode->numOfOtherNodes++;

  // Only online dnodes with a positive supportVnodes value become candidates.
  bool eligible = online && pDnode->numOfSupportVnodes > 0;
  if (eligible && taosArrayPush(pOut, pDnode) == NULL) return false;

  return true;
}
769

770
// Return true when dnodeId occurs in dnodeList (an SArray read as int32_t elements).
static bool isDnodeInList(SArray *dnodeList, int32_t dnodeId) {
  int32_t total = taosArrayGetSize(dnodeList);
  int32_t pos = 0;
  while (pos < total) {
    if (*(int32_t *)TARRAY_GET_ELEM(dnodeList, pos) == dnodeId) return true;
    ++pos;
  }
  return false;
}
780

781
#ifdef TD_ENTERPRISE
782
// Load score used by the dual-replica check: (vnodes + otherNodes * ratio + additionDnodes)
// divided by numOfSupportVnodes. The score is negated for a dnode that already has vnodes,
// so such dnodes compare lower than dnodes without any.
static float mndGetDnodeScore1(SDnodeObj *pDnode, int32_t additionDnodes, float ratio) {
  float load = pDnode->numOfVnodes + (float)pDnode->numOfOtherNodes * ratio + additionDnodes;
  float score = load / pDnode->numOfSupportVnodes;
  if (pDnode->numOfVnodes > 0) {
    return -score;
  }
  return score;
}
787

788
// Comparator over SDnodeObj: order by mndGetDnodeScore1 (ratio 0.9), ties broken by dnode id.
// Returns -1, 0 or 1.
static int32_t mndCompareDnodeVnodes1(SDnodeObj *pDnode1, SDnodeObj *pDnode2) {
  float lhs = mndGetDnodeScore1(pDnode1, 0, 0.9);
  float rhs = mndGetDnodeScore1(pDnode2, 0, 0.9);

  if (lhs == rhs) {
    // Equal scores: fall back to the id so the ordering is deterministic.
    if (pDnode1->id > pDnode2->id) return 1;
    return (pDnode1->id == pDnode2->id) ? 0 : -1;
  }
  return lhs > rhs ? 1 : -1;
}
799

800
// sdbTraverse callback: recompute numOfVnodes for the visited dnode, count it as an "other node"
// when it is an mnode, and push it into the SArray p1 if numOfSupportVnodes is positive.
// Unlike mndBuildDnodesArrayFp, no online check is made. Returns false only when the push fails.
static bool mndBuildDnodesListFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SDnodeObj *pNode = pObj;
  SArray    *pOut = p1;

  bool hostsMnode = mndIsMnode(pMnode, pNode->id);
  pNode->numOfVnodes = mndGetVnodesNum(pMnode, pNode->id);
  if (hostsMnode) pNode->numOfOtherNodes++;

  if (pNode->numOfSupportVnodes <= 0) return true;
  return taosArrayPush(pOut, pNode) != NULL;
}
816

817
// TS-6191
818
// Build the restricted dnode list used when grantCheckDualReplicaDnodes(pMnode) is true.
//   nDnodes:     initial capacity for the new array
//   dnodeList:   optional list of int32_t dnode ids to restrict to
//   ppDnodeList: receives the new SArray of SDnodeObj; it is not written when the grant check
//                is false or the allocation fails
// Returns 0, or terrno when taosArrayInit fails.
static int32_t mndBuildNodesCheckDualReplica(SMnode *pMnode, int32_t nDnodes, SArray *dnodeList, SArray **ppDnodeList) {
  int32_t code = 0;
  if (!grantCheckDualReplicaDnodes(pMnode)) {
    TAOS_RETURN(code);
  }

  SSdb   *pSdb = pMnode->pSdb;
  SArray *pNodes = taosArrayInit(nDnodes, sizeof(SDnodeObj));
  if (pNodes == NULL) {
    code = terrno;
    TAOS_RETURN(code);
  }
  *ppDnodeList = pNodes;

  sdbTraverse(pSdb, SDB_DNODE, mndResetDnodesArrayFp, NULL, NULL, NULL);
  sdbTraverse(pSdb, SDB_DNODE, mndBuildDnodesListFp, pNodes, NULL, NULL);

  int32_t total = taosArrayGetSize(pNodes);
  if (total <= 0) {
    TAOS_RETURN(code);
  }
  if (total > 1) taosArraySort(pNodes, (__compar_fn_t)mndCompareDnodeVnodes1);

  // No caller-supplied list: keep at most the first two dnodes of the sorted array.
  if (taosArrayGetSize(dnodeList) <= 0) {
    if (total > 2) taosArrayRemoveBatch(pNodes, 2, total - 2, NULL);
    TAOS_RETURN(code);
  }

  // Count the leading run of dnodes that already have vnodes.
  int32_t nWithVnodes = 0;
  while (nWithVnodes < total && ((SDnodeObj *)TARRAY_GET_ELEM(pNodes, nWithVnodes))->numOfVnodes > 0) {
    ++nWithVnodes;
  }

  int32_t firstId = -1;
  if (nWithVnodes == 1) {
    firstId = ((SDnodeObj *)TARRAY_GET_ELEM(pNodes, 0))->id;
  } else if (nWithVnodes >= 2) {
    // must select the dnodes from the 1st 2 dnodes
    taosArrayRemoveBatch(pNodes, 2, total - 2, NULL);
  }

  // Drop every dnode that is not in the caller-supplied list.
  int32_t pos = 0;
  while (pos < TARRAY_SIZE(pNodes)) {
    SDnodeObj *pCur = taosArrayGet(pNodes, pos);
    if (isDnodeInList(dnodeList, pCur->id)) {
      ++pos;
    } else {
      taosArrayRemove(pNodes, pos);
    }
  }

  if (nWithVnodes == 1) {
    SDnodeObj *pHead = taosArrayGet(pNodes, 0);
    if (pHead && (pHead->id != firstId)) {  // the first dnode is not in dnodeList, remove the last element
      taosArrayRemove(pNodes, taosArrayGetSize(pNodes) - 1);
    }
  }

  TAOS_RETURN(code);
}
876
#endif
877

878
// Collect the dnodes that may receive new vnodes into a freshly allocated SArray of SDnodeObj.
//   exceptDnodeId: id of a dnode to leave out
//   dnodeList:     optional list of int32_t dnode ids; ignored when empty
// Returns the array (the caller destroys it) or NULL on failure.
SArray *mndBuildDnodesArray(SMnode *pMnode, int32_t exceptDnodeId, SArray *dnodeList) {
  SSdb   *pSdb = pMnode->pSdb;
  int32_t nDnodes = mndGetDnodeSize(pMnode);
  SArray *pDualList = NULL;

  SArray *pResult = taosArrayInit(nDnodes, sizeof(SDnodeObj));
  if (pResult == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // An empty list is treated the same as no list at all.
  SArray *pFilter = (taosArrayGetSize(dnodeList) > 0) ? dnodeList : NULL;

#ifdef TD_ENTERPRISE
  if (0 != mndBuildNodesCheckDualReplica(pMnode, nDnodes, pFilter, &pDualList)) {
    taosArrayDestroy(pResult);
    return NULL;
  }
#endif

  sdbTraverse(pSdb, SDB_DNODE, mndResetDnodesArrayFp, NULL, NULL, NULL);
  // The list produced by the dual-replica check, when there is one, replaces the caller's filter.
  sdbTraverse(pSdb, SDB_DNODE, mndBuildDnodesArrayFp, pResult, &exceptDnodeId, pDualList ? pDualList : pFilter);

  mDebug("build %d dnodes array", (int32_t)taosArrayGetSize(pResult));
  int32_t nFound = (int32_t)taosArrayGetSize(pResult);
  for (int32_t k = 0; k < nFound; ++k) {
    SDnodeObj *pDnode = taosArrayGet(pResult, k);
    mDebug("dnode:%d, vnodes:%d others:%d", pDnode->id, pDnode->numOfVnodes, pDnode->numOfOtherNodes);
  }

  taosArrayDestroy(pDualList);
  return pResult;
}
909

910
// Three-way comparison of two dnode ids: returns -1, 0 or 1.
static int32_t mndCompareDnodeId(int32_t *dnode1Id, int32_t *dnode2Id) {
  int32_t lhs = *dnode1Id;
  int32_t rhs = *dnode2Id;
  return (lhs > rhs) - (lhs < rhs);
}
916

917
// Load score of a dnode: (vnodes + otherNodes * ratio + additionDnodes) / numOfSupportVnodes.
static float mndGetDnodeScore(SDnodeObj *pDnode, int32_t additionDnodes, float ratio) {
  float load = pDnode->numOfVnodes + (float)pDnode->numOfOtherNodes * ratio + additionDnodes;
  float score = load / pDnode->numOfSupportVnodes;
  return score;
}
921

922
// Comparator over SDnodeObj ordering by mndGetDnodeScore (ratio 0.9); equal scores compare as 0.
static int32_t mndCompareDnodeVnodes(SDnodeObj *pDnode1, SDnodeObj *pDnode2) {
  float lhs = mndGetDnodeScore(pDnode1, 0, 0.9);
  float rhs = mndGetDnodeScore(pDnode2, 0, 0.9);

  if (lhs > rhs) return 1;
  if (lhs == rhs) return 0;
  return -1;
}
930

931
// Sort pVgroup->vnodeGid[0 .. replica-1] in place by ascending dnodeId (bubble sort).
void mndSortVnodeGid(SVgObj *pVgroup) {
  // `end` is the last index still unsorted; each pass moves the largest remaining id there.
  for (int32_t end = pVgroup->replica - 1; end > 0; --end) {
    for (int32_t k = 0; k < end; ++k) {
      if (pVgroup->vnodeGid[k].dnodeId > pVgroup->vnodeGid[k + 1].dnodeId) {
        TSWAP(pVgroup->vnodeGid[k], pVgroup->vnodeGid[k + 1]);
      }
    }
  }
}
8,412✔
940

941
// Pick one dnode per replica of pVgroup from the candidate array.
// pArray is sorted in place by mndCompareDnodeVnodes and its first `replica` entries are used;
// their numOfVnodes / memUsed counters are bumped as vnodes are assigned. On success the chosen
// vnodeGid entries are sorted by dnode id and 0 is returned; otherwise one of
// TSDB_CODE_MND_NO_ENOUGH_DNODES / _VNODES / _MEM_IN_DNODE is returned.
static int32_t mndGetAvailableDnode(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, SArray *pArray) {
  mDebug("start to sort %d dnodes", (int32_t)taosArrayGetSize(pArray));
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);

  int32_t nCandidates = taosArrayGetSize(pArray);
  for (int32_t k = 0; k < nCandidates; ++k) {
    SDnodeObj *pDnode = taosArrayGet(pArray, k);
    mDebug("dnode:%d, score:%f", pDnode->id, mndGetDnodeScore(pDnode, 0, 0.9));
  }

  if (nCandidates < pVgroup->replica) {
    mError("db:%s, vgId:%d, no enough online dnodes:%d to alloc %d replica", pVgroup->dbName, pVgroup->vgId,
           nCandidates, pVgroup->replica);
    TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_DNODES);
  }

  for (int32_t v = 0; v < pVgroup->replica; ++v) {
    SVnodeGid *pVgid = &pVgroup->vnodeGid[v];
    SDnodeObj *pDnode = taosArrayGet(pArray, v);
    if (pDnode == NULL) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_DNODES);
    }
    if (pDnode->numOfVnodes >= pDnode->numOfSupportVnodes) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_VNODES);
    }

    // The dnode must keep a strictly positive amount of memory after hosting this vnode.
    int64_t vgMem = mndGetVgroupMemory(pMnode, pDb, pVgroup);
    if (pDnode->memAvail - vgMem - pDnode->memUsed <= 0) {
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d, avail:%" PRId64 " used:%" PRId64,
             pVgroup->dbName, pVgroup->vgId, vgMem, pDnode->id, pDnode->memAvail, pDnode->memUsed);
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE);
    }
    pDnode->memUsed += vgMem;

    pVgid->dnodeId = pDnode->id;
    // A single-replica vgroup starts as leader; every member of a multi-replica one starts as follower.
    pVgid->syncState = (pVgroup->replica == 1) ? TAOS_SYNC_STATE_LEADER : TAOS_SYNC_STATE_FOLLOWER;

    mInfo("db:%s, vgId:%d, vn:%d is alloced, memory:%" PRId64 ", dnode:%d avail:%" PRId64 " used:%" PRId64,
          pVgroup->dbName, pVgroup->vgId, v, vgMem, pVgid->dnodeId, pDnode->memAvail, pDnode->memUsed);
    pDnode->numOfVnodes++;
  }

  mndSortVnodeGid(pVgroup);
  return 0;
}
990

991
// Initialize *pVgroup as a new single-replica TSMA vgroup of pDb and place it on a dnode.
// Returns 0 on success. Returns terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno is 0)
// if the candidate dnode array cannot be built, and -1 if no dnode can host the vnode
// (the -1 is kept for existing callers).
int32_t mndAllocSmaVgroup(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup) {
  int32_t code = 0;
  SArray *pArray = mndBuildDnodesArray(pMnode, 0, NULL);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  pVgroup->vgId = sdbGetMaxId(pMnode->pSdb, SDB_VGROUP);
  pVgroup->isTsma = 1;
  pVgroup->createdTime = taosGetTimestampMs();
  pVgroup->updateTime = pVgroup->createdTime;
  pVgroup->version = 1;
  memcpy(pVgroup->dbName, pDb->name, TSDB_DB_FNAME_LEN);
  pVgroup->dbUid = pDb->uid;
  pVgroup->replica = 1;

  // The candidate array is only needed for the placement itself; destroy it on both outcomes
  // (the failure path previously returned without destroying it).
  int32_t allocCode = mndGetAvailableDnode(pMnode, pDb, pVgroup, pArray);
  taosArrayDestroy(pArray);
  if (allocCode != 0) return -1;

  mInfo("db:%s, sma vgId:%d is alloced", pDb->name, pVgroup->vgId);
  return 0;
}
1015

1016
// Allocate and initialize the pDb->cfg.numOfVgroups vgroups of a database.
//   dnodeList: optional list of int32_t dnode ids restricting where vnodes may be placed
//   ppVgroups: receives the calloc'ed SVgObj array on success (ownership passes to the caller);
//              it is not written on failure
// The uint32 hash space [0, UINT32_MAX] is split into equal intervals, the last vgroup taking
// the remainder. Returns 0 on success or an error code.
int32_t mndAllocVgroup(SMnode *pMnode, SDbObj *pDb, SVgObj **ppVgroups, SArray *dnodeList) {
  int32_t code = -1;
  SArray *pArray = NULL;
  SVgObj *pVgroups = NULL;

  pVgroups = taosMemoryCalloc(pDb->cfg.numOfVgroups, sizeof(SVgObj));
  if (pVgroups == NULL) {
    code = terrno;
    goto _OVER;
  }

  pArray = mndBuildDnodesArray(pMnode, 0, dnodeList);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  mInfo("db:%s, total %d dnodes used to create %d vgroups (%d vnodes)", pDb->name, (int32_t)taosArrayGetSize(pArray),
        pDb->cfg.numOfVgroups, pDb->cfg.numOfVgroups * pDb->cfg.replications);

  int32_t  maxVgId = sdbGetMaxId(pMnode->pSdb, SDB_VGROUP);
  uint32_t hashMin = 0;
  uint32_t hashMax = UINT32_MAX;
  // NOTE(review): assumes cfg.numOfVgroups > 0 (validated by the caller?) - confirm.
  uint32_t hashInterval = (hashMax - hashMin) / pDb->cfg.numOfVgroups;

  if (maxVgId < 2) maxVgId = 2;

  for (uint32_t v = 0; v < pDb->cfg.numOfVgroups; v++) {
    SVgObj *pVgroup = &pVgroups[v];
    pVgroup->vgId = maxVgId++;
    pVgroup->createdTime = taosGetTimestampMs();
    // Use this vgroup's own creation time (previously read from the first element of the array).
    pVgroup->updateTime = pVgroup->createdTime;
    pVgroup->version = 1;
    pVgroup->hashBegin = hashMin + hashInterval * v;
    if (v == pDb->cfg.numOfVgroups - 1) {
      // The last vgroup absorbs the remainder of the integer division.
      pVgroup->hashEnd = hashMax;
    } else {
      pVgroup->hashEnd = hashMin + hashInterval * (v + 1) - 1;
    }

    memcpy(pVgroup->dbName, pDb->name, TSDB_DB_FNAME_LEN);
    pVgroup->dbUid = pDb->uid;
    pVgroup->replica = pDb->cfg.replications;

    if ((code = mndGetAvailableDnode(pMnode, pDb, pVgroup, pArray)) != 0) {
      goto _OVER;
    }
  }

  *ppVgroups = pVgroups;
  code = 0;

  mInfo("db:%s, total %d vgroups is alloced, replica:%d", pDb->name, pDb->cfg.numOfVgroups, pDb->cfg.replications);

_OVER:
  if (code != 0) taosMemoryFree(pVgroups);
  taosArrayDestroy(pArray);
  TAOS_RETURN(code);
}
1079

1080
// Build the endpoint set of a vgroup from the fqdn/port of each replica's dnode.
// Replicas whose dnode cannot be acquired are skipped. inUse is set to the slot of a replica
// whose sync state is LEADER or ASSIGNED_LEADER. The set is passed through epsetSort before return.
SEpSet mndGetVgroupEpset(SMnode *pMnode, const SVgObj *pVgroup) {
  SEpSet result = {0};

  for (int32_t idx = 0; idx < pVgroup->replica; ++idx) {
    const SVnodeGid *pGid = &pVgroup->vnodeGid[idx];
    SDnodeObj       *pNode = mndAcquireDnode(pMnode, pGid->dnodeId);
    if (pNode != NULL) {
      bool leads = (pGid->syncState == TAOS_SYNC_STATE_LEADER) || (pGid->syncState == TAOS_SYNC_STATE_ASSIGNED_LEADER);
      // Recorded before the endpoint is appended, so numOfEps is the slot it is about to take.
      if (leads) result.inUse = result.numOfEps;

      if (addEpIntoEpSet(&result, pNode->fqdn, pNode->port) != 0) {
        mWarn("vgId:%d, failed to add ep:%s:%d into epset", pVgroup->vgId, pNode->fqdn, pNode->port);
      }
      mndReleaseDnode(pMnode, pNode);
    }
  }

  epsetSort(&result);
  return result;
}
1101

1102
// Look up a vgroup by id and build its endpoint set from the fqdn/port of each replica's dnode.
// Returns a zeroed set when the vgroup cannot be acquired; replicas whose dnode cannot be
// acquired are skipped.
// NOTE(review): unlike mndGetVgroupEpset this does not call epsetSort - confirm that is intended.
SEpSet mndGetVgroupEpsetById(SMnode *pMnode, int32_t vgId) {
  SEpSet result = {0};

  SVgObj *pVg = mndAcquireVgroup(pMnode, vgId);
  if (pVg == NULL) return result;

  for (int32_t idx = 0; idx < pVg->replica; ++idx) {
    const SVnodeGid *pGid = &pVg->vnodeGid[idx];
    SDnodeObj       *pNode = mndAcquireDnode(pMnode, pGid->dnodeId);
    if (pNode != NULL) {
      bool leads = (pGid->syncState == TAOS_SYNC_STATE_LEADER) || (pGid->syncState == TAOS_SYNC_STATE_ASSIGNED_LEADER);
      // Recorded before the endpoint is appended, so numOfEps is the slot it is about to take.
      if (leads) result.inUse = result.numOfEps;

      if (addEpIntoEpSet(&result, pNode->fqdn, pNode->port) != 0) {
        mWarn("vgId:%d, failed to add ep:%s:%d into epset", pVg->vgId, pNode->fqdn, pNode->port);
      }
      mndReleaseDnode(pMnode, pNode);
    }
  }

  mndReleaseVgroup(pMnode, pVg);
  return result;
}
1126

1127
// Show-retrieve callback that writes one row per vgroup into pBlock, at most `rows` rows per call.
// When pShow->db is non-empty only vgroups of that database are emitted; if that database cannot
// be acquired, 0 rows are returned.
// Columns are written in this order: vgId, db name, numOfTables, then four
// (dnodeId, role, applied/committed index) triples - NULL for slots beyond the replica count -
// followed by cacheUsage, numOfCachedTables, isTsma and mountVgId.
// Returns the number of rows written, or an error code on failure.
static int32_t mndRetrieveVgroups(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows) {
  SMnode *pMnode = pReq->info.node;
  SSdb   *pSdb = pMnode->pSdb;
  int32_t numOfRows = 0;
  SVgObj *pVgroup = NULL;
  int32_t cols = 0;
  int64_t curMs = taosGetTimestampMs();
  int32_t code = 0, lino = 0;

  SDbObj *pDb = NULL;
  if (strlen(pShow->db) > 0) {
    pDb = mndAcquireDb(pMnode, pShow->db);
    if (pDb == NULL) {
      return 0;
    }
  }

  while (numOfRows < rows) {
    pShow->pIter = sdbFetch(pSdb, SDB_VGROUP, pShow->pIter, (void **)&pVgroup);
    if (pShow->pIter == NULL) break;

    if (pDb != NULL && pVgroup->dbUid != pDb->uid) {
      sdbRelease(pSdb, pVgroup);
      continue;
    }

    cols = 0;
    SColumnInfoData *pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)&pVgroup->vgId, false, pVgroup, pShow->pIter, _OVER);

    SName name = {0};
    char  db[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
    code = tNameFromString(&name, pVgroup->dbName, T_NAME_ACCT | T_NAME_DB);
    if (code != 0) {
      mError("vgId:%d, failed to set dbName, since %s", pVgroup->vgId, tstrerror(code));
      sdbRelease(pSdb, pVgroup);
      sdbCancelFetch(pSdb, pShow->pIter);
      // Leave through _OVER so the database reference acquired above is released as well.
      lino = __LINE__;
      goto _OVER;
    }
    (void)tNameGetDbName(&name, varDataVal(db));
    varDataSetLen(db, strlen(varDataVal(db)));

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)db, false, pVgroup, pShow->pIter, _OVER);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)&pVgroup->numOfTables, false, pVgroup, pShow->pIter, _OVER);

    // default 3 replica, add 1 replica if move vnode
    for (int32_t i = 0; i < 4; ++i) {
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      if (i < pVgroup->replica) {
        int16_t dnodeId = (int16_t)pVgroup->vnodeGid[i].dnodeId;
        COL_DATA_SET_VAL_GOTO((const char *)&dnodeId, false, pVgroup, pShow->pIter, _OVER);

        bool       exist = false;
        bool       online = false;
        SDnodeObj *pDnode = mndAcquireDnode(pMnode, pVgroup->vnodeGid[i].dnodeId);
        if (pDnode != NULL) {
          exist = true;
          online = mndIsDnodeOnline(pDnode, curMs);
          mndReleaseDnode(pMnode, pDnode);
        }

        // Role text: "dropping" when the dnode no longer exists, "offline" when it is not online,
        // otherwise the sync state name with an optional star suffix for leaders.
        char buf1[20] = {0};
        char role[20] = "offline";
        if (!exist) {
          tstrncpy(role, "dropping", sizeof(role));
        } else if (online) {
          const char *star = "";
          if (pVgroup->vnodeGid[i].syncState == TAOS_SYNC_STATE_LEADER ||
              pVgroup->vnodeGid[i].syncState == TAOS_SYNC_STATE_ASSIGNED_LEADER) {
            // "**": neither restored nor readable; "*": not restored but readable.
            if (!pVgroup->vnodeGid[i].syncRestore && !pVgroup->vnodeGid[i].syncCanRead) {
              star = "**";
            } else if (!pVgroup->vnodeGid[i].syncRestore && pVgroup->vnodeGid[i].syncCanRead) {
              star = "*";
            }
          }
          snprintf(role, sizeof(role), "%s%s", syncStr(pVgroup->vnodeGid[i].syncState), star);
        }
        STR_WITH_MAXSIZE_TO_VARSTR(buf1, role, pShow->pMeta->pSchemas[cols].bytes);

        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        COL_DATA_SET_VAL_GOTO((const char *)buf1, false, pVgroup, pShow->pIter, _OVER);

        char applyStr[TSDB_SYNC_APPLY_COMMIT_LEN + 1] = {0};
        char buf[TSDB_SYNC_APPLY_COMMIT_LEN + VARSTR_HEADER_SIZE + 1] = {0};
        snprintf(applyStr, sizeof(applyStr), "%" PRId64 "/%" PRId64, pVgroup->vnodeGid[i].syncAppliedIndex,
                 pVgroup->vnodeGid[i].syncCommitIndex);
        STR_WITH_MAXSIZE_TO_VARSTR(buf, applyStr, pShow->pMeta->pSchemas[cols].bytes);

        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        COL_DATA_SET_VAL_GOTO((const char *)&buf, false, pVgroup, pShow->pIter, _OVER);
      } else {
        // Unused replica slot: all three of its columns are NULL.
        colDataSetNULL(pColInfo, numOfRows);
        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        colDataSetNULL(pColInfo, numOfRows);
        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        colDataSetNULL(pColInfo, numOfRows);
      }
    }

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    int32_t cacheUsage = (int32_t)pVgroup->cacheUsage;
    COL_DATA_SET_VAL_GOTO((const char *)&cacheUsage, false, pVgroup, pShow->pIter, _OVER);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)&pVgroup->numOfCachedTables, false, pVgroup, pShow->pIter, _OVER);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)&pVgroup->isTsma, false, pVgroup, pShow->pIter, _OVER);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)&pVgroup->mountVgId, false, pVgroup, pShow->pIter, _OVER);

    numOfRows++;
    sdbRelease(pSdb, pVgroup);
  }

_OVER:
  if (pDb != NULL) {
    mndReleaseDb(pMnode, pDb);
  }
  if (code != 0) {
    mError("failed to retrieve vgroup info at line %d since %s", lino, tstrerror(code));
    TAOS_RETURN(code);
  }

  pShow->numOfRows += numOfRows;
  return numOfRows;
}
1281

1282
// Cancel an in-progress SDB_VGROUP fetch identified by pIter.
static void mndCancelGetNextVgroup(SMnode *pMnode, void *pIter) {
  sdbCancelFetchByType(pMnode->pSdb, pIter, SDB_VGROUP);
}
×
1286

1287
// sdbTraverse callback: add to *(int32_t *)p2 the number of replicas of the visited vgroup
// that live on the dnode whose id is *(int32_t *)p1. Always returns true.
static bool mndGetVnodesNumFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SVgObj  *pVg = pObj;
  int32_t  wantedId = *(int32_t *)p1;
  int32_t *pCount = (int32_t *)p2;

  int32_t idx = 0;
  while (idx < pVg->replica) {
    if (pVg->vnodeGid[idx].dnodeId == wantedId) {
      *pCount += 1;
    }
    ++idx;
  }
  return true;
}
1300

1301
// Count the vnodes placed on dnode `dnodeId` by traversing every vgroup in the sdb.
int32_t mndGetVnodesNum(SMnode *pMnode, int32_t dnodeId) {
  int32_t count = 0;
  sdbTraverse(pMnode->pSdb, SDB_VGROUP, mndGetVnodesNumFp, &dnodeId, &count, NULL);
  return count;
}
1306

1307
// Memory figure for one vnode of pVgroup, derived from its database configuration:
//   cfg.buffer * 1024 * 1024 + cfg.pages * cfg.pageSize * 1024
//   (+ cfg.cacheLastSize * 1024 * 1024 when cfg.cacheLast > 0).
// When pDbInput is NULL the database is acquired by pVgroup->dbName and released before
// returning. Returns 0 if no database object is available.
int64_t mndGetVgroupMemory(SMnode *pMnode, SDbObj *pDbInput, SVgObj *pVgroup) {
  bool    acquiredHere = (pDbInput == NULL);
  SDbObj *pDb = acquiredHere ? mndAcquireDb(pMnode, pVgroup->dbName) : pDbInput;
  int64_t total = 0;

  if (pDb != NULL) {
    int64_t buffer = (int64_t)pDb->cfg.buffer * 1024 * 1024;
    int64_t cache = (int64_t)pDb->cfg.pages * pDb->cfg.pageSize * 1024;
    int64_t cacheLast = (int64_t)pDb->cfg.cacheLastSize * 1024 * 1024;

    total = buffer + cache;
    if (pDb->cfg.cacheLast > 0) total += cacheLast;

    mDebug("db:%s, vgroup:%d, buffer:%" PRId64 " cache:%" PRId64 " cacheLast:%" PRId64, pDb->name, pVgroup->vgId,
           buffer, cache, cacheLast);
  }

  if (acquiredHere) {
    mndReleaseDb(pMnode, pDb);
  }
  return total;
}
1331

1332
// sdbTraverse callback: for each replica of the visited vgroup that lives on the dnode whose id
// is *(int32_t *)p1, add mndGetVgroupMemory() of that vgroup to *(int64_t *)p2. Always returns true.
static bool mndGetVnodeMemroyFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SVgObj  *pVg = pObj;
  int32_t  wantedId = *(int32_t *)p1;
  int64_t *pTotal = (int64_t *)p2;

  int32_t idx = 0;
  while (idx < pVg->replica) {
    if (pVg->vnodeGid[idx].dnodeId == wantedId) {
      *pTotal += mndGetVgroupMemory(pMnode, NULL, pVg);
    }
    ++idx;
  }
  return true;
}
1345

1346
// Sum mndGetVgroupMemory() over every vnode placed on dnode `dnodeId`.
int64_t mndGetVnodesMemory(SMnode *pMnode, int32_t dnodeId) {
  int64_t total = 0;
  sdbTraverse(pMnode->pSdb, SDB_VGROUP, mndGetVnodeMemroyFp, &dnodeId, &total, NULL);
  return total;
}
1351

1352
// Format the estimated time needed to apply `applyCount` entries at `rate` as "h:m:s".
//   rate:           entries applied per millisecond (applyCount / rate is divided by 1000 to get seconds)
//   restoreStr:     output buffer, always NUL-terminated by snprintf when restoreStrSize > 0
//   restoreStrSize: size of restoreStr in bytes
// A rate that is zero, negative or NaN yields "0:0:0" because no estimate can be made.
// An estimate too large for int64_t is saturated instead of being converted out of range.
void calculateRstoreFinishTime(double rate, int64_t applyCount, char *restoreStr, size_t restoreStrSize) {
  // !(rate > 0) is also true for NaN.
  if (!(rate > 0)) {
    snprintf(restoreStr, restoreStrSize, "0:0:0");
    return;
  }

  // Converting a double outside the int64_t range is undefined behavior, so clamp first.
  // (double)INT64_MAX rounds up to 2^63, hence the >= comparison.
  double  estimateMs = applyCount / rate;
  int64_t costTime = 0;
  if (estimateMs >= (double)INT64_MAX) {
    costTime = INT64_MAX;
  } else if (estimateMs < (double)INT64_MIN) {
    costTime = INT64_MIN;
  } else {
    costTime = (int64_t)estimateMs;
  }

  int64_t totalSeconds = costTime / 1000;
  int64_t hours = totalSeconds / 3600;
  totalSeconds %= 3600;
  int64_t minutes = totalSeconds / 60;
  int64_t seconds = totalSeconds % 60;
  snprintf(restoreStr, restoreStrSize, "%" PRId64 ":%" PRId64 ":%" PRId64, hours, minutes, seconds);
}
1366

1367
// Show-retrieve callback that writes one row per vnode (one per replica of every vgroup) into pBlock.
// Columns are written in this order: dnodeId, vgId, db name, sync state, roleTimeMs, startTimeMs,
// syncRestore, estimated restore finish time, unapplied count, bufferSegmentUsed, bufferSegmentSize.
// A new vgroup is only fetched while numOfRows < rows - TSDB_MAX_REPLICA.
// Returns the number of rows written, or the error code of the failing colDataSetVal. On error the
// vgroup and dnode references are released and the fetch is cancelled before returning.
static int32_t mndRetrieveVnodes(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows) {
  SMnode    *pMnode = pReq->info.node;
  SSdb      *pSdb = pMnode->pSdb;
  int32_t    numOfRows = 0;
  SVgObj    *pVgroup = NULL;
  SDnodeObj *pDnode = NULL;  // function scope so the error path can release it
  int32_t    cols = 0;
  int64_t    curMs = taosGetTimestampMs();
  int32_t    code = 0;

  while (numOfRows < rows - TSDB_MAX_REPLICA) {
    pShow->pIter = sdbFetch(pSdb, SDB_VGROUP, pShow->pIter, (void **)&pVgroup);
    if (pShow->pIter == NULL) break;

    for (int32_t i = 0; i < pVgroup->replica && numOfRows < rows; ++i) {
      SVnodeGid       *pGid = &pVgroup->vnodeGid[i];
      SColumnInfoData *pColInfo = NULL;
      cols = 0;

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->dnodeId, false);
      if (code != 0) {
        mError("vgId:%d, failed to set dnodeId, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pVgroup->vgId, false);
      if (code != 0) {
        mError("vgId:%d, failed to set vgId, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      // db_name
      const char *dbname = mndGetDbStr(pVgroup->dbName);
      char        b1[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
      if (dbname != NULL) {
        STR_WITH_MAXSIZE_TO_VARSTR(b1, dbname, TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE);
      } else {
        STR_WITH_MAXSIZE_TO_VARSTR(b1, "NULL", TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE);
      }
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)b1, false);
      if (code != 0) {
        mError("vgId:%d, failed to set dbName, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      // dnode is online?
      pDnode = mndAcquireDnode(pMnode, pGid->dnodeId);
      if (pDnode == NULL) {
        // Stop with this vgroup; numOfRows was not advanced, so the next row written reuses this index.
        mError("failed to acquire dnode. dnodeId:%d", pGid->dnodeId);
        break;
      }
      bool isDnodeOnline = mndIsDnodeOnline(pDnode, curMs);

      // NOTE(review): buf is 20 bytes and is reused below for the restore string, which can hold
      // up to 19 characters; confirm STR_TO_VARSTR's length header always fits.
      char       buf[20] = {0};
      ESyncState syncState = (isDnodeOnline) ? pGid->syncState : TAOS_SYNC_STATE_OFFLINE;
      STR_TO_VARSTR(buf, syncStr(syncState));
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)buf, false);
      if (code != 0) {
        mError("vgId:%d, failed to set syncState, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      int64_t roleTimeMs = (isDnodeOnline) ? pGid->roleTimeMs : 0;
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&roleTimeMs, false);
      if (code != 0) {
        mError("vgId:%d, failed to set roleTimeMs, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      int64_t startTimeMs = (isDnodeOnline) ? pGid->startTimeMs : 0;
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&startTimeMs, false);
      if (code != 0) {
        mError("vgId:%d, failed to set startTimeMs, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->syncRestore, false);
      if (code != 0) {
        mError("vgId:%d, failed to set syncRestore, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      // The estimate is only computed when there is something left to apply; otherwise it stays empty.
      int64_t unappliedCount = pGid->syncCommitIndex - pGid->syncAppliedIndex;
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      char restoreStr[20] = {0};
      if (unappliedCount > 0) {
        calculateRstoreFinishTime(pGid->appliedRate, unappliedCount, restoreStr, sizeof(restoreStr));
      }
      STR_TO_VARSTR(buf, restoreStr);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&buf, false);
      if (code != 0) {
        mError("vgId:%d, failed to set syncRestore finish time, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&unappliedCount, false);
      if (code != 0) {
        mError("vgId:%d, failed to set syncRestore, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->bufferSegmentUsed, false);
      if (code != 0) {
        mError("vgId:%d, failed to set buffer segment used, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->bufferSegmentSize, false);
      if (code != 0) {
        mError("vgId:%d, failed to set buffer segment size, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      numOfRows++;
      sdbRelease(pSdb, pDnode);
      pDnode = NULL;
    }

    sdbRelease(pSdb, pVgroup);
  }

  pShow->numOfRows += numOfRows;
  return numOfRows;

_ERR:
  // Only reached from inside the row loop, so pVgroup and pShow->pIter are valid here.
  // pDnode is non-NULL only when the failure happened after it was acquired.
  if (pDnode != NULL) {
    sdbRelease(pSdb, pDnode);
  }
  sdbRelease(pSdb, pVgroup);
  sdbCancelFetch(pSdb, pShow->pIter);
  return code;
}
1498

1499
/* Cancel an in-progress SDB_VGROUP fetch, identified by pIter, on this mnode's sdb. */
static void mndCancelGetNextVnode(SMnode *pMnode, void *pIter) {
  sdbCancelFetchByType(pMnode->pSdb, pIter, SDB_VGROUP);
}
×
1503

1504
/*
 * Add one more replica to pVgroup, hosted on a dnode taken from pArray.
 *
 * pArray is sorted in place with mndCompareDnodeVnodes and scanned from the
 * front. Dnodes that already host a replica of this vgroup are skipped; the
 * first remaining dnode is the only candidate considered. If that candidate
 * has no free vnode slot or not enough memory, the function fails instead of
 * trying the next dnode.
 *
 * On success the new SVnodeGid slot is filled in, pVgroup->replica and the
 * dnode's numOfVnodes/memUsed are increased, and the encoded vgroup is
 * appended to the transaction's group redo log. These in-memory changes are
 * not rolled back when encoding or appending fails afterwards.
 *
 * Returns 0 on success, otherwise an error code such as
 * TSDB_CODE_MND_NO_ENOUGH_DNODES, TSDB_CODE_MND_NO_ENOUGH_VNODES or
 * TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE.
 */
static int32_t mndAddVnodeToVgroup(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, SArray *pArray) {
  int32_t code = 0;
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
  for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
    SDnodeObj *pDnode = taosArrayGet(pArray, i);
    mInfo("trans:%d, dnode:%d, equivalent vnodes:%d others:%d", pTrans->id, pDnode->id, pDnode->numOfVnodes,
          pDnode->numOfOtherNodes);
  }

  // Slot that the new replica will occupy (first unused entry).
  SVnodeGid *pVgid = &pVgroup->vnodeGid[pVgroup->replica];
  for (int32_t d = 0; d < taosArrayGetSize(pArray); ++d) {
    SDnodeObj *pDnode = taosArrayGet(pArray, d);
    // Validate the element before it is dereferenced by the lookup below.
    if (pDnode == NULL) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_DNODES);
    }

    // Skip dnodes that already host one of this vgroup's replicas.
    bool used = false;
    for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
      if (pDnode->id == pVgroup->vnodeGid[vn].dnodeId) {
        used = true;
        break;
      }
    }
    if (used) continue;

    if (pDnode->numOfVnodes >= pDnode->numOfSupportVnodes) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_VNODES);
    }

    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
    if (pDnode->memAvail - vgMem - pDnode->memUsed <= 0) {
      mError("trans:%d, db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
             pTrans->id, pVgroup->dbName, pVgroup->vgId, vgMem, pDnode->id, pDnode->memAvail, pDnode->memUsed);
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE);
    } else {
      pDnode->memUsed += vgMem;
    }

    pVgid->dnodeId = pDnode->id;
    pVgid->syncState = TAOS_SYNC_STATE_OFFLINE;
    mInfo("trans:%d, db:%s, vgId:%d, vn:%d is added, memory:%" PRId64 ", dnode:%d avail:%" PRId64 " used:%" PRId64,
          pTrans->id, pVgroup->dbName, pVgroup->vgId, pVgroup->replica, vgMem, pVgid->dnodeId, pDnode->memAvail,
          pDnode->memUsed);

    pVgroup->replica++;
    pDnode->numOfVnodes++;

    SSdbRaw *pVgRaw = mndVgroupActionEncode(pVgroup);
    if (pVgRaw == NULL) {
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
      if (terrno != 0) code = terrno;
      TAOS_RETURN(code);
    }
    if ((code = mndTransAppendGroupRedolog(pTrans, pVgRaw, pVgroup->vgId)) != 0) {
      sdbFreeRaw(pVgRaw);
      TAOS_RETURN(code);
    }
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
    if (code != 0) {
      mError("trans:%d, vgId:%d, failed to set raw status since %s at line:%d", pTrans->id, pVgroup->vgId,
             tstrerror(code), __LINE__);
    }
    // Only the first eligible dnode is ever tried; return its outcome.
    TAOS_RETURN(code);
  }

  // Every dnode in pArray already hosts a replica of this vgroup.
  code = TSDB_CODE_MND_NO_ENOUGH_DNODES;
  mError("trans:%d, db:%s, failed to add vnode to vgId:%d since %s", pTrans->id, pVgroup->dbName, pVgroup->vgId,
         tstrerror(code));
  TAOS_RETURN(code);
}
1574

1575
static int32_t mndRemoveVnodeFromVgroup(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, SArray *pArray,
40✔
1576
                                        SVnodeGid *pDelVgid) {
1577
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
40✔
1578
  for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
149✔
1579
    SDnodeObj *pDnode = taosArrayGet(pArray, i);
109✔
1580
    mInfo("trans:%d, dnode:%d, equivalent vnodes:%d others:%d", pTrans->id, pDnode->id, pDnode->numOfVnodes,
109!
1581
          pDnode->numOfOtherNodes);
1582
  }
1583

1584
  int32_t code = -1;
40✔
1585
  for (int32_t d = taosArrayGetSize(pArray) - 1; d >= 0; --d) {
41!
1586
    SDnodeObj *pDnode = taosArrayGet(pArray, d);
41✔
1587

1588
    for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
73✔
1589
      SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
72✔
1590
      if (pVgid->dnodeId == pDnode->id) {
72✔
1591
        int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
40✔
1592
        pDnode->memUsed -= vgMem;
40✔
1593
        mInfo("trans:%d, db:%s, vgId:%d, vn:%d is removed, memory:%" PRId64 ", dnode:%d avail:%" PRId64
40!
1594
              " used:%" PRId64,
1595
              pTrans->id, pVgroup->dbName, pVgroup->vgId, vn, vgMem, pVgid->dnodeId, pDnode->memAvail, pDnode->memUsed);
1596
        pDnode->numOfVnodes--;
40✔
1597
        pVgroup->replica--;
40✔
1598
        *pDelVgid = *pVgid;
40✔
1599
        *pVgid = pVgroup->vnodeGid[pVgroup->replica];
40✔
1600
        memset(&pVgroup->vnodeGid[pVgroup->replica], 0, sizeof(SVnodeGid));
40✔
1601
        code = 0;
40✔
1602
        goto _OVER;
40✔
1603
      }
1604
    }
1605
  }
1606

1607
_OVER:
×
1608
  if (code != 0) {
40!
1609
    code = TSDB_CODE_APP_ERROR;
×
1610
    mError("trans:%d, db:%s, failed to remove vnode from vgId:%d since %s", pTrans->id, pVgroup->dbName, pVgroup->vgId,
×
1611
           tstrerror(code));
1612
    TAOS_RETURN(code);
×
1613
  }
1614

1615
  for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
116✔
1616
    SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
76✔
1617
    mInfo("trans:%d, db:%s, vgId:%d, vn:%d dnode:%d is reserved", pTrans->id, pVgroup->dbName, pVgroup->vgId, vn,
76!
1618
          pVgid->dnodeId);
1619
  }
1620

1621
  SSdbRaw *pVgRaw = mndVgroupActionEncode(pVgroup);
40✔
1622
  if (pVgRaw == NULL) {
40!
1623
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
1624
    if (terrno != 0) code = terrno;
×
1625
    TAOS_RETURN(code);
×
1626
  }
1627
  if (mndTransAppendGroupRedolog(pTrans, pVgRaw, pVgroup->vgId) != 0) {
40!
1628
    sdbFreeRaw(pVgRaw);
×
1629
    TAOS_RETURN(code);
×
1630
  }
1631
  code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
40✔
1632
  if (code != 0) {
40!
1633
    mError("trans:%d, vgId:%d, failed to set raw status since %s at line:%d", pTrans->id, pVgroup->vgId,
×
1634
           tstrerror(code), __LINE__);
1635
  }
1636

1637
  TAOS_RETURN(code);
40✔
1638
}
1639

1640
static int32_t mndRemoveVnodeFromVgroupWithoutSave(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, SArray *pArray,
×
1641
                                                   SVnodeGid *pDelVgid) {
1642
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
×
1643
  for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
×
1644
    SDnodeObj *pDnode = taosArrayGet(pArray, i);
×
1645
    mInfo("dnode:%d, equivalent vnodes:%d others:%d", pDnode->id, pDnode->numOfVnodes, pDnode->numOfOtherNodes);
×
1646
  }
1647

1648
  int32_t code = -1;
×
1649
  for (int32_t d = taosArrayGetSize(pArray) - 1; d >= 0; --d) {
×
1650
    SDnodeObj *pDnode = taosArrayGet(pArray, d);
×
1651

1652
    for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
×
1653
      SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
×
1654
      if (pVgid->dnodeId == pDnode->id) {
×
1655
        int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
×
1656
        pDnode->memUsed -= vgMem;
×
1657
        mInfo("db:%s, vgId:%d, vn:%d is removed, memory:%" PRId64 ", dnode:%d avail:%" PRId64 " used:%" PRId64,
×
1658
              pVgroup->dbName, pVgroup->vgId, vn, vgMem, pVgid->dnodeId, pDnode->memAvail, pDnode->memUsed);
1659
        pDnode->numOfVnodes--;
×
1660
        pVgroup->replica--;
×
1661
        *pDelVgid = *pVgid;
×
1662
        *pVgid = pVgroup->vnodeGid[pVgroup->replica];
×
1663
        memset(&pVgroup->vnodeGid[pVgroup->replica], 0, sizeof(SVnodeGid));
×
1664
        code = 0;
×
1665
        goto _OVER;
×
1666
      }
1667
    }
1668
  }
1669

1670
_OVER:
×
1671
  if (code != 0) {
×
1672
    code = TSDB_CODE_APP_ERROR;
×
1673
    mError("db:%s, failed to remove vnode from vgId:%d since %s", pVgroup->dbName, pVgroup->vgId, tstrerror(code));
×
1674
    TAOS_RETURN(code);
×
1675
  }
1676

1677
  for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
×
1678
    SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
×
1679
    mInfo("db:%s, vgId:%d, vn:%d dnode:%d is reserved", pVgroup->dbName, pVgroup->vgId, vn, pVgid->dnodeId);
×
1680
  }
1681

1682
  TAOS_RETURN(code);
×
1683
}
1684

1685
/*
 * Append a TDMT_DND_CREATE_VNODE redo action to pTrans, addressed to the dnode
 * referenced by pVgid->dnodeId. TSDB_CODE_VND_ALREADY_EXIST is registered as
 * an acceptable reply code.
 *
 * Returns 0 on success. When the dnode cannot be acquired or the request
 * cannot be built, returns terrno if it is set, otherwise
 * TSDB_CODE_MND_RETURN_VALUE_NULL (same convention as the sibling
 * mndAdd*Action functions); otherwise returns the append error.
 */
int32_t mndAddCreateVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, SVnodeGid *pVgid) {
  int32_t      code = 0;
  STransAction action = {0};

  SDnodeObj *pDnode = mndAcquireDnode(pMnode, pVgid->dnodeId);
  if (pDnode == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }
  action.epSet = mndGetDnodeEpset(pDnode);

  // The request builder receives pDnode, so the reference is held until the
  // builder has returned instead of being released beforehand.
  int32_t contLen = 0;
  void   *pReq = mndBuildCreateVnodeReq(pMnode, pDnode, pDb, pVgroup, &contLen);
  if (pReq == NULL) {
    // Capture the failure reason before the release call below runs.
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
  }
  mndReleaseDnode(pMnode, pDnode);
  if (pReq == NULL) {
    TAOS_RETURN(code);
  }

  action.pCont = pReq;
  action.contLen = contLen;
  action.msgType = TDMT_DND_CREATE_VNODE;
  action.acceptableCode = TSDB_CODE_VND_ALREADY_EXIST;
  action.groupId = pVgroup->vgId;

  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
    taosMemoryFree(pReq);
    TAOS_RETURN(code);
  }

  TAOS_RETURN(code);
}
1711

1712
int32_t mndRestoreAddCreateVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
10✔
1713
                                       SDnodeObj *pDnode) {
1714
  int32_t      code = 0;
10✔
1715
  STransAction action = {0};
10✔
1716

1717
  action.epSet = mndGetDnodeEpset(pDnode);
10✔
1718

1719
  int32_t contLen = 0;
10✔
1720
  void   *pReq = mndBuildCreateVnodeReq(pMnode, pDnode, pDb, pVgroup, &contLen);
10✔
1721
  if (pReq == NULL) {
10!
1722
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
1723
    if (terrno != 0) code = terrno;
×
1724
    TAOS_RETURN(code);
×
1725
  }
1726

1727
  action.pCont = pReq;
10✔
1728
  action.contLen = contLen;
10✔
1729
  action.msgType = TDMT_DND_CREATE_VNODE;
10✔
1730
  action.acceptableCode = TSDB_CODE_VND_ALREADY_EXIST;
10✔
1731
  action.groupId = pVgroup->vgId;
10✔
1732

1733
  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
10!
1734
    taosMemoryFree(pReq);
×
1735
    TAOS_RETURN(code);
×
1736
  }
1737

1738
  TAOS_RETURN(code);
10✔
1739
}
1740

1741
/*
 * Append a TDMT_VND_ALTER_CONFIRM redo action for pVgroup to pTrans. The
 * message consists of a bare SMsgHead (length and vgId in network byte order)
 * and is addressed to the vgroup's endpoint set. pDb is not used.
 *
 * Returns 0 on success, terrno if the header cannot be allocated, otherwise
 * the append error.
 */
int32_t mndAddAlterVnodeConfirmAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup) {
  STransAction action = {
      .msgType = TDMT_VND_ALTER_CONFIRM,
      // An incorrect redirect result can produce this error, so it is retried.
      .retryCode = TSDB_CODE_VND_INVALID_VGROUP_ID,
  };
  action.epSet = mndGetVgroupEpset(pMnode, pVgroup);

  mInfo("trans:%d, vgId:%d, build alter vnode confirm req", pTrans->id, pVgroup->vgId);

  int32_t   headLen = sizeof(SMsgHead);
  SMsgHead *pMsgHead = taosMemoryMalloc(headLen);
  if (pMsgHead == NULL) {
    TAOS_RETURN(terrno);
  }
  pMsgHead->vgId = htonl(pVgroup->vgId);
  pMsgHead->contLen = htonl(headLen);

  action.groupId = pVgroup->vgId;
  action.contLen = headLen;
  action.pCont = pMsgHead;

  int32_t code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pMsgHead);
  }
  TAOS_RETURN(code);
}
1770

1771
/*
 * Append a TDMT_SYNC_CONFIG_CHANGE redo action to pTrans, addressed to the
 * endpoint set of pNewVgroup. The payload is an SMsgHead (total length and
 * vgId in network byte order) followed by the alter-replica request built for
 * dnodeId. pOldVgroup is not used.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the request cannot be built; terrno if the message buffer cannot be
 * allocated; otherwise the append error.
 */
int32_t mndAddChangeConfigAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pOldVgroup, SVgObj *pNewVgroup,
                                 int32_t dnodeId) {
  STransAction action = {.msgType = TDMT_SYNC_CONFIG_CHANGE};
  action.epSet = mndGetVgroupEpset(pMnode, pNewVgroup);

  int32_t bodyLen = 0;
  void   *pBody = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pNewVgroup, dnodeId, &bodyLen);
  if (pBody == NULL) {
    int32_t nullCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(nullCode);
  }

  int32_t   msgLen = bodyLen + sizeof(SMsgHead);
  SMsgHead *pMsg = taosMemoryMalloc(msgLen);
  if (pMsg == NULL) {
    taosMemoryFree(pBody);
    TAOS_RETURN(terrno);
  }

  // Header first, then the request body directly behind it.
  pMsg->contLen = htonl(msgLen);
  pMsg->vgId = htonl(pNewVgroup->vgId);
  memcpy((void *)(pMsg + 1), pBody, bodyLen);
  taosMemoryFree(pBody);

  action.pCont = pMsg;
  action.contLen = msgLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pMsg);
  }
  TAOS_RETURN(code);
}
1810

1811
/*
 * Append a TDMT_VND_ALTER_HASHRANGE redo action to pTrans, addressed to the
 * endpoint set of pVgroup and built from srcVgId and pVgroup.
 * TSDB_CODE_VND_ALREADY_EXIST is registered as an acceptable reply code.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the request cannot be built; otherwise the append error.
 */
static int32_t mndAddAlterVnodeHashRangeAction(SMnode *pMnode, STrans *pTrans, int32_t srcVgId, SVgObj *pVgroup) {
  STransAction action = {
      .msgType = TDMT_VND_ALTER_HASHRANGE,
      .acceptableCode = TSDB_CODE_VND_ALREADY_EXIST,
  };
  action.epSet = mndGetVgroupEpset(pMnode, pVgroup);

  int32_t reqLen = 0;
  void   *pRangeReq = mndBuildAlterVnodeHashRangeReq(pMnode, srcVgId, pVgroup, &reqLen);
  if (pRangeReq == NULL) {
    int32_t nullCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(nullCode);
  }

  action.pCont = pRangeReq;
  action.contLen = reqLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pRangeReq);
    TAOS_RETURN(code);
  }

  mInfo("trans:%d, add alter vnode hash range action for from vgId:%d to vgId:%d", pTrans->id, srcVgId, pVgroup->vgId);
  TAOS_RETURN(code);
}
1837

1838
/*
 * Append a TDMT_VND_ALTER_CONFIG redo action for pVgroup to pTrans, addressed
 * to the vgroup's endpoint set and grouped under the vgroup id.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the request cannot be built; otherwise the append error.
 */
int32_t mndAddAlterVnodeConfigAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup) {
  STransAction action = {.msgType = TDMT_VND_ALTER_CONFIG};
  action.epSet = mndGetVgroupEpset(pMnode, pVgroup);

  int32_t reqLen = 0;
  void   *pCfgReq = mndBuildAlterVnodeConfigReq(pMnode, pDb, pVgroup, &reqLen);
  if (pCfgReq == NULL) {
    int32_t nullCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(nullCode);
  }

  action.pCont = pCfgReq;
  action.contLen = reqLen;
  action.groupId = pVgroup->vgId;

  int32_t code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pCfgReq);
  }
  TAOS_RETURN(code);
}
1863

1864
/*
 * Encode pVg and append it to the prepare log of pTrans with raw status
 * SDB_STATUS_CREATING. pMnode is not used.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if encoding fails; the append error if the prepare log rejects the
 * raw; or the error from sdbSetRawStatus. Previously a sdbSetRawStatus failure
 * was only logged and the function still returned 0, because the result was
 * never stored in `code`.
 */
int32_t mndAddNewVgPrepareAction(SMnode *pMnode, STrans *pTrans, SVgObj *pVg) {
  int32_t  code = 0;
  SSdbRaw *pRaw = mndVgroupActionEncode(pVg);
  if (pRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _err;
  }

  // NOTE(review): relies on TAOS_CHECK_GOTO storing the call result in `code`
  // before jumping, as the _err path returns `code` - confirm against the macro.
  TAOS_CHECK_GOTO(mndTransAppendPrepareLog(pTrans, pRaw), NULL, _err);

  // From here on the raw is not freed by this function (the original code
  // cleared its local pointer on this path as well).
  code = sdbSetRawStatus(pRaw, SDB_STATUS_CREATING);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status since %s at line:%d", pVg->vgId, tstrerror(code), __LINE__);
  }
  TAOS_RETURN(code);

_err:
  sdbFreeRaw(pRaw);
  TAOS_RETURN(code);
}
1888

1889
/*
 * Append a TDMT_VND_ALTER_REPLICA redo action to pTrans, addressed to the
 * dnode identified by dnodeId and grouped under the vgroup id.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode cannot be acquired or the request cannot be built;
 * otherwise the append error.
 */
int32_t mndAddAlterVnodeReplicaAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId) {
  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    int32_t nullCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(nullCode);
  }

  // Only the endpoint set is needed from the dnode; release it right after.
  STransAction action = {.msgType = TDMT_VND_ALTER_REPLICA};
  action.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t reqLen = 0;
  void   *pAlterReq = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pVgroup, dnodeId, &reqLen);
  if (pAlterReq == NULL) {
    int32_t nullCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(nullCode);
  }

  action.pCont = pAlterReq;
  action.contLen = reqLen;
  action.groupId = pVgroup->vgId;

  int32_t code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pAlterReq);
  }
  TAOS_RETURN(code);
}
1922

1923
/*
 * Append a TDMT_DND_CHECK_VNODE_LEARNER_CATCHUP redo action to pTrans,
 * addressed to the dnode identified by dnodeId. The action accepts
 * TSDB_CODE_VND_ALREADY_IS_VOTER and retries on TSDB_CODE_VND_NOT_CATCH_UP.
 * No groupId is set on this action.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode cannot be acquired or the request cannot be built;
 * otherwise the append error.
 */
int32_t mndAddCheckLearnerCatchupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId) {
  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    int32_t nullCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(nullCode);
  }

  STransAction action = {
      .msgType = TDMT_DND_CHECK_VNODE_LEARNER_CATCHUP,
      .acceptableCode = TSDB_CODE_VND_ALREADY_IS_VOTER,
      .retryCode = TSDB_CODE_VND_NOT_CATCH_UP,
  };
  action.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t reqLen = 0;
  void   *pCheckReq = mndBuildCheckLearnCatchupReq(pMnode, pDb, pVgroup, dnodeId, &reqLen);
  if (pCheckReq == NULL) {
    int32_t nullCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(nullCode);
  }

  action.pCont = pCheckReq;
  action.contLen = reqLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pCheckReq);
  }
  TAOS_RETURN(code);
}
1957

1958
/*
 * Append a TDMT_DND_ALTER_VNODE_TYPE redo action to pTrans, addressed to the
 * dnode identified by dnodeId and grouped under the vgroup id. The payload is
 * built with mndBuildAlterVnodeReplicaReq. The action accepts
 * TSDB_CODE_VND_ALREADY_IS_VOTER and retries on TSDB_CODE_VND_NOT_CATCH_UP.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode cannot be acquired or the request cannot be built;
 * otherwise the append error.
 */
int32_t mndAddAlterVnodeTypeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId) {
  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    int32_t nullCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(nullCode);
  }

  STransAction action = {
      .msgType = TDMT_DND_ALTER_VNODE_TYPE,
      .acceptableCode = TSDB_CODE_VND_ALREADY_IS_VOTER,
      .retryCode = TSDB_CODE_VND_NOT_CATCH_UP,
  };
  action.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t reqLen = 0;
  void   *pTypeReq = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pVgroup, dnodeId, &reqLen);
  if (pTypeReq == NULL) {
    int32_t nullCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(nullCode);
  }

  action.pCont = pTypeReq;
  action.contLen = reqLen;
  action.groupId = pVgroup->vgId;

  int32_t code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pTypeReq);
  }
  TAOS_RETURN(code);
}
1993

1994
int32_t mndRestoreAddAlterVnodeTypeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
10✔
1995
                                          SDnodeObj *pDnode) {
1996
  int32_t      code = 0;
10✔
1997
  STransAction action = {0};
10✔
1998
  action.epSet = mndGetDnodeEpset(pDnode);
10✔
1999

2000
  int32_t contLen = 0;
10✔
2001
  void   *pReq = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pVgroup, pDnode->id, &contLen);
10✔
2002
  if (pReq == NULL) {
10!
2003
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2004
    if (terrno != 0) code = terrno;
×
2005
    TAOS_RETURN(code);
×
2006
  }
2007

2008
  action.pCont = pReq;
10✔
2009
  action.contLen = contLen;
10✔
2010
  action.msgType = TDMT_DND_ALTER_VNODE_TYPE;
10✔
2011
  action.acceptableCode = TSDB_CODE_VND_ALREADY_IS_VOTER;
10✔
2012
  action.retryCode = TSDB_CODE_VND_NOT_CATCH_UP;
10✔
2013
  action.groupId = pVgroup->vgId;
10✔
2014

2015
  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
10!
2016
    taosMemoryFree(pReq);
×
2017
    TAOS_RETURN(code);
×
2018
  }
2019

2020
  TAOS_RETURN(code);
10✔
2021
}
2022

2023
/*
 * Append a TDMT_VND_DISABLE_WRITE redo action for pVgroup->vgId to pTrans,
 * addressed to the dnode identified by dnodeId. No groupId is set on this
 * action.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode cannot be acquired or the request cannot be built;
 * otherwise the append error.
 */
static int32_t mndAddDisableVnodeWriteAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                             int32_t dnodeId) {
  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    int32_t nullCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(nullCode);
  }

  STransAction action = {.msgType = TDMT_VND_DISABLE_WRITE};
  action.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t reqLen = 0;
  void   *pDisableReq = mndBuildDisableVnodeWriteReq(pMnode, pDb, pVgroup->vgId, &reqLen);
  if (pDisableReq == NULL) {
    int32_t nullCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(nullCode);
  }

  action.pCont = pDisableReq;
  action.contLen = reqLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pDisableReq);
  }
  TAOS_RETURN(code);
}
2056

2057
/*
 * Append a TDMT_DND_DROP_VNODE action to pTrans, addressed to the dnode
 * referenced by pVgid->dnodeId and grouped under the vgroup id.
 * TSDB_CODE_VND_NOT_EXIST is registered as an acceptable reply code.
 *
 * isRedo selects the list: true appends to the redo actions, false to the
 * undo actions.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode cannot be acquired or the request cannot be built;
 * otherwise the append error.
 */
int32_t mndAddDropVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, SVnodeGid *pVgid,
                              bool isRedo) {
  int32_t      code = 0;
  STransAction action = {0};

  SDnodeObj *pDnode = mndAcquireDnode(pMnode, pVgid->dnodeId);
  if (pDnode == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }
  action.epSet = mndGetDnodeEpset(pDnode);

  // The request builder receives pDnode, so the reference is held until the
  // builder has returned instead of being released beforehand.
  int32_t contLen = 0;
  void   *pReq = mndBuildDropVnodeReq(pMnode, pDnode, pDb, pVgroup, &contLen);
  if (pReq == NULL) {
    // Capture the failure reason before the release call below runs.
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
  }
  mndReleaseDnode(pMnode, pDnode);
  if (pReq == NULL) {
    TAOS_RETURN(code);
  }

  action.pCont = pReq;
  action.contLen = contLen;
  action.msgType = TDMT_DND_DROP_VNODE;
  action.acceptableCode = TSDB_CODE_VND_NOT_EXIST;
  action.groupId = pVgroup->vgId;

  if (isRedo) {
    code = mndTransAppendRedoAction(pTrans, &action);
  } else {
    code = mndTransAppendUndoAction(pTrans, &action);
  }
  if (code != 0) {
    // The action was not queued, so the request buffer is released here.
    taosMemoryFree(pReq);
  }

  TAOS_RETURN(code);
}
2099

2100
int32_t mndSetMoveVgroupInfoToTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t vnIndex,
29✔
2101
                                    SArray *pArray, bool force, bool unsafe) {
2102
  int32_t code = 0;
29✔
2103
  SVgObj  newVg = {0};
29✔
2104
  memcpy(&newVg, pVgroup, sizeof(SVgObj));
29✔
2105

2106
  mInfo("vgId:%d, trans:%d, vgroup info before move, replica:%d", newVg.vgId, pTrans->id, newVg.replica);
29!
2107
  for (int32_t i = 0; i < newVg.replica; ++i) {
94✔
2108
    mInfo("vgId:%d, trans:%d, vnode:%d dnode:%d", newVg.vgId, pTrans->id, i, newVg.vnodeGid[i].dnodeId);
65!
2109
  }
2110

2111
  if (!force) {
29!
2112
#if 1
2113
    {
2114
#else
2115
    if (newVg.replica == 1) {
2116
#endif
2117
      mInfo("vgId:%d, trans:%d, will add 1 vnode, replca:%d", pVgroup->vgId, pTrans->id, newVg.replica);
29!
2118
      TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVg, pArray));
29!
2119
      for (int32_t i = 0; i < newVg.replica - 1; ++i) {
94✔
2120
        TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId));
65!
2121
      }
2122
      TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg, &newVg.vnodeGid[newVg.replica - 1]));
29!
2123
      TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg));
29!
2124

2125
      mInfo("vgId:%d, trans:%d, will remove 1 vnode, replca:2", pVgroup->vgId, pTrans->id);
29!
2126
      newVg.replica--;
29✔
2127
      SVnodeGid del = newVg.vnodeGid[vnIndex];
29✔
2128
      newVg.vnodeGid[vnIndex] = newVg.vnodeGid[newVg.replica];
29✔
2129
      memset(&newVg.vnodeGid[newVg.replica], 0, sizeof(SVnodeGid));
29✔
2130
      {
2131
        SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
29✔
2132
        if (pRaw == NULL) {
29!
2133
          code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2134
          if (terrno != 0) code = terrno;
×
2135
          TAOS_RETURN(code);
×
2136
        }
2137
        if ((code = mndTransAppendGroupRedolog(pTrans, pRaw, pVgroup->vgId)) != 0) {
29!
2138
          sdbFreeRaw(pRaw);
×
2139
          TAOS_RETURN(code);
×
2140
        }
2141
        code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
29✔
2142
        if (code != 0) {
29!
2143
          mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2144
          return code;
×
2145
        }
2146
      }
2147

2148
      TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pDb, &newVg, &del, true));
29!
2149
      for (int32_t i = 0; i < newVg.replica; ++i) {
94✔
2150
        TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId));
65!
2151
      }
2152
      TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg));
29!
2153
#if 1
2154
    }
2155
#else
2156
    } else {  // new replica == 3
2157
      mInfo("vgId:%d, will add 1 vnode, replca:3", pVgroup->vgId);
2158
      if (mndAddVnodeToVgroup(pMnode, pTrans, &newVg, pArray) != 0) return -1;
2159
      mInfo("vgId:%d, will remove 1 vnode, replca:4", pVgroup->vgId);
2160
      newVg.replica--;
2161
      SVnodeGid del = newVg.vnodeGid[vnIndex];
2162
      newVg.vnodeGid[vnIndex] = newVg.vnodeGid[newVg.replica];
2163
      memset(&newVg.vnodeGid[newVg.replica], 0, sizeof(SVnodeGid));
2164
      {
2165
        SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
2166
        if (pRaw == NULL) return -1;
2167
        if (mndTransAppendRedolog(pTrans, pRaw) != 0) {
2168
          sdbFreeRaw(pRaw);
2169
          return -1;
2170
        }
2171
      }
2172

2173
      if (mndAddDropVnodeAction(pMnode, pTrans, pDb, &newVg, &del, true) != 0) return -1;
2174
      for (int32_t i = 0; i < newVg.replica; ++i) {
2175
        if (i == vnIndex) continue;
2176
        if (mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId) != 0) return -1;
2177
      }
2178
      if (mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg, &newVg.vnodeGid[vnIndex]) != 0) return -1;
2179
      if (mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg) != 0) return -1;
2180
    }
2181
#endif
2182
  } else {
2183
    mInfo("vgId:%d, will add 1 vnode and force remove 1 vnode", pVgroup->vgId);
×
2184
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVg, pArray));
×
2185
    newVg.replica--;
×
2186
    // SVnodeGid del = newVg.vnodeGid[vnIndex];
2187
    newVg.vnodeGid[vnIndex] = newVg.vnodeGid[newVg.replica];
×
2188
    memset(&newVg.vnodeGid[newVg.replica], 0, sizeof(SVnodeGid));
×
2189
    {
2190
      SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
×
2191
      if (pRaw == NULL) {
×
2192
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2193
        if (terrno != 0) code = terrno;
×
2194
        TAOS_RETURN(code);
×
2195
      }
2196
      if ((code = mndTransAppendGroupRedolog(pTrans, pRaw, pVgroup->vgId)) != 0) {
×
2197
        sdbFreeRaw(pRaw);
×
2198
        TAOS_RETURN(code);
×
2199
      }
2200
      code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
×
2201
      if (code != 0) {
×
2202
        mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2203
        return code;
×
2204
      }
2205
    }
2206

2207
    for (int32_t i = 0; i < newVg.replica; ++i) {
×
2208
      if (i != vnIndex) {
×
2209
        TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId));
×
2210
      }
2211
    }
2212
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg, &newVg.vnodeGid[vnIndex]));
×
2213
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg));
×
2214

2215
    if (newVg.replica == 1) {
×
2216
      if (force && !unsafe) {
×
2217
        TAOS_RETURN(TSDB_CODE_VND_META_DATA_UNSAFE_DELETE);
×
2218
      }
2219

2220
      SSdb *pSdb = pMnode->pSdb;
×
2221
      void *pIter = NULL;
×
2222

2223
      while (1) {
×
2224
        SStbObj *pStb = NULL;
×
2225
        pIter = sdbFetch(pSdb, SDB_STB, pIter, (void **)&pStb);
×
2226
        if (pIter == NULL) break;
×
2227

2228
        if (strcmp(pStb->db, pDb->name) == 0) {
×
2229
          if ((code = mndSetForceDropCreateStbRedoActions(pMnode, pTrans, &newVg, pStb)) != 0) {
×
2230
            sdbCancelFetch(pSdb, pIter);
×
2231
            sdbRelease(pSdb, pStb);
×
2232
            TAOS_RETURN(code);
×
2233
          }
2234
        }
2235

2236
        sdbRelease(pSdb, pStb);
×
2237
      }
2238

2239
      mInfo("vgId:%d, all data is dropped since replica=1", pVgroup->vgId);
×
2240
    }
2241
  }
2242

2243
  {
2244
    SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
29✔
2245
    if (pRaw == NULL) {
29!
2246
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2247
      if (terrno != 0) code = terrno;
×
2248
      TAOS_RETURN(code);
×
2249
    }
2250
    if ((code = mndTransAppendCommitlog(pTrans, pRaw)) != 0) {
29!
2251
      sdbFreeRaw(pRaw);
×
2252
      TAOS_RETURN(code);
×
2253
    }
2254
    code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
29✔
2255
    if (code != 0) {
29!
2256
      mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2257
      return code;
×
2258
    }
2259
  }
2260

2261
  mInfo("vgId:%d, vgroup info after move, replica:%d", newVg.vgId, newVg.replica);
29!
2262
  for (int32_t i = 0; i < newVg.replica; ++i) {
94✔
2263
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg.vgId, i, newVg.vnodeGid[i].dnodeId);
65!
2264
  }
2265
  TAOS_RETURN(code);
29✔
2266
}
2267

2268
/*
 * For every vgroup that has a replica on dnode delDnodeId, add to pTrans the
 * steps that move that replica elsewhere (see mndSetMoveVgroupInfoToTrans).
 * Candidate dnodes come from mndBuildDnodesArray(pMnode, delDnodeId, NULL).
 *
 * Iteration stops at the first failure. A vgroup whose database cannot be
 * acquired is now treated as a failure instead of passing a NULL SDbObj on.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL when terrno
 * is 0) if the dnode array or a database cannot be obtained; otherwise the
 * error from mndSetMoveVgroupInfoToTrans.
 */
int32_t mndSetMoveVgroupsInfoToTrans(SMnode *pMnode, STrans *pTrans, int32_t delDnodeId, bool force, bool unsafe) {
  int32_t code = 0;
  SArray *pArray = mndBuildDnodesArray(pMnode, delDnodeId, NULL);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  void *pIter = NULL;
  while (1) {
    SVgObj *pVgroup = NULL;
    pIter = sdbFetch(pMnode->pSdb, SDB_VGROUP, pIter, (void **)&pVgroup);
    if (pIter == NULL) break;

    // Locate this vgroup's replica on the dnode being vacated, if any.
    int32_t vnIndex = -1;
    for (int32_t i = 0; i < pVgroup->replica; ++i) {
      if (pVgroup->vnodeGid[i].dnodeId == delDnodeId) {
        vnIndex = i;
        break;
      }
    }

    code = 0;
    if (vnIndex != -1) {
      mInfo("vgId:%d, trans:%d, vnode:%d will be removed from dnode:%d, force:%d", pVgroup->vgId, pTrans->id, vnIndex,
            delDnodeId, force);
      SDbObj *pDb = mndAcquireDb(pMnode, pVgroup->dbName);
      if (pDb == NULL) {
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
        if (terrno != 0) code = terrno;
        mError("vgId:%d, trans:%d, failed to acquire db:%s since %s", pVgroup->vgId, pTrans->id, pVgroup->dbName,
               tstrerror(code));
      } else {
        code = mndSetMoveVgroupInfoToTrans(pMnode, pTrans, pDb, pVgroup, vnIndex, pArray, force, unsafe);
        mndReleaseDb(pMnode, pDb);
      }
    }

    sdbRelease(pMnode->pSdb, pVgroup);

    if (code != 0) {
      // Leaving the loop early: the iterator has to be cancelled explicitly.
      sdbCancelFetch(pMnode->pSdb, pIter);
      break;
    }
  }

  taosArrayDestroy(pArray);
  TAOS_RETURN(code);
}
2311

2312
/*
 * Add one replica on dnode `newDnodeId` to `pVgroup` (modified in place) and
 * append the corresponding redo log and redo actions to `pTrans`.
 *
 * Sequence queued on the transaction:
 *   1. redo log carrying the vgroup with the new member as an offline learner
 *   2. alter-replica action for every pre-existing member, then create-vnode
 *      for the new member
 *   3. new member switched to voter: alter-type action for it, then another
 *      alter-replica action for every pre-existing member
 *   4. alter-confirm action
 *
 * Returns 0 on success or the first error code; on error pVgroup may already
 * have been modified.
 */
static int32_t mndAddIncVgroupReplicaToTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                             int32_t newDnodeId) {
  int32_t code = 0;
  mInfo("vgId:%d, will add 1 vnode, replica:%d dnode:%d", pVgroup->vgId, pVgroup->replica, newDnodeId);

  // claim the slot right after the current members and bump the replica count
  SVnodeGid *pAdded = &pVgroup->vnodeGid[pVgroup->replica++];
  pAdded->nodeRole = TAOS_SYNC_ROLE_LEARNER;
  pAdded->syncState = TAOS_SYNC_STATE_OFFLINE;
  pAdded->dnodeId = newDnodeId;

  SSdbRaw *pRaw = mndVgroupActionEncode(pVgroup);
  if (pRaw == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  code = mndTransAppendRedolog(pTrans, pRaw);
  if (code != 0) {
    // the raw was not appended, so it is still ours to free
    sdbFreeRaw(pRaw);
    TAOS_RETURN(code);
  }

  code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status since %s at line:%d", pVgroup->vgId, tstrerror(code), __LINE__);
    TAOS_RETURN(code);
  }

  // learner phase: the last slot is the new member, so stop one short of replica
  int32_t idx = 0;
  while (idx < pVgroup->replica - 1) {
    TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, pVgroup, pVgroup->vnodeGid[idx].dnodeId));
    ++idx;
  }
  TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pDb, pVgroup, pAdded));

  // voter phase
  pAdded->nodeRole = TAOS_SYNC_ROLE_VOTER;
  TAOS_CHECK_RETURN(mndAddAlterVnodeTypeAction(pMnode, pTrans, pDb, pVgroup, pAdded->dnodeId));
  idx = 0;
  while (idx < pVgroup->replica - 1) {
    TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, pVgroup, pVgroup->vnodeGid[idx].dnodeId));
    ++idx;
  }

  // confirm phase
  TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, pVgroup));

  TAOS_RETURN(code);
}
2358

2359
/*
 * Remove the replica hosted on dnode `delDnodeId` from `pVgroup` (modified in
 * place) and append the corresponding redo log and redo actions to `pTrans`.
 *
 * The removed slot is filled with the last member so that vnodeGid[0..replica)
 * stays dense, and the vacated last slot is zeroed. Queued on the transaction:
 * a redo log with the shrunken vgroup, a drop-vnode action for the removed
 * member, an alter-replica action for every remaining member, and an
 * alter-confirm action.
 *
 * Returns 0 if delDnodeId is not a member (nothing is changed or queued),
 * 0 on success, or the first error code.
 */
static int32_t mndAddDecVgroupReplicaFromTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                               int32_t delDnodeId) {
  int32_t code = 0;
  mInfo("vgId:%d, will remove 1 vnode, replica:%d dnode:%d", pVgroup->vgId, pVgroup->replica, delDnodeId);

  SVnodeGid *pGid = NULL;
  SVnodeGid  delGid = {0};
  for (int32_t i = 0; i < pVgroup->replica; ++i) {
    if (pVgroup->vnodeGid[i].dnodeId == delDnodeId) {
      pGid = &pVgroup->vnodeGid[i];
      break;
    }
  }

  if (pGid == NULL) return 0;

  pVgroup->replica--;
  memcpy(&delGid, pGid, sizeof(SVnodeGid));
  // pGid is the last slot itself when the removed member was last; memcpy on
  // identical source/destination is undefined, memmove is not.
  memmove(pGid, &pVgroup->vnodeGid[pVgroup->replica], sizeof(SVnodeGid));
  memset(&pVgroup->vnodeGid[pVgroup->replica], 0, sizeof(SVnodeGid));

  SSdbRaw *pVgRaw = mndVgroupActionEncode(pVgroup);
  if (pVgRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }
  if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
    // the raw was not appended, so it is still ours to free
    sdbFreeRaw(pVgRaw);
    TAOS_RETURN(code);
  }
  code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status since %s at line:%d", pVgroup->vgId, tstrerror(code), __LINE__);
    TAOS_RETURN(code);
  }

  // delGid is a private copy: the slot it came from has already been overwritten
  TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pDb, pVgroup, &delGid, true));
  for (int32_t i = 0; i < pVgroup->replica; ++i) {
    TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, pVgroup, pVgroup->vnodeGid[i].dnodeId));
  }
  TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, pVgroup));

  TAOS_RETURN(code);
}
2404

2405
static int32_t mndRedistributeVgroup(SMnode *pMnode, SRpcMsg *pReq, SDbObj *pDb, SVgObj *pVgroup, SDnodeObj *pNew1,
68✔
2406
                                     SDnodeObj *pOld1, SDnodeObj *pNew2, SDnodeObj *pOld2, SDnodeObj *pNew3,
2407
                                     SDnodeObj *pOld3) {
2408
  int32_t code = -1;
68✔
2409
  STrans *pTrans = NULL;
68✔
2410

2411
  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_GLOBAL, pReq, "red-vgroup");
68✔
2412
  if (pTrans == NULL) {
68!
2413
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2414
    if (terrno != 0) code = terrno;
×
2415
    goto _OVER;
×
2416
  }
2417

2418
  mndTransSetDbName(pTrans, pVgroup->dbName, NULL);
68✔
2419
  TAOS_CHECK_GOTO(mndTransCheckConflictWithCompact(pMnode, pTrans), NULL, _OVER);
68✔
2420

2421
  mndTransSetSerial(pTrans);
67✔
2422
  mInfo("trans:%d, used to redistribute vgroup, vgId:%d", pTrans->id, pVgroup->vgId);
67!
2423

2424
  SVgObj newVg = {0};
67✔
2425
  memcpy(&newVg, pVgroup, sizeof(SVgObj));
67✔
2426
  mInfo("vgId:%d, vgroup info before redistribute, replica:%d", newVg.vgId, newVg.replica);
67!
2427
  for (int32_t i = 0; i < newVg.replica; ++i) {
212✔
2428
    mInfo("vgId:%d, vnode:%d dnode:%d role:%s", newVg.vgId, i, newVg.vnodeGid[i].dnodeId,
145!
2429
          syncStr(newVg.vnodeGid[i].syncState));
2430
  }
2431

2432
  if (pNew1 != NULL && pOld1 != NULL) {
67!
2433
    int32_t numOfVnodes = mndGetVnodesNum(pMnode, pNew1->id);
67✔
2434
    if (numOfVnodes >= pNew1->numOfSupportVnodes) {
67✔
2435
      mError("vgId:%d, no enough vnodes in dnode:%d, numOfVnodes:%d support:%d", newVg.vgId, pNew1->id, numOfVnodes,
1!
2436
             pNew1->numOfSupportVnodes);
2437
      code = TSDB_CODE_MND_NO_ENOUGH_VNODES;
1✔
2438
      goto _OVER;
1✔
2439
    }
2440

2441
    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
66✔
2442
    if (pNew1->memAvail - vgMem - pNew1->memUsed <= 0) {
66!
2443
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
×
2444
             pVgroup->dbName, pVgroup->vgId, vgMem, pNew1->id, pNew1->memAvail, pNew1->memUsed);
2445
      code = TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE;
×
2446
      goto _OVER;
×
2447
    } else {
2448
      pNew1->memUsed += vgMem;
66✔
2449
    }
2450

2451
    TAOS_CHECK_GOTO(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &newVg, pNew1->id), NULL, _OVER);
66!
2452
    TAOS_CHECK_GOTO(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &newVg, pOld1->id), NULL, _OVER);
66!
2453
  }
2454

2455
  if (pNew2 != NULL && pOld2 != NULL) {
66!
2456
    int32_t numOfVnodes = mndGetVnodesNum(pMnode, pNew2->id);
16✔
2457
    if (numOfVnodes >= pNew2->numOfSupportVnodes) {
16!
2458
      mError("vgId:%d, no enough vnodes in dnode:%d, numOfVnodes:%d support:%d", newVg.vgId, pNew2->id, numOfVnodes,
×
2459
             pNew2->numOfSupportVnodes);
2460
      code = TSDB_CODE_MND_NO_ENOUGH_VNODES;
×
2461
      goto _OVER;
×
2462
    }
2463
    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
16✔
2464
    if (pNew2->memAvail - vgMem - pNew2->memUsed <= 0) {
16!
2465
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
×
2466
             pVgroup->dbName, pVgroup->vgId, vgMem, pNew2->id, pNew2->memAvail, pNew2->memUsed);
2467
      code = TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE;
×
2468
      goto _OVER;
×
2469
    } else {
2470
      pNew2->memUsed += vgMem;
16✔
2471
    }
2472
    TAOS_CHECK_GOTO(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &newVg, pNew2->id), NULL, _OVER);
16!
2473
    TAOS_CHECK_GOTO(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &newVg, pOld2->id), NULL, _OVER);
16!
2474
  }
2475

2476
  if (pNew3 != NULL && pOld3 != NULL) {
66!
2477
    int32_t numOfVnodes = mndGetVnodesNum(pMnode, pNew3->id);
8✔
2478
    if (numOfVnodes >= pNew3->numOfSupportVnodes) {
8!
2479
      mError("vgId:%d, no enough vnodes in dnode:%d, numOfVnodes:%d support:%d", newVg.vgId, pNew3->id, numOfVnodes,
×
2480
             pNew3->numOfSupportVnodes);
2481
      code = TSDB_CODE_MND_NO_ENOUGH_VNODES;
×
2482
      goto _OVER;
×
2483
    }
2484
    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
8✔
2485
    if (pNew3->memAvail - vgMem - pNew3->memUsed <= 0) {
8!
2486
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
×
2487
             pVgroup->dbName, pVgroup->vgId, vgMem, pNew3->id, pNew3->memAvail, pNew3->memUsed);
2488
      code = TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE;
×
2489
      goto _OVER;
×
2490
    } else {
2491
      pNew3->memUsed += vgMem;
8✔
2492
    }
2493
    TAOS_CHECK_GOTO(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &newVg, pNew3->id), NULL, _OVER);
8!
2494
    TAOS_CHECK_GOTO(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &newVg, pOld3->id), NULL, _OVER);
8!
2495
  }
2496

2497
  {
2498
    SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
66✔
2499
    if (pRaw == NULL) {
66!
2500
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2501
      if (terrno != 0) code = terrno;
×
2502
      goto _OVER;
×
2503
    }
2504
    if ((code = mndTransAppendCommitlog(pTrans, pRaw)) != 0) {
66!
2505
      sdbFreeRaw(pRaw);
×
2506
      goto _OVER;
×
2507
    }
2508
    code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
66✔
2509
    if (code != 0) {
66!
2510
      mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2511
      goto _OVER;
×
2512
    }
2513
  }
2514

2515
  mInfo("vgId:%d, vgroup info after redistribute, replica:%d", newVg.vgId, newVg.replica);
66!
2516
  for (int32_t i = 0; i < newVg.replica; ++i) {
208✔
2517
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg.vgId, i, newVg.vnodeGid[i].dnodeId);
142!
2518
  }
2519

2520
  TAOS_CHECK_GOTO(mndTransPrepare(pMnode, pTrans), NULL, _OVER);
66✔
2521
  code = 0;
56✔
2522

2523
_OVER:
68✔
2524
  mndTransDrop(pTrans);
68✔
2525
  mndReleaseDb(pMnode, pDb);
68✔
2526
  TAOS_RETURN(code);
68✔
2527
}
2528

2529
static int32_t mndProcessRedistributeVgroupMsg(SRpcMsg *pReq) {
84✔
2530
  SMnode    *pMnode = pReq->info.node;
84✔
2531
  SDnodeObj *pNew1 = NULL;
84✔
2532
  SDnodeObj *pNew2 = NULL;
84✔
2533
  SDnodeObj *pNew3 = NULL;
84✔
2534
  SDnodeObj *pOld1 = NULL;
84✔
2535
  SDnodeObj *pOld2 = NULL;
84✔
2536
  SDnodeObj *pOld3 = NULL;
84✔
2537
  SVgObj    *pVgroup = NULL;
84✔
2538
  SDbObj    *pDb = NULL;
84✔
2539
  int32_t    code = -1;
84✔
2540
  int64_t    curMs = taosGetTimestampMs();
84✔
2541
  int32_t    newDnodeId[3] = {0};
84✔
2542
  int32_t    oldDnodeId[3] = {0};
84✔
2543
  int32_t    newIndex = -1;
84✔
2544
  int32_t    oldIndex = -1;
84✔
2545

2546
  SRedistributeVgroupReq req = {0};
84✔
2547
  if (tDeserializeSRedistributeVgroupReq(pReq->pCont, pReq->contLen, &req) != 0) {
84!
2548
    code = TSDB_CODE_INVALID_MSG;
×
2549
    goto _OVER;
×
2550
  }
2551

2552
  mInfo("vgId:%d, start to redistribute vgroup to dnode %d:%d:%d", req.vgId, req.dnodeId1, req.dnodeId2, req.dnodeId3);
84!
2553
  if ((code = mndCheckOperPrivilege(pMnode, pReq->info.conn.user, MND_OPER_REDISTRIBUTE_VGROUP)) != 0) {
84✔
2554
    goto _OVER;
1✔
2555
  }
2556

2557
  pVgroup = mndAcquireVgroup(pMnode, req.vgId);
83✔
2558
  if (pVgroup == NULL) {
83✔
2559
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
3✔
2560
    if (terrno != 0) code = terrno;
3!
2561
    goto _OVER;
3✔
2562
  }
2563
  if (pVgroup->mountVgId) {
80!
2564
    code = TSDB_CODE_MND_MOUNT_OBJ_NOT_SUPPORT;
×
2565
    goto _OVER;
×
2566
  }
2567
  pDb = mndAcquireDb(pMnode, pVgroup->dbName);
80✔
2568
  if (pDb == NULL) {
80!
2569
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2570
    if (terrno != 0) code = terrno;
×
2571
    goto _OVER;
×
2572
  }
2573

2574
  if (pVgroup->replica == 1) {
80✔
2575
    if (req.dnodeId1 <= 0 || req.dnodeId2 > 0 || req.dnodeId3 > 0) {
31!
2576
      code = TSDB_CODE_MND_INVALID_REPLICA;
×
2577
      goto _OVER;
×
2578
    }
2579

2580
    if (req.dnodeId1 == pVgroup->vnodeGid[0].dnodeId) {
31!
2581
      // terrno = TSDB_CODE_MND_VGROUP_UN_CHANGED;
2582
      code = 0;
×
2583
      goto _OVER;
×
2584
    }
2585

2586
    pNew1 = mndAcquireDnode(pMnode, req.dnodeId1);
31✔
2587
    if (pNew1 == NULL) {
31!
2588
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2589
      if (terrno != 0) code = terrno;
×
2590
      goto _OVER;
×
2591
    }
2592
    if (!mndIsDnodeOnline(pNew1, curMs)) {
31!
2593
      code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2594
      goto _OVER;
×
2595
    }
2596

2597
    pOld1 = mndAcquireDnode(pMnode, pVgroup->vnodeGid[0].dnodeId);
31✔
2598
    if (pOld1 == NULL) {
31!
2599
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2600
      if (terrno != 0) code = terrno;
×
2601
      goto _OVER;
×
2602
    }
2603
    if (!mndIsDnodeOnline(pOld1, curMs)) {
31✔
2604
      code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
2✔
2605
      goto _OVER;
2✔
2606
    }
2607

2608
    code = mndRedistributeVgroup(pMnode, pReq, pDb, pVgroup, pNew1, pOld1, NULL, NULL, NULL, NULL);
29✔
2609

2610
  } else if (pVgroup->replica == 3) {
49!
2611
    if (req.dnodeId1 <= 0 || req.dnodeId2 <= 0 || req.dnodeId3 <= 0) {
49!
2612
      code = TSDB_CODE_MND_INVALID_REPLICA;
4✔
2613
      goto _OVER;
4✔
2614
    }
2615

2616
    if (req.dnodeId1 == req.dnodeId2 || req.dnodeId1 == req.dnodeId3 || req.dnodeId2 == req.dnodeId3) {
45!
2617
      code = TSDB_CODE_MND_INVALID_REPLICA;
1✔
2618
      goto _OVER;
1✔
2619
    }
2620

2621
    if (req.dnodeId1 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId1 != pVgroup->vnodeGid[1].dnodeId &&
44✔
2622
        req.dnodeId1 != pVgroup->vnodeGid[2].dnodeId) {
22✔
2623
      newDnodeId[++newIndex] = req.dnodeId1;
19✔
2624
      mInfo("vgId:%d, dnode:%d will be added, index:%d", pVgroup->vgId, newDnodeId[newIndex], newIndex);
19!
2625
    }
2626

2627
    if (req.dnodeId2 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[1].dnodeId &&
44✔
2628
        req.dnodeId2 != pVgroup->vnodeGid[2].dnodeId) {
30✔
2629
      newDnodeId[++newIndex] = req.dnodeId2;
22✔
2630
      mInfo("vgId:%d, dnode:%d will be added, index:%d", pVgroup->vgId, newDnodeId[newIndex], newIndex);
22!
2631
    }
2632

2633
    if (req.dnodeId3 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId3 != pVgroup->vnodeGid[1].dnodeId &&
44✔
2634
        req.dnodeId3 != pVgroup->vnodeGid[2].dnodeId) {
35✔
2635
      newDnodeId[++newIndex] = req.dnodeId3;
29✔
2636
      mInfo("vgId:%d, dnode:%d will be added, index:%d", pVgroup->vgId, newDnodeId[newIndex], newIndex);
29!
2637
    }
2638

2639
    if (req.dnodeId1 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[0].dnodeId &&
44✔
2640
        req.dnodeId3 != pVgroup->vnodeGid[0].dnodeId) {
30✔
2641
      oldDnodeId[++oldIndex] = pVgroup->vnodeGid[0].dnodeId;
23✔
2642
      mInfo("vgId:%d, dnode:%d will be removed, index:%d", pVgroup->vgId, oldDnodeId[oldIndex], oldIndex);
23!
2643
    }
2644

2645
    if (req.dnodeId1 != pVgroup->vnodeGid[1].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[1].dnodeId &&
44✔
2646
        req.dnodeId3 != pVgroup->vnodeGid[1].dnodeId) {
22✔
2647
      oldDnodeId[++oldIndex] = pVgroup->vnodeGid[1].dnodeId;
20✔
2648
      mInfo("vgId:%d, dnode:%d will be removed, index:%d", pVgroup->vgId, oldDnodeId[oldIndex], oldIndex);
20!
2649
    }
2650

2651
    if (req.dnodeId1 != pVgroup->vnodeGid[2].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[2].dnodeId &&
44✔
2652
        req.dnodeId3 != pVgroup->vnodeGid[2].dnodeId) {
33✔
2653
      oldDnodeId[++oldIndex] = pVgroup->vnodeGid[2].dnodeId;
27✔
2654
      mInfo("vgId:%d, dnode:%d will be removed, index:%d", pVgroup->vgId, oldDnodeId[oldIndex], oldIndex);
27!
2655
    }
2656

2657
    if (newDnodeId[0] != 0) {
44✔
2658
      pNew1 = mndAcquireDnode(pMnode, newDnodeId[0]);
42✔
2659
      if (pNew1 == NULL) {
42!
2660
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2661
        if (terrno != 0) code = terrno;
×
2662
        goto _OVER;
×
2663
      }
2664
      if (!mndIsDnodeOnline(pNew1, curMs)) {
42✔
2665
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
1✔
2666
        goto _OVER;
1✔
2667
      }
2668
    }
2669

2670
    if (newDnodeId[1] != 0) {
43✔
2671
      pNew2 = mndAcquireDnode(pMnode, newDnodeId[1]);
18✔
2672
      if (pNew2 == NULL) {
18!
2673
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2674
        if (terrno != 0) code = terrno;
×
2675
        goto _OVER;
×
2676
      }
2677
      if (!mndIsDnodeOnline(pNew2, curMs)) {
18!
2678
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2679
        goto _OVER;
×
2680
      }
2681
    }
2682

2683
    if (newDnodeId[2] != 0) {
43✔
2684
      pNew3 = mndAcquireDnode(pMnode, newDnodeId[2]);
10✔
2685
      if (pNew3 == NULL) {
10!
2686
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2687
        if (terrno != 0) code = terrno;
×
2688
        goto _OVER;
×
2689
      }
2690
      if (!mndIsDnodeOnline(pNew3, curMs)) {
10!
2691
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2692
        goto _OVER;
×
2693
      }
2694
    }
2695

2696
    if (oldDnodeId[0] != 0) {
43✔
2697
      pOld1 = mndAcquireDnode(pMnode, oldDnodeId[0]);
41✔
2698
      if (pOld1 == NULL) {
41!
2699
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2700
        if (terrno != 0) code = terrno;
×
2701
        goto _OVER;
×
2702
      }
2703
      if (!mndIsDnodeOnline(pOld1, curMs)) {
41✔
2704
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
2✔
2705
        goto _OVER;
2✔
2706
      }
2707
    }
2708

2709
    if (oldDnodeId[1] != 0) {
41✔
2710
      pOld2 = mndAcquireDnode(pMnode, oldDnodeId[1]);
16✔
2711
      if (pOld2 == NULL) {
16!
2712
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2713
        if (terrno != 0) code = terrno;
×
2714
        goto _OVER;
×
2715
      }
2716
      if (!mndIsDnodeOnline(pOld2, curMs)) {
16!
2717
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2718
        goto _OVER;
×
2719
      }
2720
    }
2721

2722
    if (oldDnodeId[2] != 0) {
41✔
2723
      pOld3 = mndAcquireDnode(pMnode, oldDnodeId[2]);
8✔
2724
      if (pOld3 == NULL) {
8!
2725
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2726
        if (terrno != 0) code = terrno;
×
2727
        goto _OVER;
×
2728
      }
2729
      if (!mndIsDnodeOnline(pOld3, curMs)) {
8!
2730
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2731
        goto _OVER;
×
2732
      }
2733
    }
2734

2735
    if (pNew1 == NULL && pOld1 == NULL && pNew2 == NULL && pOld2 == NULL && pNew3 == NULL && pOld3 == NULL) {
41!
2736
      // terrno = TSDB_CODE_MND_VGROUP_UN_CHANGED;
2737
      code = 0;
2✔
2738
      goto _OVER;
2✔
2739
    }
2740

2741
    code = mndRedistributeVgroup(pMnode, pReq, pDb, pVgroup, pNew1, pOld1, pNew2, pOld2, pNew3, pOld3);
39✔
2742

2743
  } else {
2744
    code = TSDB_CODE_MND_REQ_REJECTED;
×
2745
    goto _OVER;
×
2746
  }
2747

2748
  if (code == 0) code = TSDB_CODE_ACTION_IN_PROGRESS;
68✔
2749

2750
  char obj[33] = {0};
68✔
2751
  (void)tsnprintf(obj, sizeof(obj), "%d", req.vgId);
68✔
2752

2753
  auditRecord(pReq, pMnode->clusterId, "RedistributeVgroup", "", obj, req.sql, req.sqlLen);
68✔
2754

2755
_OVER:
84✔
2756
  if (code != 0 && code != TSDB_CODE_ACTION_IN_PROGRESS) {
84✔
2757
    mError("vgId:%d, failed to redistribute to dnode %d:%d:%d since %s", req.vgId, req.dnodeId1, req.dnodeId2,
26!
2758
           req.dnodeId3, tstrerror(code));
2759
  }
2760

2761
  mndReleaseDnode(pMnode, pNew1);
84✔
2762
  mndReleaseDnode(pMnode, pNew2);
84✔
2763
  mndReleaseDnode(pMnode, pNew3);
84✔
2764
  mndReleaseDnode(pMnode, pOld1);
84✔
2765
  mndReleaseDnode(pMnode, pOld2);
84✔
2766
  mndReleaseDnode(pMnode, pOld3);
84✔
2767
  mndReleaseVgroup(pMnode, pVgroup);
84✔
2768
  mndReleaseDb(pMnode, pDb);
84✔
2769
  tFreeSRedistributeVgroupReq(&req);
84✔
2770

2771
  TAOS_RETURN(code);
84✔
2772
}
2773

2774
/*
 * Build a force-become-follower message for `pVgroup`: an SMsgHead followed by
 * the serialized SForceBecomeFollowerReq.
 *
 * `pMnode` and `dnodeId` are not used by this function.
 *
 * On success returns a buffer allocated with taosMemoryMalloc() and stores its
 * total length (header included) in *pContLen; the caller owns the buffer.
 * On failure returns NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY and
 * leaves *pContLen untouched.
 */
static void *mndBuildSForceBecomeFollowerReq(SMnode *pMnode, SVgObj *pVgroup, int32_t dnodeId, int32_t *pContLen) {
  SForceBecomeFollowerReq balanceReq = {
      .vgId = pVgroup->vgId,
  };

  // first pass with a NULL buffer only measures the serialized body
  int32_t bodyLen = tSerializeSForceBecomeFollowerReq(NULL, 0, &balanceReq);
  if (bodyLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  int32_t contLen = bodyLen + (int32_t)sizeof(SMsgHead);

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  SMsgHead *pHead = pReq;
  pHead->contLen = htonl(contLen);
  pHead->vgId = htonl(pVgroup->vgId);

  // the body starts after the header, so only bodyLen bytes are available to
  // the serializer - not the full contLen
  if (tSerializeSForceBecomeFollowerReq((char *)pReq + sizeof(SMsgHead), bodyLen, &balanceReq) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    taosMemoryFree(pReq);
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
2804

2805
/*
 * Append a TDMT_SYNC_FORCE_FOLLOWER redo action for `pVgroup`, addressed to
 * the endpoint set of dnode `dnodeId`, to transaction `pTrans`.
 *
 * Returns 0 on success. Fails with terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL
 * when terrno is 0) if the dnode cannot be acquired or the message cannot be
 * built, or with the error from mndTransAppendRedoAction().
 */
int32_t mndAddBalanceVgroupLeaderAction(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, int32_t dnodeId) {
  int32_t code = 0;

  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  // only the endpoint set is needed, so the dnode can be released right away
  STransAction action = {0};
  action.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t msgLen = 0;
  void   *pMsg = mndBuildSForceBecomeFollowerReq(pMnode, pVgroup, dnodeId, &msgLen);
  if (pMsg == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  action.msgType = TDMT_SYNC_FORCE_FOLLOWER;
  action.pCont = pMsg;
  action.contLen = msgLen;

  code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    // the action was not appended, so the message buffer is still ours to free
    taosMemoryFree(pMsg);
  }

  TAOS_RETURN(code);
}
2837

2838
/*
 * Queue a leader-balance action for `pVgroup` on `pTrans`.
 *
 * The dnode of the first member whose syncState is TAOS_SYNC_STATE_LEADER is
 * looked up (dnode id 0 is used when no member is leader). If that dnode
 * exists and is online, a balance action targeting it is appended and the
 * vgroup's db is checked to still exist; otherwise the vgroup is skipped with
 * an info log.
 *
 * Returns -1 when the vgroup has at most one replica, 0 when the action was
 * queued or the vgroup was skipped, otherwise an error code.
 */
int32_t mndAddVgroupBalanceToTrans(SMnode *pMnode, SVgObj *pVgroup, STrans *pTrans) {
  int32_t code = 0;
  int32_t vgid = pVgroup->vgId;
  int8_t  replica = pVgroup->replica;

  if (pVgroup->replica <= 1) {
    mInfo("trans:%d, vgid:%d no need to balance, replica:%d", pTrans->id, vgid, replica);
    return -1;
  }

  // find the dnode of the current leader, if any
  int32_t dnodeId = 0;
  int     slot = 0;
  while (slot < replica) {
    if (pVgroup->vnodeGid[slot].syncState == TAOS_SYNC_STATE_LEADER) {
      dnodeId = pVgroup->vnodeGid[slot].dnodeId;
      break;
    }
    slot++;
  }

  int64_t    curMs = taosGetTimestampMs();
  SDnodeObj *pLeader = mndAcquireDnode(pMnode, dnodeId);
  bool       exist = (pLeader != NULL);
  bool       online = false;
  if (exist) {
    online = mndIsDnodeOnline(pLeader, curMs);
    mndReleaseDnode(pMnode, pLeader);
  }

  if (!exist || !online) {
    mInfo("trans:%d, vgid:%d cant be balanced to dnode:%d, exist:%d, online:%d", pTrans->id, vgid, dnodeId, exist,
          online);
    TAOS_RETURN(code);
  }

  mInfo("trans:%d, vgid:%d leader to dnode:%d", pTrans->id, vgid, dnodeId);

  code = mndAddBalanceVgroupLeaderAction(pMnode, pTrans, pVgroup, dnodeId);
  if (code != 0) {
    mError("trans:%d, vgid:%d failed to be balanced to dnode:%d", pTrans->id, vgid, dnodeId);
    TAOS_RETURN(code);
  }

  // the db is acquired only to confirm it still exists
  SDbObj *pDb = mndAcquireDb(pMnode, pVgroup->dbName);
  if (pDb == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    mError("trans:%d, vgid:%d failed to be balanced to dnode:%d, because db not exist", pTrans->id, vgid, dnodeId);
    TAOS_RETURN(code);
  }
  mndReleaseDb(pMnode, pDb);

  TAOS_RETURN(code);
}
2893

2894
// Actual handler; the stub below is compiled only when TD_ENTERPRISE is not
// defined (presumably another translation unit provides it otherwise).
extern int32_t mndProcessVgroupBalanceLeaderMsgImp(SRpcMsg *pReq);

// Entry point for the balance-vgroup-leader request: forwards to the Imp handler.
int32_t mndProcessVgroupBalanceLeaderMsg(SRpcMsg *pReq) {
  return mndProcessVgroupBalanceLeaderMsgImp(pReq);
}

#ifndef TD_ENTERPRISE
// Stub: accepts the request and reports success without doing anything.
int32_t mndProcessVgroupBalanceLeaderMsgImp(SRpcMsg *pReq) {
  (void)pReq;
  return 0;
}
#endif
2901

2902
/*
 * Re-accounts the memory of a vgroup on every dnode listed in pArray.
 *
 * For each dnode, the memory of the old vgroup (if the dnode appears in
 * pOldVgroup) is subtracted from pDnode->memUsed and the memory of the new
 * vgroup (if the dnode appears in pNewVgroup) is added. The entries of pArray
 * are updated in place.
 *
 * Returns TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE as soon as a dnode ends up with
 * memAvail - memUsed <= 0, otherwise 0.
 */
static int32_t mndCheckDnodeMemory(SMnode *pMnode, SDbObj *pOldDb, SDbObj *pNewDb, SVgObj *pOldVgroup,
                                   SVgObj *pNewVgroup, SArray *pArray) {
  for (int32_t dnodeIdx = 0; dnodeIdx < (int32_t)taosArrayGetSize(pArray); ++dnodeIdx) {
    SDnodeObj *pDnode = taosArrayGet(pArray, dnodeIdx);
    int64_t    memBefore = 0;
    int64_t    memAfter = 0;
    bool       hostsVnode = false;

    mDebug("db:%s, vgId:%d, check dnode:%d, avail:%" PRId64 " used:%" PRId64, pNewVgroup->dbName, pNewVgroup->vgId,
           pDnode->id, pDnode->memAvail, pDnode->memUsed);

    // Memory currently charged to this dnode by the old vgroup layout.
    for (int32_t v = 0; v < pOldVgroup->replica; ++v) {
      if (pOldVgroup->vnodeGid[v].dnodeId != pDnode->id) continue;
      memBefore = mndGetVgroupMemory(pMnode, pOldDb, pOldVgroup);
      hostsVnode = true;
    }

    // Memory this dnode will be charged by the new vgroup layout.
    for (int32_t v = 0; v < pNewVgroup->replica; ++v) {
      if (pNewVgroup->vnodeGid[v].dnodeId != pDnode->id) continue;
      memAfter = mndGetVgroupMemory(pMnode, pNewDb, pNewVgroup);
      hostsVnode = true;
    }

    mDebug("db:%s, vgId:%d, memory in dnode:%d, oldUsed:%" PRId64 ", newUsed:%" PRId64, pNewVgroup->dbName,
           pNewVgroup->vgId, pDnode->id, memBefore, memAfter);

    pDnode->memUsed = pDnode->memUsed - memBefore + memAfter;

    if (pDnode->memAvail - pDnode->memUsed <= 0) {
      mError("db:%s, vgId:%d, no enough memory in dnode:%d, avail:%" PRId64 " used:%" PRId64, pNewVgroup->dbName,
             pNewVgroup->vgId, pDnode->id, pDnode->memAvail, pDnode->memUsed);
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE);
    }

    if (hostsVnode) {
      mInfo("db:%s, vgId:%d, memory in dnode:%d, avail:%" PRId64 " used:%" PRId64, pNewVgroup->dbName, pNewVgroup->vgId,
            pDnode->id, pDnode->memAvail, pDnode->memUsed);
    }
  }

  return 0;
}
2942

2943
int32_t mndBuildAlterVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pOldDb, SDbObj *pNewDb, SVgObj *pVgroup,
522✔
2944
                                  SArray *pArray, SVgObj *pNewVgroup) {
2945
  int32_t code = 0;
522✔
2946
  memcpy(pNewVgroup, pVgroup, sizeof(SVgObj));
522✔
2947

2948
  if (pVgroup->replica <= 0 || pVgroup->replica == pNewDb->cfg.replications) {
522!
2949
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfigAction(pMnode, pTrans, pNewDb, pVgroup));
418!
2950
    TAOS_CHECK_RETURN(mndCheckDnodeMemory(pMnode, pOldDb, pNewDb, pNewVgroup, pVgroup, pArray));
418!
2951
    return 0;
418✔
2952
  }
2953

2954
  // mndTransSetGroupParallel(pTrans);
2955

2956
  if (pNewDb->cfg.replications == 3) {
104✔
2957
    mInfo("trans:%d, db:%s, vgId:%d, will add 2 vnodes, vn:0 dnode:%d", pTrans->id, pVgroup->dbName, pVgroup->vgId,
100!
2958
          pVgroup->vnodeGid[0].dnodeId);
2959

2960
    // add second
2961
    if (pNewVgroup->replica == 1) {
100!
2962
      TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, pNewVgroup, pArray));
100✔
2963
    }
2964

2965
    // learner stage
2966
    pNewVgroup->vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
99✔
2967
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
99✔
2968
    TAOS_CHECK_RETURN(
99!
2969
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
2970

2971
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &pNewVgroup->vnodeGid[1]));
99!
2972

2973
    // follower stage
2974
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
99✔
2975
    TAOS_CHECK_RETURN(mndAddAlterVnodeTypeAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
99!
2976
    TAOS_CHECK_RETURN(
99!
2977
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
2978

2979
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
99!
2980

2981
    // add third
2982
    if (pNewVgroup->replica == 2) {
99!
2983
      TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, pNewVgroup, pArray));
99✔
2984
    }
2985

2986
    pNewVgroup->vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
88✔
2987
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
88✔
2988
    pNewVgroup->vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_VOTER;
88✔
2989
    TAOS_CHECK_RETURN(
88!
2990
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
2991
    TAOS_CHECK_RETURN(
88!
2992
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
2993
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &pNewVgroup->vnodeGid[2]));
88!
2994

2995
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
88!
2996
  } else if (pNewDb->cfg.replications == 1) {
4!
2997
    mInfo("trans:%d, db:%s, vgId:%d, will remove 2 vnodes, vn:0 dnode:%d vn:1 dnode:%d vn:2 dnode:%d", pTrans->id,
4!
2998
          pVgroup->dbName, pVgroup->vgId, pVgroup->vnodeGid[0].dnodeId, pVgroup->vnodeGid[1].dnodeId,
2999
          pVgroup->vnodeGid[2].dnodeId);
3000

3001
    SVnodeGid del1 = {0};
4✔
3002
    SVnodeGid del2 = {0};
4✔
3003
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroup(pMnode, pTrans, pNewVgroup, pArray, &del1));
4!
3004
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &del1, true));
4!
3005
    TAOS_CHECK_RETURN(
4!
3006
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3007
    TAOS_CHECK_RETURN(
4!
3008
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
3009
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
4!
3010

3011
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroup(pMnode, pTrans, pNewVgroup, pArray, &del2));
4!
3012
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &del2, true));
4!
3013
    TAOS_CHECK_RETURN(
4!
3014
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3015
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
4!
3016
  } else if (pNewDb->cfg.replications == 2) {
×
3017
    mInfo("trans:%d, db:%s, vgId:%d, will add 1 vnode, vn:0 dnode:%d", pTrans->id, pVgroup->dbName, pVgroup->vgId,
×
3018
          pVgroup->vnodeGid[0].dnodeId);
3019

3020
    // add second
3021
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, pNewVgroup, pArray));
×
3022

3023
    // learner stage
3024
    pNewVgroup->vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3025
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
×
3026
    TAOS_CHECK_RETURN(
×
3027
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3028

3029
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &pNewVgroup->vnodeGid[1]));
×
3030

3031
    // follower stage
3032
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3033
    TAOS_CHECK_RETURN(mndAddAlterVnodeTypeAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
×
3034
    TAOS_CHECK_RETURN(
×
3035
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3036

3037
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
×
3038
  } else {
3039
    return -1;
×
3040
  }
3041

3042
  mndSortVnodeGid(pNewVgroup);
92✔
3043

3044
  {
3045
    SSdbRaw *pVgRaw = mndVgroupActionEncode(pNewVgroup);
92✔
3046
    if (pVgRaw == NULL) {
92!
3047
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3048
      if (terrno != 0) code = terrno;
×
3049
      TAOS_RETURN(code);
×
3050
    }
3051
    if ((code = mndTransAppendCommitlog(pTrans, pVgRaw)) != 0) {
92!
3052
      sdbFreeRaw(pVgRaw);
×
3053
      TAOS_RETURN(code);
×
3054
    }
3055
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
92✔
3056
    if (code != 0) {
92!
3057
      mError("vgId:%d, failed to set raw status since %s at line:%d", pNewVgroup->vgId, tstrerror(code), __LINE__);
×
3058
      TAOS_RETURN(code);
×
3059
    }
3060
  }
3061

3062
  TAOS_RETURN(code);
92✔
3063
}
3064

3065
int32_t mndBuildRaftAlterVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pOldDb, SDbObj *pNewDb, SVgObj *pVgroup,
×
3066
                                      SArray *pArray) {
3067
  int32_t code = 0;
×
3068
  SVgObj  newVgroup = {0};
×
3069
  memcpy(&newVgroup, pVgroup, sizeof(SVgObj));
×
3070

3071
  if (pVgroup->replica <= 0 || pVgroup->replica == pNewDb->cfg.replications) {
×
3072
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfigAction(pMnode, pTrans, pNewDb, pVgroup));
×
3073
    TAOS_CHECK_RETURN(mndCheckDnodeMemory(pMnode, pOldDb, pNewDb, &newVgroup, pVgroup, pArray));
×
3074
    return 0;
×
3075
  }
3076

3077
  mndTransSetSerial(pTrans);
×
3078

3079
  mInfo("trans:%d, vgId:%d, alter vgroup, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id, pVgroup->vgId,
×
3080
        pVgroup->syncConfChangeVer, pVgroup->version, pVgroup->replica);
3081

3082
  if (newVgroup.replica == 1 && pNewDb->cfg.replications == 3) {
×
3083
    mInfo("db:%s, vgId:%d, will add 2 vnodes, vn:0 dnode:%d", pVgroup->dbName, pVgroup->vgId,
×
3084
          pVgroup->vnodeGid[0].dnodeId);
3085

3086
    // add second
3087
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVgroup, pArray));
×
3088
    // add third
3089
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVgroup, pArray));
×
3090

3091
    // add learner stage
3092
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3093
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
×
3094
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_LEARNER;
×
3095
    TAOS_CHECK_RETURN(
×
3096
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3097
    mInfo("trans:%d, vgId:%d, add change config, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id,
×
3098
          pVgroup->vgId, newVgroup.syncConfChangeVer, pVgroup->version, pVgroup->replica);
3099
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &newVgroup.vnodeGid[1]));
×
3100
    mInfo("trans:%d, vgId:%d, create vnode, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id, pVgroup->vgId,
×
3101
          newVgroup.syncConfChangeVer, pVgroup->version, pVgroup->replica);
3102
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &newVgroup.vnodeGid[2]));
×
3103
    mInfo("trans:%d, vgId:%d, create vnode, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id, pVgroup->vgId,
×
3104
          newVgroup.syncConfChangeVer, pVgroup->version, pVgroup->replica);
3105

3106
    // check learner
3107
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3108
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3109
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3110
    TAOS_CHECK_RETURN(
×
3111
        mndAddCheckLearnerCatchupAction(pMnode, pTrans, pNewDb, &newVgroup, newVgroup.vnodeGid[1].dnodeId));
3112
    TAOS_CHECK_RETURN(
×
3113
        mndAddCheckLearnerCatchupAction(pMnode, pTrans, pNewDb, &newVgroup, newVgroup.vnodeGid[2].dnodeId));
3114

3115
    // change raft type
3116
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3117
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3118
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_LEARNER;
×
3119
    TAOS_CHECK_RETURN(
×
3120
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3121

3122
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3123

3124
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3125
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3126
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3127
    TAOS_CHECK_RETURN(
×
3128
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3129

3130
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3131

3132
    SSdbRaw *pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3133
    if (pVgRaw == NULL) {
×
3134
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3135
      if (terrno != 0) code = terrno;
×
3136
      TAOS_RETURN(code);
×
3137
    }
3138
    if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
×
3139
      sdbFreeRaw(pVgRaw);
×
3140
      TAOS_RETURN(code);
×
3141
    }
3142
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3143
    if (code != 0) {
×
3144
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3145
             __LINE__);
3146
      TAOS_RETURN(code);
×
3147
    }
3148
  } else if (newVgroup.replica == 3 && pNewDb->cfg.replications == 1) {
×
3149
    mInfo("db:%s, vgId:%d, will remove 2 vnodes, vn:0 dnode:%d vn:1 dnode:%d vn:2 dnode:%d", pVgroup->dbName,
×
3150
          pVgroup->vgId, pVgroup->vnodeGid[0].dnodeId, pVgroup->vnodeGid[1].dnodeId, pVgroup->vnodeGid[2].dnodeId);
3151

3152
    SVnodeGid del1 = {0};
×
3153
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroupWithoutSave(pMnode, pTrans, &newVgroup, pArray, &del1));
×
3154

3155
    TAOS_CHECK_RETURN(
×
3156
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3157

3158
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3159

3160
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &del1, true));
×
3161

3162
    SSdbRaw *pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3163
    if (pVgRaw == NULL) {
×
3164
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3165
      if (terrno != 0) code = terrno;
×
3166
      TAOS_RETURN(code);
×
3167
    }
3168
    if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
×
3169
      sdbFreeRaw(pVgRaw);
×
3170
      TAOS_RETURN(code);
×
3171
    }
3172
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3173
    if (code != 0) {
×
3174
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3175
             __LINE__);
3176
      TAOS_RETURN(code);
×
3177
    }
3178

3179
    SVnodeGid del2 = {0};
×
3180
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroupWithoutSave(pMnode, pTrans, &newVgroup, pArray, &del2));
×
3181

3182
    TAOS_CHECK_RETURN(
×
3183
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3184

3185
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3186

3187
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &del2, true));
×
3188

3189
    pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3190
    if (pVgRaw == NULL) {
×
3191
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3192
      if (terrno != 0) code = terrno;
×
3193
      TAOS_RETURN(code);
×
3194
    }
3195
    if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
×
3196
      sdbFreeRaw(pVgRaw);
×
3197
      TAOS_RETURN(code);
×
3198
    }
3199
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3200
    if (code != 0) {
×
3201
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3202
             __LINE__);
3203
      TAOS_RETURN(code);
×
3204
    }
3205
  } else {
3206
    return -1;
×
3207
  }
3208

3209
  mndSortVnodeGid(&newVgroup);
×
3210

3211
  {
3212
    SSdbRaw *pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3213
    if (pVgRaw == NULL) {
×
3214
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3215
      if (terrno != 0) code = terrno;
×
3216
      TAOS_RETURN(code);
×
3217
    }
3218
    if ((code = mndTransAppendCommitlog(pTrans, pVgRaw)) != 0) {
×
3219
      sdbFreeRaw(pVgRaw);
×
3220
      TAOS_RETURN(code);
×
3221
    }
3222
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3223
    if (code != 0) {
×
3224
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3225
             __LINE__);
3226
      TAOS_RETURN(code);
×
3227
    }
3228
  }
3229

3230
  TAOS_RETURN(code);
×
3231
}
3232

3233
/*
 * Appends to pTrans the actions that restore the vnode of pVgroup located on
 * pDnode, then writes the vgroup to the commit log with status
 * SDB_STATUS_READY.
 *
 * The steps depend on the replica count of the vgroup:
 *   1: create the vnode on pDnode (index 0 is used if no entry matches).
 *   2: alter-type on pAnotherDnode, create on pDnode with pDnode as learner,
 *      then alter-type on both with every member set to voter.
 *   3: create on pDnode with pDnode as learner, then alter-type on pDnode with
 *      every member set to voter.
 * Other replica counts add no vnode actions.
 *
 * Returns 0 on success or the error code of the first failing step.
 */
int32_t mndBuildRestoreAlterVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *db, SVgObj *pVgroup, SDnodeObj *pDnode,
                                         SDnodeObj *pAnotherDnode) {
  int32_t code = 0;
  SVgObj  vgWork = {0};
  memcpy(&vgWork, pVgroup, sizeof(SVgObj));

  mInfo("trans:%d, db:%s, vgId:%d, restore vnodes, vn:0 dnode:%d", pTrans->id, pVgroup->dbName, pVgroup->vgId,
        pVgroup->vnodeGid[0].dnodeId);

  switch (vgWork.replica) {
    case 1: {
      int target = 0;
      for (int i = 0; i < vgWork.replica; i++) {
        vgWork.vnodeGid[i].nodeRole = TAOS_SYNC_ROLE_VOTER;
        if (vgWork.vnodeGid[i].dnodeId == pDnode->id) {
          target = i;
        }
      }
      TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, db, &vgWork, &vgWork.vnodeGid[target]));
      break;
    }

    case 2: {
      // restored dnode is a learner, the other one a voter
      for (int i = 0; i < vgWork.replica; i++) {
        vgWork.vnodeGid[i].nodeRole =
            (vgWork.vnodeGid[i].dnodeId == pDnode->id) ? TAOS_SYNC_ROLE_LEARNER : TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &vgWork, pAnotherDnode));

      // same role layout is applied again before the create action
      for (int i = 0; i < vgWork.replica; i++) {
        vgWork.vnodeGid[i].nodeRole =
            (vgWork.vnodeGid[i].dnodeId == pDnode->id) ? TAOS_SYNC_ROLE_LEARNER : TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddCreateVnodeAction(pMnode, pTrans, db, &vgWork, pDnode));

      // everybody becomes a voter
      for (int i = 0; i < vgWork.replica; i++) {
        vgWork.vnodeGid[i].nodeRole = TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &vgWork, pDnode));
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &vgWork, pAnotherDnode));
      break;
    }

    case 3: {
      // restored dnode is a learner, the others voters
      for (int i = 0; i < vgWork.replica; i++) {
        vgWork.vnodeGid[i].nodeRole =
            (vgWork.vnodeGid[i].dnodeId == pDnode->id) ? TAOS_SYNC_ROLE_LEARNER : TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddCreateVnodeAction(pMnode, pTrans, db, &vgWork, pDnode));

      // everybody becomes a voter
      for (int i = 0; i < vgWork.replica; i++) {
        vgWork.vnodeGid[i].nodeRole = TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &vgWork, pDnode));
      break;
    }

    default:
      break;
  }

  // Record the resulting vgroup in the commit log.
  SSdbRaw *pCommitRaw = mndVgroupActionEncode(&vgWork);
  if (pCommitRaw == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  code = mndTransAppendCommitlog(pTrans, pCommitRaw);
  if (code != 0) {
    sdbFreeRaw(pCommitRaw);
    TAOS_RETURN(code);
  }

  code = sdbSetRawStatus(pCommitRaw, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", vgWork.vgId, tstrerror(code), __LINE__);
    TAOS_RETURN(code);
  }

  TAOS_RETURN(code);
}
3312

3313
// Placeholder: performs no work, ignores all arguments and always returns 0.
static int32_t mndAddAdjustVnodeHashRangeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup) {
  (void)pMnode;
  (void)pTrans;
  (void)pDb;
  (void)pVgroup;
  return 0;
}
3316

3317
typedef int32_t (*FpTransActionCb)(STrans *pTrans, SSdbRaw *pRaw);
3318

3319
/*
 * Encodes pVg and appends it to pTrans with status vgStatus.
 *
 * stage selects the target log: TRN_STAGE_COMMIT_ACTION appends to the commit
 * log, any other value appends to the redo log.
 *
 * Returns 0 on success, or the error from encoding, appending or setting the
 * status.
 */
static int32_t mndAddVgStatusAction(STrans *pTrans, SVgObj *pVg, ESdbStatus vgStatus, ETrnStage stage) {
  int32_t         code = 0;
  FpTransActionCb appendActionCb = (stage == TRN_STAGE_COMMIT_ACTION) ? mndTransAppendCommitlog : mndTransAppendRedolog;

  SSdbRaw *pRaw = mndVgroupActionEncode(pVg);
  if (pRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  if ((code = appendActionCb(pTrans, pRaw)) != 0) {
    // The append failed, so the raw is still ours to release.
    sdbFreeRaw(pRaw);
    TAOS_RETURN(code);
  }

  // After a successful append the raw is referenced by pTrans, so it must not
  // be freed here any more (the other builders in this file likewise free it
  // only when the append fails). Freeing it on a status failure would leave
  // the transaction with a dangling pointer.
  code = sdbSetRawStatus(pRaw, vgStatus);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", pVg->vgId, tstrerror(code), __LINE__);
  }

  TAOS_RETURN(code);
}
3340

3341
/*
 * Encodes pDb and appends it to pTrans with status dbStatus.
 *
 * stage selects the target log: TRN_STAGE_COMMIT_ACTION appends to the commit
 * log, any other value appends to the redo log.
 *
 * Returns 0 on success, or the error from encoding, appending or setting the
 * status.
 */
static int32_t mndAddDbStatusAction(STrans *pTrans, SDbObj *pDb, ESdbStatus dbStatus, ETrnStage stage) {
  int32_t         code = 0;
  FpTransActionCb appendActionCb = (stage == TRN_STAGE_COMMIT_ACTION) ? mndTransAppendCommitlog : mndTransAppendRedolog;

  SSdbRaw *pRaw = mndDbActionEncode(pDb);
  if (pRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  if ((code = appendActionCb(pTrans, pRaw)) != 0) {
    // The append failed, so the raw is still ours to release.
    sdbFreeRaw(pRaw);
    TAOS_RETURN(code);
  }

  // After a successful append the raw is referenced by pTrans, so it must not
  // be freed here any more (the other builders in this file likewise free it
  // only when the append fails). Freeing it on a status failure would leave
  // the transaction with a dangling pointer.
  code = sdbSetRawStatus(pRaw, dbStatus);
  if (code != 0) {
    mError("db:%s, failed to set raw status to ready, error:%s, line:%d", pDb->name, tstrerror(code), __LINE__);
  }

  TAOS_RETURN(code);
}
3362

3363
/*
 * Builds and prepares a "split-vgroup" transaction that replaces pVgroup with
 * two new vgroups, each covering one half of the original hash range.
 *
 * Outline of the transaction, as built below:
 *   1. Bring the source vgroup to exactly two vnodes (add one when it has one
 *      replica, remove one when it has three) and disable writes on both.
 *   2. Derive two single-replica vgroups from it: newVg1 keeps vnode 0 and the
 *      lower half of the hash range, newVg2 takes vnode 1 and the upper half.
 *      Both receive fresh vgroup ids.
 *   3. Redo log: both new vgroups READY, the source vgroup DROPPED, and the db
 *      with a bumped vgVersion and numOfVgroups.
 *   4. Bring each new vgroup to the db's replica count when that differs from
 *      one; otherwise commit it as READY.
 *   5. Commit log: source vgroup DROPPED, db with vgVersion bumped once more.
 *
 * The split is rejected with TSDB_CODE_OPS_NOT_SUPPORT when shared storage is
 * enabled, when the db uses an arbitrator, or when the vgroup's replica count
 * is neither 1 nor 3.
 *
 * Returns 0 when the transaction has been prepared, otherwise an error code.
 */
int32_t mndSplitVgroup(SMnode *pMnode, SRpcMsg *pReq, SDbObj *pDb, SVgObj *pVgroup) {
  int32_t code = -1;
  STrans *pTrans = NULL;
  SDbObj  dbObj = {0};
  SArray *pArray = mndBuildDnodesArray(pMnode, 0, NULL);

#if defined(USE_SHARED_STORAGE)
  if (tsSsEnabled) {
    code = TSDB_CODE_OPS_NOT_SUPPORT;
    mError("vgId:%d, db:%s, shared storage exists, split vgroup not allowed", pVgroup->vgId, pVgroup->dbName);
    goto _OVER;
  }
#endif

  if (pDb->cfg.withArbitrator) {
    code = TSDB_CODE_OPS_NOT_SUPPORT;
    mError("vgId:%d, db:%s, with arbitrator, split vgroup not allowed", pVgroup->vgId, pVgroup->dbName);
    goto _OVER;
  }

  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_DB, pReq, "split-vgroup");
  if (pTrans == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }
  mndTransSetSerial(pTrans);
  mInfo("trans:%d, used to split vgroup, vgId:%d", pTrans->id, pVgroup->vgId);

  mndTransSetDbName(pTrans, pDb->name, NULL);
  TAOS_CHECK_GOTO(mndTransCheckConflictWithCompact(pMnode, pTrans), NULL, _OVER);

  SVgObj newVg1 = {0};
  memcpy(&newVg1, pVgroup, sizeof(SVgObj));
  mInfo("vgId:%d, vgroup info before split, replica:%d hashBegin:%u hashEnd:%u", newVg1.vgId, newVg1.replica,
        newVg1.hashBegin, newVg1.hashEnd);
  for (int32_t i = 0; i < newVg1.replica; ++i) {
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg1.vgId, i, newVg1.vnodeGid[i].dnodeId);
  }

  // Step 1: get the source vgroup to exactly two vnodes.
  if (newVg1.replica == 1) {
    TAOS_CHECK_GOTO(mndAddVnodeToVgroup(pMnode, pTrans, &newVg1, pArray), NULL, _OVER);

    newVg1.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[0].dnodeId), NULL,
                    _OVER);
    TAOS_CHECK_GOTO(mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg1, &newVg1.vnodeGid[1]), NULL, _OVER);

    newVg1.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
    TAOS_CHECK_GOTO(mndAddAlterVnodeTypeAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[1].dnodeId), NULL, _OVER);
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[0].dnodeId), NULL,
                    _OVER);

    TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg1), NULL, _OVER);
  } else if (newVg1.replica == 3) {
    SVnodeGid del1 = {0};
    TAOS_CHECK_GOTO(mndRemoveVnodeFromVgroup(pMnode, pTrans, &newVg1, pArray, &del1), NULL, _OVER);
    TAOS_CHECK_GOTO(mndAddDropVnodeAction(pMnode, pTrans, pDb, &newVg1, &del1, true), NULL, _OVER);
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[0].dnodeId), NULL,
                    _OVER);
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[1].dnodeId), NULL,
                    _OVER);
  } else {
    // The preceding TAOS_CHECK_GOTO left `code` holding its success result, so
    // jumping to _OVER without setting an error would report success although
    // nothing was built or prepared.
    code = TSDB_CODE_OPS_NOT_SUPPORT;
    mError("vgId:%d, db:%s, replica:%d, split vgroup not allowed", pVgroup->vgId, pVgroup->dbName, newVg1.replica);
    goto _OVER;
  }

  for (int32_t i = 0; i < newVg1.replica; ++i) {
    TAOS_CHECK_GOTO(mndAddDisableVnodeWriteAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[i].dnodeId), NULL,
                    _OVER);
  }
  TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg1), NULL, _OVER);

  // Step 2: derive the two single-replica halves.
  SVgObj newVg2 = {0};
  memcpy(&newVg2, &newVg1, sizeof(SVgObj));
  newVg1.replica = 1;
  // halve each bound before adding, which avoids an intermediate sum larger than either bound
  newVg1.hashEnd = newVg1.hashBegin / 2 + newVg1.hashEnd / 2;
  memset(&newVg1.vnodeGid[1], 0, sizeof(SVnodeGid));

  newVg2.replica = 1;
  newVg2.hashBegin = newVg1.hashEnd + 1;
  memcpy(&newVg2.vnodeGid[0], &newVg2.vnodeGid[1], sizeof(SVnodeGid));
  memset(&newVg2.vnodeGid[1], 0, sizeof(SVnodeGid));

  mInfo("vgId:%d, vgroup info after split, replica:%d hashrange:[%u, %u] vnode:0 dnode:%d", newVg1.vgId, newVg1.replica,
        newVg1.hashBegin, newVg1.hashEnd, newVg1.vnodeGid[0].dnodeId);
  for (int32_t i = 0; i < newVg1.replica; ++i) {
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg1.vgId, i, newVg1.vnodeGid[i].dnodeId);
  }
  mInfo("vgId:%d, vgroup info after split, replica:%d hashrange:[%u, %u] vnode:0 dnode:%d", newVg2.vgId, newVg2.replica,
        newVg2.hashBegin, newVg2.hashEnd, newVg2.vnodeGid[0].dnodeId);
  // iterate over newVg2's own replica count (previously bounded by newVg1.replica)
  for (int32_t i = 0; i < newVg2.replica; ++i) {
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg2.vgId, i, newVg2.vnodeGid[i].dnodeId);
  }

  // alter vgId and hash range
  int32_t maxVgId = sdbGetMaxId(pMnode->pSdb, SDB_VGROUP);
  int32_t srcVgId = newVg1.vgId;
  newVg1.vgId = maxVgId;
  TAOS_CHECK_GOTO(mndAddNewVgPrepareAction(pMnode, pTrans, &newVg1), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddAlterVnodeHashRangeAction(pMnode, pTrans, srcVgId, &newVg1), NULL, _OVER);

  maxVgId++;
  srcVgId = newVg2.vgId;
  newVg2.vgId = maxVgId;
  TAOS_CHECK_GOTO(mndAddNewVgPrepareAction(pMnode, pTrans, &newVg2), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddAlterVnodeHashRangeAction(pMnode, pTrans, srcVgId, &newVg2), NULL, _OVER);

  TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg1), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg2), NULL, _OVER);

  // Step 3: redo log entries for the vgroups.
  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg1, SDB_STATUS_READY, TRN_STAGE_REDO_ACTION), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg2, SDB_STATUS_READY, TRN_STAGE_REDO_ACTION), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, pVgroup, SDB_STATUS_DROPPED, TRN_STAGE_REDO_ACTION), NULL, _OVER);

  // update db status
  memcpy(&dbObj, pDb, sizeof(SDbObj));
  if (dbObj.cfg.pRetensions != NULL) {
    // take a private copy so the cleanup at _OVER never destroys pDb's own array
    dbObj.cfg.pRetensions = taosArrayDup(pDb->cfg.pRetensions, NULL);
    if (dbObj.cfg.pRetensions == NULL) {
      code = terrno;
      goto _OVER;
    }
  }
  dbObj.vgVersion++;
  dbObj.updateTime = taosGetTimestampMs();
  dbObj.cfg.numOfVgroups++;
  TAOS_CHECK_GOTO(mndAddDbStatusAction(pTrans, &dbObj, SDB_STATUS_READY, TRN_STAGE_REDO_ACTION), NULL, _OVER);

  // Step 4: adjust vgroup replica
  if (pDb->cfg.replications != newVg1.replica) {
    SVgObj tmpGroup = {0};
    TAOS_CHECK_GOTO(mndBuildAlterVgroupAction(pMnode, pTrans, pDb, pDb, &newVg1, pArray, &tmpGroup), NULL, _OVER);
  } else {
    TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg1, SDB_STATUS_READY, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);
  }

  if (pDb->cfg.replications != newVg2.replica) {
    SVgObj tmpGroup = {0};
    TAOS_CHECK_GOTO(mndBuildAlterVgroupAction(pMnode, pTrans, pDb, pDb, &newVg2, pArray, &tmpGroup), NULL, _OVER);
  } else {
    TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg2, SDB_STATUS_READY, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);
  }

  // Step 5: commit log entries.
  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, pVgroup, SDB_STATUS_DROPPED, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);

  // commit db status
  dbObj.vgVersion++;
  dbObj.updateTime = taosGetTimestampMs();
  TAOS_CHECK_GOTO(mndAddDbStatusAction(pTrans, &dbObj, SDB_STATUS_READY, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);

  TAOS_CHECK_GOTO(mndTransPrepare(pMnode, pTrans), NULL, _OVER);
  code = 0;

_OVER:
  taosArrayDestroy(pArray);
  mndTransDrop(pTrans);
  taosArrayDestroy(dbObj.cfg.pRetensions);
  TAOS_RETURN(code);
}
3522

3523
extern int32_t mndProcessSplitVgroupMsgImp(SRpcMsg *pReq);
3524

3525
/*
 * Thin wrapper: forwards pReq to mndProcessSplitVgroupMsgImp() and returns
 * that function's result unchanged.
 */
static int32_t mndProcessSplitVgroupMsg(SRpcMsg *pReq) {
  int32_t code = mndProcessSplitVgroupMsgImp(pReq);
  return code;
}
44✔
3526

3527
#ifndef TD_ENTERPRISE
3528
// Fallback implementation: ignores the request and always returns 0.
int32_t mndProcessSplitVgroupMsgImp(SRpcMsg *pReq) {
  (void)pReq;
  return 0;
}
3529
#endif
3530

3531
// Append to pTrans everything needed to move one replica of pVgroup from dnode pSrc to dnode pDst.
//
// Works on a local copy of *pVgroup: the copy is passed to mndAddIncVgroupReplicaToTrans (with pDst->id) and then to
// mndAddDecVgroupReplicaFromTrans (with pSrc->id), and finally encoded and appended to the transaction as a commit
// log whose raw status is set to SDB_STATUS_READY.
//
// Returns 0 on success, otherwise the error code of the step that failed.
static int32_t mndSetBalanceVgroupInfoToTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                              SDnodeObj *pSrc, SDnodeObj *pDst) {
  SVgObj   vgCopy = {0};
  SSdbRaw *pCommitRaw = NULL;
  int32_t  code = 0;
  int32_t  idx = 0;

  memcpy(&vgCopy, pVgroup, sizeof(SVgObj));

  mInfo("vgId:%d, vgroup info before balance, replica:%d", vgCopy.vgId, vgCopy.replica);
  idx = 0;
  while (idx < vgCopy.replica) {
    mInfo("vgId:%d, vnode:%d dnode:%d", vgCopy.vgId, idx, vgCopy.vnodeGid[idx].dnodeId);
    ++idx;
  }

  // add the new replica first, then remove the old one
  TAOS_CHECK_RETURN(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &vgCopy, pDst->id));
  TAOS_CHECK_RETURN(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &vgCopy, pSrc->id));

  pCommitRaw = mndVgroupActionEncode(&vgCopy);
  if (pCommitRaw == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  code = mndTransAppendCommitlog(pTrans, pCommitRaw);
  if (code != 0) {
    // the raw is only freed here when appending failed
    sdbFreeRaw(pCommitRaw);
    TAOS_RETURN(code);
  }

  code = sdbSetRawStatus(pCommitRaw, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", vgCopy.vgId, tstrerror(code), __LINE__);
    TAOS_RETURN(code);
  }

  mInfo("vgId:%d, vgroup info after balance, replica:%d", vgCopy.vgId, vgCopy.replica);
  idx = 0;
  while (idx < vgCopy.replica) {
    mInfo("vgId:%d, vnode:%d dnode:%d", vgCopy.vgId, idx, vgCopy.vnodeGid[idx].dnodeId);
    ++idx;
  }

  TAOS_RETURN(code);
}
3568

3569
static int32_t mndBalanceVgroupBetweenDnode(SMnode *pMnode, STrans *pTrans, SDnodeObj *pSrc, SDnodeObj *pDst,
22✔
3570
                                            SHashObj *pBalancedVgroups) {
3571
  void   *pIter = NULL;
22✔
3572
  int32_t code = -1;
22✔
3573
  SSdb   *pSdb = pMnode->pSdb;
22✔
3574

3575
  while (1) {
14✔
3576
    SVgObj *pVgroup = NULL;
36✔
3577
    pIter = sdbFetch(pSdb, SDB_VGROUP, pIter, (void **)&pVgroup);
36✔
3578
    if (pIter == NULL) break;
36!
3579
    if (taosHashGet(pBalancedVgroups, &pVgroup->vgId, sizeof(int32_t)) != NULL) {
36✔
3580
      sdbRelease(pSdb, pVgroup);
12✔
3581
      continue;
14✔
3582
    }
3583

3584
    bool existInSrc = false;
24✔
3585
    bool existInDst = false;
24✔
3586
    for (int32_t i = 0; i < pVgroup->replica; ++i) {
68✔
3587
      SVnodeGid *pGid = &pVgroup->vnodeGid[i];
44✔
3588
      if (pGid->dnodeId == pSrc->id) existInSrc = true;
44✔
3589
      if (pGid->dnodeId == pDst->id) existInDst = true;
44!
3590
    }
3591

3592
    if (!existInSrc || existInDst) {
24!
3593
      sdbRelease(pSdb, pVgroup);
2✔
3594
      continue;
2✔
3595
    }
3596

3597
    SDbObj *pDb = mndAcquireDb(pMnode, pVgroup->dbName);
22✔
3598
    if (pDb == NULL) {
22!
3599
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3600
      if (terrno != 0) code = terrno;
×
3601
      mError("vgId:%d, balance vgroup can't find db obj dbName:%s", pVgroup->vgId, pVgroup->dbName);
×
3602
      goto _OUT;
×
3603
    }
3604

3605
    if (pDb->cfg.withArbitrator) {
22!
3606
      mInfo("vgId:%d, db:%s, with arbitrator, balance vgroup not allowed", pVgroup->vgId, pVgroup->dbName);
×
3607
      goto _OUT;
×
3608
    }
3609

3610
    code = mndSetBalanceVgroupInfoToTrans(pMnode, pTrans, pDb, pVgroup, pSrc, pDst);
22✔
3611
    if (code == 0) {
22!
3612
      code = taosHashPut(pBalancedVgroups, &pVgroup->vgId, sizeof(int32_t), &pVgroup->vgId, sizeof(int32_t));
22✔
3613
    }
3614

3615
  _OUT:
×
3616
    mndReleaseDb(pMnode, pDb);
22✔
3617
    sdbRelease(pSdb, pVgroup);
22✔
3618
    sdbCancelFetch(pSdb, pIter);
22✔
3619
    break;
22✔
3620
  }
3621

3622
  return code;
22✔
3623
}
3624

3625
// Build and submit one "balance-vgroup" transaction that repeatedly moves a vgroup replica between dnodes.
//
// pArray holds SDnodeObj entries. Each round it is re-sorted with mndCompareDnodeVnodes; the last entry is used as
// the source dnode and the first entry as the destination, so the array must not be empty. A round moves one
// vgroup while the source score (computed with -1) stays above the destination score (computed with +1) minus a
// small epsilon; the numOfVnodes counters of both entries are adjusted in place after each move.
//
// Returns 0 when no vgroup was moved, TSDB_CODE_ACTION_IN_PROGRESS once the transaction has been prepared, and an
// error code when creating, checking or preparing the transaction fails.
static int32_t mndBalanceVgroup(SMnode *pMnode, SRpcMsg *pReq, SArray *pArray) {
  int32_t   code = -1;
  int32_t   numOfVgroups = 0;
  STrans   *pTrans = NULL;
  SHashObj *pBalancedVgroups = NULL;

  // vgIds already moved by this transaction, so that no vgroup is picked twice
  pBalancedVgroups = taosHashInit(16, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT), false, HASH_NO_LOCK);
  if (pBalancedVgroups == NULL) {
    // report a real error code instead of the placeholder -1
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_GLOBAL, pReq, "balance-vgroup");
  if (pTrans == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }
  mndTransSetSerial(pTrans);
  mInfo("trans:%d, used to balance vgroup", pTrans->id);
  TAOS_CHECK_GOTO(mndTransCheckConflict(pMnode, pTrans), NULL, _OVER);
  TAOS_CHECK_GOTO(mndTransCheckConflictWithCompact(pMnode, pTrans), NULL, _OVER);

  while (1) {
    taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
    for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
      SDnodeObj *pDnode = taosArrayGet(pArray, i);
      // argument order follows the labels: "others" -> numOfOtherNodes, "support" -> numOfSupportVnodes
      mInfo("dnode:%d, equivalent vnodes:%d others:%d support:%d, score:%f", pDnode->id, pDnode->numOfVnodes,
            pDnode->numOfOtherNodes, pDnode->numOfSupportVnodes, mndGetDnodeScore(pDnode, 0, 1));
    }

    SDnodeObj *pSrc = taosArrayGet(pArray, taosArrayGetSize(pArray) - 1);
    SDnodeObj *pDst = taosArrayGet(pArray, 0);

    float srcScore = mndGetDnodeScore(pSrc, -1, 1);
    float dstScore = mndGetDnodeScore(pDst, 1, 1);
    // log the source dnode with its own score (dstScore used to be printed twice)
    mInfo("trans:%d, after balance, src dnode:%d score:%f, dst dnode:%d score:%f", pTrans->id, pSrc->id, srcScore,
          pDst->id, dstScore);

    if (srcScore > dstScore - 0.000001) {
      code = mndBalanceVgroupBetweenDnode(pMnode, pTrans, pSrc, pDst, pBalancedVgroups);
      if (code == 0) {
        pSrc->numOfVnodes--;
        pDst->numOfVnodes++;
        numOfVgroups++;
        continue;
      } else {
        mInfo("trans:%d, no vgroup need to balance from dnode:%d to dnode:%d", pTrans->id, pSrc->id, pDst->id);
        break;
      }
    } else {
      mInfo("trans:%d, no vgroup need to balance any more", pTrans->id);
      break;
    }
  }

  if (numOfVgroups <= 0) {
    mInfo("no need to balance vgroup");
    code = 0;
  } else {
    mInfo("start to balance vgroup, numOfVgroups:%d", numOfVgroups);
    // keep the prepare result: previously a failure here could leave code == 0 and be reported as success
    code = mndTransPrepare(pMnode, pTrans);
    if (code != 0) goto _OVER;
    code = TSDB_CODE_ACTION_IN_PROGRESS;
  }

_OVER:
  taosHashCleanup(pBalancedVgroups);
  mndTransDrop(pTrans);
  TAOS_RETURN(code);
}
3692

3693
// Handler for the balance-vgroup request.
//
// Steps, in order: deserialize the request, check the MND_OPER_BALANCE_VGROUP privilege for the connection's user,
// refuse when SDB_MOUNT is not empty, refuse when any dnode is not online, build the dnode array and, when it has
// at least two entries, run mndBalanceVgroup. An audit record is written once the dnode array has been built,
// whatever mndBalanceVgroup returned.
//
// Returns 0 when there is nothing to do, the result of mndBalanceVgroup otherwise (TSDB_CODE_ACTION_IN_PROGRESS is
// not logged as a failure), or the error code of the check that rejected the request.
static int32_t mndProcessBalanceVgroupMsg(SRpcMsg *pReq) {
  SMnode *pMnode = pReq->info.node;
  int32_t code = -1;
  SArray *pArray = NULL;
  void   *pIter = NULL;
  int64_t curMs = taosGetTimestampMs();

  SBalanceVgroupReq req = {0};
  if (tDeserializeSBalanceVgroupReq(pReq->pCont, pReq->contLen, &req) != 0) {
    code = TSDB_CODE_INVALID_MSG;
    goto _OVER;
  }

  mInfo("start to balance vgroup");
  if ((code = mndCheckOperPrivilege(pMnode, pReq->info.conn.user, MND_OPER_BALANCE_VGROUP)) != 0) {
    goto _OVER;
  }

  if (sdbGetSize(pMnode->pSdb, SDB_MOUNT) > 0) {
    code = TSDB_CODE_MND_MOUNT_NOT_EMPTY;
    goto _OVER;
  }

  // every dnode must be online before anything is moved
  while (1) {
    SDnodeObj *pDnode = NULL;
    pIter = sdbFetch(pMnode->pSdb, SDB_DNODE, pIter, (void **)&pDnode);
    if (pIter == NULL) break;
    if (!mndIsDnodeOnline(pDnode, curMs)) {
      sdbCancelFetch(pMnode->pSdb, pIter);
      code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
      // describe the code chosen above; terrno is not set on this path
      mError("failed to balance vgroup since %s, dnode:%d", tstrerror(code), pDnode->id);
      sdbRelease(pMnode->pSdb, pDnode);
      goto _OVER;
    }

    sdbRelease(pMnode->pSdb, pDnode);
  }

  pArray = mndBuildDnodesArray(pMnode, 0, NULL);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  if (taosArrayGetSize(pArray) < 2) {
    mInfo("no need to balance vgroup since dnode num less than 2");
    code = 0;
  } else {
    code = mndBalanceVgroup(pMnode, pReq, pArray);
  }

  auditRecord(pReq, pMnode->clusterId, "balanceVgroup", "", "", req.sql, req.sqlLen);

_OVER:
  if (code != 0 && code != TSDB_CODE_ACTION_IN_PROGRESS) {
    mError("failed to balance vgroup since %s", tstrerror(code));
  }

  taosArrayDestroy(pArray);
  tFreeSBalanceVgroupReq(&req);
  TAOS_RETURN(code);
}
3756

3757
// True when pVgroup is not flagged isTsma and its dbUid equals the given dbUid.
bool mndVgroupInDb(SVgObj *pVgroup, int64_t dbUid) {
  if (pVgroup->isTsma) {
    return false;
  }
  return pVgroup->dbUid == dbUid;
}
338,947!
3758

3759
// True when one of the first `replica` entries of pVgroup->vnodeGid refers to dnodeId.
bool mndVgroupInDnode(SVgObj *pVgroup, int32_t dnodeId) {
  bool found = false;
  for (int idx = 0; !found && idx < pVgroup->replica; ++idx) {
    found = (pVgroup->vnodeGid[idx].dnodeId == dnodeId);
  }
  return found;
}
3765

3766
static void *mndBuildCompactVnodeReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen, int64_t compactTs,
99✔
3767
                                     STimeWindow tw, bool metaOnly) {
3768
  SCompactVnodeReq compactReq = {0};
99✔
3769
  compactReq.dbUid = pDb->uid;
99✔
3770
  compactReq.compactStartTime = compactTs;
99✔
3771
  compactReq.tw = tw;
99✔
3772
  compactReq.metaOnly = metaOnly;
99✔
3773
  tstrncpy(compactReq.db, pDb->name, TSDB_DB_FNAME_LEN);
99✔
3774

3775
  mInfo("vgId:%d, build compact vnode config req", pVgroup->vgId);
99!
3776
  int32_t contLen = tSerializeSCompactVnodeReq(NULL, 0, &compactReq);
99✔
3777
  if (contLen < 0) {
99!
3778
    terrno = TSDB_CODE_OUT_OF_MEMORY;
×
3779
    return NULL;
×
3780
  }
3781
  contLen += sizeof(SMsgHead);
99✔
3782

3783
  void *pReq = taosMemoryMalloc(contLen);
99!
3784
  if (pReq == NULL) {
99!
3785
    terrno = TSDB_CODE_OUT_OF_MEMORY;
×
3786
    return NULL;
×
3787
  }
3788

3789
  SMsgHead *pHead = pReq;
99✔
3790
  pHead->contLen = htonl(contLen);
99✔
3791
  pHead->vgId = htonl(pVgroup->vgId);
99✔
3792

3793
  if (tSerializeSCompactVnodeReq((char *)pReq + sizeof(SMsgHead), contLen, &compactReq) < 0) {
99!
3794
    taosMemoryFree(pReq);
×
3795
    terrno = TSDB_CODE_OUT_OF_MEMORY;
×
3796
    return NULL;
×
3797
  }
3798
  *pContLen = contLen;
99✔
3799
  return pReq;
99✔
3800
}
3801

3802
static int32_t mndAddCompactVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int64_t compactTs,
99✔
3803
                                        STimeWindow tw, bool metaOnly) {
3804
  int32_t      code = 0;
99✔
3805
  STransAction action = {0};
99✔
3806
  action.epSet = mndGetVgroupEpset(pMnode, pVgroup);
99✔
3807

3808
  int32_t contLen = 0;
99✔
3809
  void   *pReq = mndBuildCompactVnodeReq(pMnode, pDb, pVgroup, &contLen, compactTs, tw, metaOnly);
99✔
3810
  if (pReq == NULL) {
99!
3811
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3812
    if (terrno != 0) code = terrno;
×
3813
    TAOS_RETURN(code);
×
3814
  }
3815

3816
  action.pCont = pReq;
99✔
3817
  action.contLen = contLen;
99✔
3818
  action.msgType = TDMT_VND_COMPACT;
99✔
3819

3820
  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
99!
3821
    taosMemoryFree(pReq);
×
3822
    TAOS_RETURN(code);
×
3823
  }
3824

3825
  TAOS_RETURN(code);
99✔
3826
}
3827

3828
int32_t mndBuildCompactVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int64_t compactTs,
99✔
3829
                                    STimeWindow tw, bool metaOnly) {
3830
  TAOS_CHECK_RETURN(mndAddCompactVnodeAction(pMnode, pTrans, pDb, pVgroup, compactTs, tw, metaOnly));
99!
3831
  return 0;
99✔
3832
}
3833

3834
// Allocate and fill an ssmigrate request message for one vgroup.
//
// The buffer starts with an SMsgHead (contLen and vgId stored through htonl) followed by the serialized
// SSsMigrateVgroupReq, whose ssMigrateId and timestamp come from pMigrateObj->id and pMigrateObj->startTime and
// whose nodeId is 0. pMnode and pDb are not used.
//
// On success returns the buffer (allocated with taosMemoryMalloc; the caller releases it) and stores the total
// length, header included, in *pContLen. On failure returns NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY and
// leaves *pContLen untouched.
static void *mndBuildSsMigrateVgroupReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen, SSsMigrateObj* pMigrateObj) {
  SSsMigrateVgroupReq req = {.ssMigrateId = pMigrateObj->id, .nodeId = 0, .timestamp = pMigrateObj->startTime };

  mInfo("vgId:%d, build ssmigrate vnode config req", pVgroup->vgId);
  int32_t contLen = tSerializeSSsMigrateVgroupReq(NULL, 0, &req);
  if (contLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  contLen += sizeof(SMsgHead);

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    // set terrno like every other failure path here, so the caller does not pick up a stale value
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  SMsgHead *pHead = pReq;
  pHead->contLen = htonl(contLen);
  pHead->vgId = htonl(pVgroup->vgId);

  // the body goes after the header, so the header size is subtracted from the available length
  if (tSerializeSSsMigrateVgroupReq((char *)pReq + sizeof(SMsgHead), contLen - sizeof(SMsgHead), &req) < 0) {
    taosMemoryFree(pReq);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
3862

3863
// Append a TDMT_VND_SSMIGRATE redo action for pVgroup to pTrans.
//
// The action targets the epset returned by mndGetVgroupEpset and carries the message built by
// mndBuildSsMigrateVgroupReq. The message buffer is freed here only when appending the action fails.
//
// Returns 0 on success; when the message cannot be built, returns terrno if it is non-zero and
// TSDB_CODE_MND_RETURN_VALUE_NULL otherwise; else returns the error from mndTransAppendRedoAction.
static int32_t mndAddSsMigrateVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, SSsMigrateObj* pMigrateObj) {
  STransAction action = {0};
  action.epSet = mndGetVgroupEpset(pMnode, pVgroup);

  int32_t msgLen = 0;
  void   *pMsg = mndBuildSsMigrateVgroupReq(pMnode, pDb, pVgroup, &msgLen, pMigrateObj);
  if (pMsg == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  action.msgType = TDMT_VND_SSMIGRATE;
  action.contLen = msgLen;
  action.pCont = pMsg;

  int32_t code = mndTransAppendRedoAction(pTrans, &action);
  if (code != 0) {
    taosMemoryFree(pMsg);
  }
  TAOS_RETURN(code);
}
3887

3888
// Public entry point for adding the ssmigrate action of one vgroup to pTrans.
// Forwards every argument to mndAddSsMigrateVgroupAction; returns 0 when that call succeeds.
int32_t mndBuildSsMigrateVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, SSsMigrateObj* pMigrateObj) {
  TAOS_CHECK_RETURN(
      mndAddSsMigrateVgroupAction(pMnode, pTrans, pDb, pVgroup, pMigrateObj));

  return 0;
}
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc